You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

667 lines
19KB

  1. /*
  2. * H261 decoder
  3. * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at>
  4. * Copyright (c) 2004 Maarten Daniels
  5. *
  6. * This file is part of Libav.
  7. *
  8. * Libav is free software; you can redistribute it and/or
  9. * modify it under the terms of the GNU Lesser General Public
  10. * License as published by the Free Software Foundation; either
  11. * version 2.1 of the License, or (at your option) any later version.
  12. *
  13. * Libav is distributed in the hope that it will be useful,
  14. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  16. * Lesser General Public License for more details.
  17. *
  18. * You should have received a copy of the GNU Lesser General Public
  19. * License along with Libav; if not, write to the Free Software
  20. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21. */
  22. /**
  23. * @file
  24. * H.261 decoder.
  25. */
  26. #include "avcodec.h"
  27. #include "mpegvideo.h"
  28. #include "h263.h"
  29. #include "h261.h"
  30. #include "h261data.h"
  31. #define H261_MBA_VLC_BITS 9
  32. #define H261_MTYPE_VLC_BITS 6
  33. #define H261_MV_VLC_BITS 7
  34. #define H261_CBP_VLC_BITS 9
  35. #define TCOEFF_VLC_BITS 9
  36. #define MBA_STUFFING 33
  37. #define MBA_STARTCODE 34
  38. static VLC h261_mba_vlc;
  39. static VLC h261_mtype_vlc;
  40. static VLC h261_mv_vlc;
  41. static VLC h261_cbp_vlc;
  42. static int h261_decode_block(H261Context *h, int16_t *block, int n, int coded);
  43. static av_cold void h261_decode_init_vlc(H261Context *h)
  44. {
  45. static int done = 0;
  46. if (!done) {
  47. done = 1;
  48. INIT_VLC_STATIC(&h261_mba_vlc, H261_MBA_VLC_BITS, 35,
  49. h261_mba_bits, 1, 1,
  50. h261_mba_code, 1, 1, 662);
  51. INIT_VLC_STATIC(&h261_mtype_vlc, H261_MTYPE_VLC_BITS, 10,
  52. h261_mtype_bits, 1, 1,
  53. h261_mtype_code, 1, 1, 80);
  54. INIT_VLC_STATIC(&h261_mv_vlc, H261_MV_VLC_BITS, 17,
  55. &h261_mv_tab[0][1], 2, 1,
  56. &h261_mv_tab[0][0], 2, 1, 144);
  57. INIT_VLC_STATIC(&h261_cbp_vlc, H261_CBP_VLC_BITS, 63,
  58. &h261_cbp_tab[0][1], 2, 1,
  59. &h261_cbp_tab[0][0], 2, 1, 512);
  60. ff_init_rl(&h261_rl_tcoeff, ff_h261_rl_table_store);
  61. INIT_VLC_RL(h261_rl_tcoeff, 552);
  62. }
  63. }
  64. static av_cold int h261_decode_init(AVCodecContext *avctx)
  65. {
  66. H261Context *h = avctx->priv_data;
  67. MpegEncContext *const s = &h->s;
  68. // set defaults
  69. ff_MPV_decode_defaults(s);
  70. s->avctx = avctx;
  71. s->width = s->avctx->coded_width;
  72. s->height = s->avctx->coded_height;
  73. s->codec_id = s->avctx->codec->id;
  74. s->out_format = FMT_H261;
  75. s->low_delay = 1;
  76. avctx->pix_fmt = AV_PIX_FMT_YUV420P;
  77. s->codec_id = avctx->codec->id;
  78. h261_decode_init_vlc(h);
  79. h->gob_start_code_skipped = 0;
  80. return 0;
  81. }
  82. /**
  83. * Decode the group of blocks header or slice header.
  84. * @return <0 if an error occurred
  85. */
  86. static int h261_decode_gob_header(H261Context *h)
  87. {
  88. unsigned int val;
  89. MpegEncContext *const s = &h->s;
  90. if (!h->gob_start_code_skipped) {
  91. /* Check for GOB Start Code */
  92. val = show_bits(&s->gb, 15);
  93. if (val)
  94. return -1;
  95. /* We have a GBSC */
  96. skip_bits(&s->gb, 16);
  97. }
  98. h->gob_start_code_skipped = 0;
  99. h->gob_number = get_bits(&s->gb, 4); /* GN */
  100. s->qscale = get_bits(&s->gb, 5); /* GQUANT */
  101. /* Check if gob_number is valid */
  102. if (s->mb_height == 18) { // CIF
  103. if ((h->gob_number <= 0) || (h->gob_number > 12))
  104. return -1;
  105. } else { // QCIF
  106. if ((h->gob_number != 1) && (h->gob_number != 3) &&
  107. (h->gob_number != 5))
  108. return -1;
  109. }
  110. /* GEI */
  111. while (get_bits1(&s->gb) != 0)
  112. skip_bits(&s->gb, 8);
  113. if (s->qscale == 0) {
  114. av_log(s->avctx, AV_LOG_ERROR, "qscale has forbidden 0 value\n");
  115. if (s->avctx->err_recognition & AV_EF_BITSTREAM)
  116. return -1;
  117. }
  118. /* For the first transmitted macroblock in a GOB, MBA is the absolute
  119. * address. For subsequent macroblocks, MBA is the difference between
  120. * the absolute addresses of the macroblock and the last transmitted
  121. * macroblock. */
  122. h->current_mba = 0;
  123. h->mba_diff = 0;
  124. return 0;
  125. }
  126. /**
  127. * Decode the group of blocks / video packet header.
  128. * @return <0 if no resync found
  129. */
  130. static int ff_h261_resync(H261Context *h)
  131. {
  132. MpegEncContext *const s = &h->s;
  133. int left, ret;
  134. if (h->gob_start_code_skipped) {
  135. ret = h261_decode_gob_header(h);
  136. if (ret >= 0)
  137. return 0;
  138. } else {
  139. if (show_bits(&s->gb, 15) == 0) {
  140. ret = h261_decode_gob_header(h);
  141. if (ret >= 0)
  142. return 0;
  143. }
  144. // OK, it is not where it is supposed to be ...
  145. s->gb = s->last_resync_gb;
  146. align_get_bits(&s->gb);
  147. left = get_bits_left(&s->gb);
  148. for (; left > 15 + 1 + 4 + 5; left -= 8) {
  149. if (show_bits(&s->gb, 15) == 0) {
  150. GetBitContext bak = s->gb;
  151. ret = h261_decode_gob_header(h);
  152. if (ret >= 0)
  153. return 0;
  154. s->gb = bak;
  155. }
  156. skip_bits(&s->gb, 8);
  157. }
  158. }
  159. return -1;
  160. }
  161. /**
  162. * Decode skipped macroblocks.
  163. * @return 0
  164. */
  165. static int h261_decode_mb_skipped(H261Context *h, int mba1, int mba2)
  166. {
  167. MpegEncContext *const s = &h->s;
  168. int i;
  169. s->mb_intra = 0;
  170. for (i = mba1; i < mba2; i++) {
  171. int j, xy;
  172. s->mb_x = ((h->gob_number - 1) % 2) * 11 + i % 11;
  173. s->mb_y = ((h->gob_number - 1) / 2) * 3 + i / 11;
  174. xy = s->mb_x + s->mb_y * s->mb_stride;
  175. ff_init_block_index(s);
  176. ff_update_block_index(s);
  177. for (j = 0; j < 6; j++)
  178. s->block_last_index[j] = -1;
  179. s->mv_dir = MV_DIR_FORWARD;
  180. s->mv_type = MV_TYPE_16X16;
  181. s->current_picture.mb_type[xy] = MB_TYPE_SKIP | MB_TYPE_16x16 | MB_TYPE_L0;
  182. s->mv[0][0][0] = 0;
  183. s->mv[0][0][1] = 0;
  184. s->mb_skipped = 1;
  185. h->mtype &= ~MB_TYPE_H261_FIL;
  186. ff_MPV_decode_mb(s, s->block);
  187. }
  188. return 0;
  189. }
  190. static int decode_mv_component(GetBitContext *gb, int v)
  191. {
  192. int mv_diff = get_vlc2(gb, h261_mv_vlc.table, H261_MV_VLC_BITS, 2);
  193. /* check if mv_diff is valid */
  194. if (mv_diff < 0)
  195. return v;
  196. mv_diff = mvmap[mv_diff];
  197. if (mv_diff && !get_bits1(gb))
  198. mv_diff = -mv_diff;
  199. v += mv_diff;
  200. if (v <= -16)
  201. v += 32;
  202. else if (v >= 16)
  203. v -= 32;
  204. return v;
  205. }
  206. static int h261_decode_mb(H261Context *h)
  207. {
  208. MpegEncContext *const s = &h->s;
  209. int i, cbp, xy;
  210. cbp = 63;
  211. // Read mba
  212. do {
  213. h->mba_diff = get_vlc2(&s->gb, h261_mba_vlc.table,
  214. H261_MBA_VLC_BITS, 2);
  215. /* Check for slice end */
  216. /* NOTE: GOB can be empty (no MB data) or exist only of MBA_stuffing */
  217. if (h->mba_diff == MBA_STARTCODE) { // start code
  218. h->gob_start_code_skipped = 1;
  219. return SLICE_END;
  220. }
  221. } while (h->mba_diff == MBA_STUFFING); // stuffing
  222. if (h->mba_diff < 0) {
  223. if (get_bits_left(&s->gb) <= 7)
  224. return SLICE_END;
  225. av_log(s->avctx, AV_LOG_ERROR, "illegal mba at %d %d\n", s->mb_x, s->mb_y);
  226. return SLICE_ERROR;
  227. }
  228. h->mba_diff += 1;
  229. h->current_mba += h->mba_diff;
  230. if (h->current_mba > MBA_STUFFING)
  231. return SLICE_ERROR;
  232. s->mb_x = ((h->gob_number - 1) % 2) * 11 + ((h->current_mba - 1) % 11);
  233. s->mb_y = ((h->gob_number - 1) / 2) * 3 + ((h->current_mba - 1) / 11);
  234. xy = s->mb_x + s->mb_y * s->mb_stride;
  235. ff_init_block_index(s);
  236. ff_update_block_index(s);
  237. // Read mtype
  238. h->mtype = get_vlc2(&s->gb, h261_mtype_vlc.table, H261_MTYPE_VLC_BITS, 2);
  239. h->mtype = h261_mtype_map[h->mtype];
  240. // Read mquant
  241. if (IS_QUANT(h->mtype))
  242. ff_set_qscale(s, get_bits(&s->gb, 5));
  243. s->mb_intra = IS_INTRA4x4(h->mtype);
  244. // Read mv
  245. if (IS_16X16(h->mtype)) {
  246. /* Motion vector data is included for all MC macroblocks. MVD is
  247. * obtained from the macroblock vector by subtracting the vector
  248. * of the preceding macroblock. For this calculation the vector
  249. * of the preceding macroblock is regarded as zero in the
  250. * following three situations:
  251. * 1) evaluating MVD for macroblocks 1, 12 and 23;
  252. * 2) evaluating MVD for macroblocks in which MBA does not represent a difference of 1;
  253. * 3) MTYPE of the previous macroblock was not MC. */
  254. if ((h->current_mba == 1) || (h->current_mba == 12) ||
  255. (h->current_mba == 23) || (h->mba_diff != 1)) {
  256. h->current_mv_x = 0;
  257. h->current_mv_y = 0;
  258. }
  259. h->current_mv_x = decode_mv_component(&s->gb, h->current_mv_x);
  260. h->current_mv_y = decode_mv_component(&s->gb, h->current_mv_y);
  261. } else {
  262. h->current_mv_x = 0;
  263. h->current_mv_y = 0;
  264. }
  265. // Read cbp
  266. if (HAS_CBP(h->mtype))
  267. cbp = get_vlc2(&s->gb, h261_cbp_vlc.table, H261_CBP_VLC_BITS, 2) + 1;
  268. if (s->mb_intra) {
  269. s->current_picture.mb_type[xy] = MB_TYPE_INTRA;
  270. goto intra;
  271. }
  272. //set motion vectors
  273. s->mv_dir = MV_DIR_FORWARD;
  274. s->mv_type = MV_TYPE_16X16;
  275. s->current_picture.mb_type[xy] = MB_TYPE_16x16 | MB_TYPE_L0;
  276. s->mv[0][0][0] = h->current_mv_x * 2; // gets divided by 2 in motion compensation
  277. s->mv[0][0][1] = h->current_mv_y * 2;
  278. intra:
  279. /* decode each block */
  280. if (s->mb_intra || HAS_CBP(h->mtype)) {
  281. s->dsp.clear_blocks(s->block[0]);
  282. for (i = 0; i < 6; i++) {
  283. if (h261_decode_block(h, s->block[i], i, cbp & 32) < 0)
  284. return SLICE_ERROR;
  285. cbp += cbp;
  286. }
  287. } else {
  288. for (i = 0; i < 6; i++)
  289. s->block_last_index[i] = -1;
  290. }
  291. ff_MPV_decode_mb(s, s->block);
  292. return SLICE_OK;
  293. }
  294. /**
  295. * Decode a macroblock.
  296. * @return <0 if an error occurred
  297. */
  298. static int h261_decode_block(H261Context *h, int16_t *block, int n, int coded)
  299. {
  300. MpegEncContext *const s = &h->s;
  301. int code, level, i, j, run;
  302. RLTable *rl = &h261_rl_tcoeff;
  303. const uint8_t *scan_table;
  304. /* For the variable length encoding there are two code tables, one being
  305. * used for the first transmitted LEVEL in INTER, INTER + MC and
  306. * INTER + MC + FIL blocks, the second for all other LEVELs except the
  307. * first one in INTRA blocks which is fixed length coded with 8 bits.
  308. * NOTE: The two code tables only differ in one VLC so we handle that
  309. * manually. */
  310. scan_table = s->intra_scantable.permutated;
  311. if (s->mb_intra) {
  312. /* DC coef */
  313. level = get_bits(&s->gb, 8);
  314. // 0 (00000000b) and -128 (10000000b) are FORBIDDEN
  315. if ((level & 0x7F) == 0) {
  316. av_log(s->avctx, AV_LOG_ERROR, "illegal dc %d at %d %d\n",
  317. level, s->mb_x, s->mb_y);
  318. return -1;
  319. }
  320. /* The code 1000 0000 is not used, the reconstruction level of 1024
  321. * being coded as 1111 1111. */
  322. if (level == 255)
  323. level = 128;
  324. block[0] = level;
  325. i = 1;
  326. } else if (coded) {
  327. // Run Level Code
  328. // EOB Not possible for first level when cbp is available (that's why the table is different)
  329. // 0 1 1s
  330. // * * 0*
  331. int check = show_bits(&s->gb, 2);
  332. i = 0;
  333. if (check & 0x2) {
  334. skip_bits(&s->gb, 2);
  335. block[0] = (check & 0x1) ? -1 : 1;
  336. i = 1;
  337. }
  338. } else {
  339. i = 0;
  340. }
  341. if (!coded) {
  342. s->block_last_index[n] = i - 1;
  343. return 0;
  344. }
  345. for (;;) {
  346. code = get_vlc2(&s->gb, rl->vlc.table, TCOEFF_VLC_BITS, 2);
  347. if (code < 0) {
  348. av_log(s->avctx, AV_LOG_ERROR, "illegal ac vlc code at %dx%d\n",
  349. s->mb_x, s->mb_y);
  350. return -1;
  351. }
  352. if (code == rl->n) {
  353. /* escape */
  354. /* The remaining combinations of (run, level) are encoded with a
  355. * 20-bit word consisting of 6 bits escape, 6 bits run and 8 bits
  356. * level. */
  357. run = get_bits(&s->gb, 6);
  358. level = get_sbits(&s->gb, 8);
  359. } else if (code == 0) {
  360. break;
  361. } else {
  362. run = rl->table_run[code];
  363. level = rl->table_level[code];
  364. if (get_bits1(&s->gb))
  365. level = -level;
  366. }
  367. i += run;
  368. if (i >= 64) {
  369. av_log(s->avctx, AV_LOG_ERROR, "run overflow at %dx%d\n",
  370. s->mb_x, s->mb_y);
  371. return -1;
  372. }
  373. j = scan_table[i];
  374. block[j] = level;
  375. i++;
  376. }
  377. s->block_last_index[n] = i - 1;
  378. return 0;
  379. }
  380. /**
  381. * Decode the H.261 picture header.
  382. * @return <0 if no startcode found
  383. */
  384. static int h261_decode_picture_header(H261Context *h)
  385. {
  386. MpegEncContext *const s = &h->s;
  387. int format, i;
  388. uint32_t startcode = 0;
  389. for (i = get_bits_left(&s->gb); i > 24; i -= 1) {
  390. startcode = ((startcode << 1) | get_bits(&s->gb, 1)) & 0x000FFFFF;
  391. if (startcode == 0x10)
  392. break;
  393. }
  394. if (startcode != 0x10) {
  395. av_log(s->avctx, AV_LOG_ERROR, "Bad picture start code\n");
  396. return -1;
  397. }
  398. /* temporal reference */
  399. i = get_bits(&s->gb, 5); /* picture timestamp */
  400. if (i < (s->picture_number & 31))
  401. i += 32;
  402. s->picture_number = (s->picture_number & ~31) + i;
  403. s->avctx->time_base = (AVRational) { 1001, 30000 };
  404. s->current_picture.f.pts = s->picture_number;
  405. /* PTYPE starts here */
  406. skip_bits1(&s->gb); /* split screen off */
  407. skip_bits1(&s->gb); /* camera off */
  408. skip_bits1(&s->gb); /* freeze picture release off */
  409. format = get_bits1(&s->gb);
  410. // only 2 formats possible
  411. if (format == 0) { // QCIF
  412. s->width = 176;
  413. s->height = 144;
  414. s->mb_width = 11;
  415. s->mb_height = 9;
  416. } else { // CIF
  417. s->width = 352;
  418. s->height = 288;
  419. s->mb_width = 22;
  420. s->mb_height = 18;
  421. }
  422. s->mb_num = s->mb_width * s->mb_height;
  423. skip_bits1(&s->gb); /* still image mode off */
  424. skip_bits1(&s->gb); /* Reserved */
  425. /* PEI */
  426. while (get_bits1(&s->gb) != 0)
  427. skip_bits(&s->gb, 8);
  428. /* H.261 has no I-frames, but if we pass AV_PICTURE_TYPE_I for the first
  429. * frame, the codec crashes if it does not contain all I-blocks
  430. * (e.g. when a packet is lost). */
  431. s->pict_type = AV_PICTURE_TYPE_P;
  432. h->gob_number = 0;
  433. return 0;
  434. }
  435. static int h261_decode_gob(H261Context *h)
  436. {
  437. MpegEncContext *const s = &h->s;
  438. ff_set_qscale(s, s->qscale);
  439. /* decode mb's */
  440. while (h->current_mba <= MBA_STUFFING) {
  441. int ret;
  442. /* DCT & quantize */
  443. ret = h261_decode_mb(h);
  444. if (ret < 0) {
  445. if (ret == SLICE_END) {
  446. h261_decode_mb_skipped(h, h->current_mba, 33);
  447. return 0;
  448. }
  449. av_log(s->avctx, AV_LOG_ERROR, "Error at MB: %d\n",
  450. s->mb_x + s->mb_y * s->mb_stride);
  451. return -1;
  452. }
  453. h261_decode_mb_skipped(h,
  454. h->current_mba - h->mba_diff,
  455. h->current_mba - 1);
  456. }
  457. return -1;
  458. }
  459. /**
  460. * returns the number of bytes consumed for building the current frame
  461. */
  462. static int get_consumed_bytes(MpegEncContext *s, int buf_size)
  463. {
  464. int pos = get_bits_count(&s->gb) >> 3;
  465. if (pos == 0)
  466. pos = 1; // avoid infinite loops (i doubt that is needed but ...)
  467. if (pos + 10 > buf_size)
  468. pos = buf_size; // oops ;)
  469. return pos;
  470. }
  471. static int h261_decode_frame(AVCodecContext *avctx, void *data,
  472. int *got_frame, AVPacket *avpkt)
  473. {
  474. const uint8_t *buf = avpkt->data;
  475. int buf_size = avpkt->size;
  476. H261Context *h = avctx->priv_data;
  477. MpegEncContext *s = &h->s;
  478. int ret;
  479. AVFrame *pict = data;
  480. av_dlog(avctx, "*****frame %d size=%d\n", avctx->frame_number, buf_size);
  481. av_dlog(avctx, "bytes=%x %x %x %x\n", buf[0], buf[1], buf[2], buf[3]);
  482. s->flags = avctx->flags;
  483. s->flags2 = avctx->flags2;
  484. h->gob_start_code_skipped = 0;
  485. retry:
  486. init_get_bits(&s->gb, buf, buf_size * 8);
  487. if (!s->context_initialized)
  488. // we need the IDCT permutaton for reading a custom matrix
  489. if (ff_MPV_common_init(s) < 0)
  490. return -1;
  491. /* We need to set current_picture_ptr before reading the header,
  492. * otherwise we cannot store anything in there. */
  493. if (s->current_picture_ptr == NULL || s->current_picture_ptr->f.data[0]) {
  494. int i = ff_find_unused_picture(s, 0);
  495. if (i < 0)
  496. return i;
  497. s->current_picture_ptr = &s->picture[i];
  498. }
  499. ret = h261_decode_picture_header(h);
  500. /* skip if the header was thrashed */
  501. if (ret < 0) {
  502. av_log(s->avctx, AV_LOG_ERROR, "header damaged\n");
  503. return -1;
  504. }
  505. if (s->width != avctx->coded_width || s->height != avctx->coded_height) {
  506. ParseContext pc = s->parse_context; // FIXME move this demuxing hack to libavformat
  507. s->parse_context.buffer = 0;
  508. ff_MPV_common_end(s);
  509. s->parse_context = pc;
  510. }
  511. if (!s->context_initialized) {
  512. avcodec_set_dimensions(avctx, s->width, s->height);
  513. goto retry;
  514. }
  515. // for skipping the frame
  516. s->current_picture.f.pict_type = s->pict_type;
  517. s->current_picture.f.key_frame = s->pict_type == AV_PICTURE_TYPE_I;
  518. if ((avctx->skip_frame >= AVDISCARD_NONREF && s->pict_type == AV_PICTURE_TYPE_B) ||
  519. (avctx->skip_frame >= AVDISCARD_NONKEY && s->pict_type != AV_PICTURE_TYPE_I) ||
  520. avctx->skip_frame >= AVDISCARD_ALL)
  521. return get_consumed_bytes(s, buf_size);
  522. if (ff_MPV_frame_start(s, avctx) < 0)
  523. return -1;
  524. ff_mpeg_er_frame_start(s);
  525. /* decode each macroblock */
  526. s->mb_x = 0;
  527. s->mb_y = 0;
  528. while (h->gob_number < (s->mb_height == 18 ? 12 : 5)) {
  529. if (ff_h261_resync(h) < 0)
  530. break;
  531. h261_decode_gob(h);
  532. }
  533. ff_MPV_frame_end(s);
  534. assert(s->current_picture.f.pict_type == s->current_picture_ptr->f.pict_type);
  535. assert(s->current_picture.f.pict_type == s->pict_type);
  536. if ((ret = av_frame_ref(pict, &s->current_picture_ptr->f)) < 0)
  537. return ret;
  538. ff_print_debug_info(s, s->current_picture_ptr);
  539. *got_frame = 1;
  540. return get_consumed_bytes(s, buf_size);
  541. }
  542. static av_cold int h261_decode_end(AVCodecContext *avctx)
  543. {
  544. H261Context *h = avctx->priv_data;
  545. MpegEncContext *s = &h->s;
  546. ff_MPV_common_end(s);
  547. return 0;
  548. }
  549. AVCodec ff_h261_decoder = {
  550. .name = "h261",
  551. .type = AVMEDIA_TYPE_VIDEO,
  552. .id = AV_CODEC_ID_H261,
  553. .priv_data_size = sizeof(H261Context),
  554. .init = h261_decode_init,
  555. .close = h261_decode_end,
  556. .decode = h261_decode_frame,
  557. .capabilities = CODEC_CAP_DR1,
  558. .long_name = NULL_IF_CONFIG_SMALL("H.261"),
  559. };