You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

2623 lines
99KB

  1. /*
  2. * MPEG4 decoder.
  3. * Copyright (c) 2000,2001 Fabrice Bellard
  4. * Copyright (c) 2002-2010 Michael Niedermayer <michaelni@gmx.at>
  5. *
  6. * This file is part of FFmpeg.
  7. *
  8. * FFmpeg is free software; you can redistribute it and/or
  9. * modify it under the terms of the GNU Lesser General Public
  10. * License as published by the Free Software Foundation; either
  11. * version 2.1 of the License, or (at your option) any later version.
  12. *
  13. * FFmpeg is distributed in the hope that it will be useful,
  14. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  16. * Lesser General Public License for more details.
  17. *
  18. * You should have received a copy of the GNU Lesser General Public
  19. * License along with FFmpeg; if not, write to the Free Software
  20. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21. */
  22. #define UNCHECKED_BITSTREAM_READER 1
  23. #include "libavutil/opt.h"
  24. #include "error_resilience.h"
  25. #include "internal.h"
  26. #include "mpegvideo.h"
  27. #include "mpeg4video.h"
  28. #include "h263.h"
  29. #include "thread.h"
  30. /* The defines below set the number of bits that are read at once when
  31. * reading VLC values. Changing these may improve speed and data cache use;
  32. * be aware, though, that decreasing them may require increasing the number
  33. * of stages passed to get_vlc*. */
  /* Lookup width passed to get_vlc2() when reading sprite_trajectory codes. */
  34. #define SPRITE_TRAJ_VLC_BITS 6
  /* Lookup width passed to get_vlc2() when reading dc_lum / dc_chrom codes. */
  35. #define DC_VLC_BITS 9
  /* NOTE(review): presumably the lookup width for mb_type_b_vlc; it is not
   * used in this part of the file - confirm against the B-frame decoder. */
  36. #define MB_TYPE_B_VLC_BITS 4
  /* VLC tables for the DC size code: mpeg4_decode_dc() reads dc_lum for
   * blocks 0-3 and dc_chrom for the other blocks.
   * NOTE(review): the initialization of these tables is not visible here. */
  37. static VLC dc_lum, dc_chrom;
  /* VLC table giving the bit length of each sprite trajectory component,
   * read by mpeg4_decode_sprite_trajectory(). */
  38. static VLC sprite_trajectory;
  /* NOTE(review): presumably the VLC table for B-frame macroblock types;
   * no reader is visible in this part of the file. */
  39. static VLC mb_type_b_vlc;
  /* Four macroblock-type flag combinations.
   * NOTE(review): presumably indexed by the code decoded with mb_type_b_vlc -
   * confirm against the B-frame macroblock decoder. */
  40. static const int mb_type_b_map[4] = {
  41. MB_TYPE_DIRECT2 | MB_TYPE_L0L1,
  42. MB_TYPE_L0L1 | MB_TYPE_16x16,
  43. MB_TYPE_L1 | MB_TYPE_16x16,
  44. MB_TYPE_L0 | MB_TYPE_16x16,
  45. };
  46. /**
  47. * Predict the ac.
  48. * @param n block index (0-3 are luma, 4-5 are chroma)
  49. * @param dir the ac prediction direction
  50. */
  51. void ff_mpeg4_pred_ac(MpegEncContext *s, int16_t *block, int n, int dir)
  52. {
  53. int i;
  54. int16_t *ac_val, *ac_val1;
  55. int8_t *const qscale_table = s->current_picture.qscale_table;
  56. /* find prediction */
  57. ac_val = s->ac_val[0][0] + s->block_index[n] * 16;
  58. ac_val1 = ac_val;
  59. if (s->ac_pred) {
  60. if (dir == 0) {
  61. const int xy = s->mb_x - 1 + s->mb_y * s->mb_stride;
  62. /* left prediction */
  63. ac_val -= 16;
  64. if (s->mb_x == 0 || s->qscale == qscale_table[xy] ||
  65. n == 1 || n == 3) {
  66. /* same qscale */
  67. for (i = 1; i < 8; i++)
  68. block[s->dsp.idct_permutation[i << 3]] += ac_val[i];
  69. } else {
  70. /* different qscale, we must rescale */
  71. for (i = 1; i < 8; i++)
  72. block[s->dsp.idct_permutation[i << 3]] += ROUNDED_DIV(ac_val[i] * qscale_table[xy], s->qscale);
  73. }
  74. } else {
  75. const int xy = s->mb_x + s->mb_y * s->mb_stride - s->mb_stride;
  76. /* top prediction */
  77. ac_val -= 16 * s->block_wrap[n];
  78. if (s->mb_y == 0 || s->qscale == qscale_table[xy] ||
  79. n == 2 || n == 3) {
  80. /* same qscale */
  81. for (i = 1; i < 8; i++)
  82. block[s->dsp.idct_permutation[i]] += ac_val[i + 8];
  83. } else {
  84. /* different qscale, we must rescale */
  85. for (i = 1; i < 8; i++)
  86. block[s->dsp.idct_permutation[i]] += ROUNDED_DIV(ac_val[i + 8] * qscale_table[xy], s->qscale);
  87. }
  88. }
  89. }
  90. /* left copy */
  91. for (i = 1; i < 8; i++)
  92. ac_val1[i] = block[s->dsp.idct_permutation[i << 3]];
  93. /* top copy */
  94. for (i = 1; i < 8; i++)
  95. ac_val1[8 + i] = block[s->dsp.idct_permutation[i]];
  96. }
  97. /**
  98. * check if the next stuff is a resync marker or the end.
  99. * @return 0 if not
  100. */
  101. static inline int mpeg4_is_resync(MpegEncContext *s)
  102. {
  103. int bits_count = get_bits_count(&s->gb);
  104. int v = show_bits(&s->gb, 16);
  105. if (s->workaround_bugs & FF_BUG_NO_PADDING && !s->resync_marker)
  106. return 0;
  107. while (v <= 0xFF) {
  108. if (s->pict_type == AV_PICTURE_TYPE_B ||
  109. (v >> (8 - s->pict_type) != 1) || s->partitioned_frame)
  110. break;
  111. skip_bits(&s->gb, 8 + s->pict_type);
  112. bits_count += 8 + s->pict_type;
  113. v = show_bits(&s->gb, 16);
  114. }
  115. if (bits_count + 8 >= s->gb.size_in_bits) {
  116. v >>= 8;
  117. v |= 0x7F >> (7 - (bits_count & 7));
  118. if (v == 0x7F)
  119. return s->mb_num;
  120. } else {
  121. if (v == ff_mpeg4_resync_prefix[bits_count & 7]) {
  122. int len, mb_num;
  123. int mb_num_bits = av_log2(s->mb_num - 1) + 1;
  124. GetBitContext gb = s->gb;
  125. skip_bits(&s->gb, 1);
  126. align_get_bits(&s->gb);
  127. for (len = 0; len < 32; len++)
  128. if (get_bits1(&s->gb))
  129. break;
  130. mb_num = get_bits(&s->gb, mb_num_bits);
  131. if (!mb_num || mb_num > s->mb_num || get_bits_count(&s->gb)+6 > s->gb.size_in_bits)
  132. mb_num= -1;
  133. s->gb = gb;
  134. if (len >= ff_mpeg4_get_video_packet_prefix_length(s))
  135. return mb_num;
  136. }
  137. }
  138. return 0;
  139. }
  140. static int mpeg4_decode_sprite_trajectory(MpegEncContext *s, GetBitContext *gb)
  141. {
  142. int a = 2 << s->sprite_warping_accuracy;
  143. int rho = 3 - s->sprite_warping_accuracy;
  144. int r = 16 / a;
  145. int alpha = 0;
  146. int beta = 0;
  147. int w = s->width;
  148. int h = s->height;
  149. int min_ab, i, w2, h2, w3, h3;
  150. int sprite_ref[4][2];
  151. int virtual_ref[2][2];
  152. // only true for rectangle shapes
  153. const int vop_ref[4][2] = { { 0, 0 }, { s->width, 0 },
  154. { 0, s->height }, { s->width, s->height } };
  155. int d[4][2] = { { 0, 0 }, { 0, 0 }, { 0, 0 }, { 0, 0 } };
  156. if (w <= 0 || h <= 0)
  157. return AVERROR_INVALIDDATA;
  158. for (i = 0; i < s->num_sprite_warping_points; i++) {
  159. int length;
  160. int x = 0, y = 0;
  161. length = get_vlc2(gb, sprite_trajectory.table, SPRITE_TRAJ_VLC_BITS, 3);
  162. if (length)
  163. x = get_xbits(gb, length);
  164. if (!(s->divx_version == 500 && s->divx_build == 413))
  165. skip_bits1(gb); /* marker bit */
  166. length = get_vlc2(gb, sprite_trajectory.table, SPRITE_TRAJ_VLC_BITS, 3);
  167. if (length)
  168. y = get_xbits(gb, length);
  169. skip_bits1(gb); /* marker bit */
  170. s->sprite_traj[i][0] = d[i][0] = x;
  171. s->sprite_traj[i][1] = d[i][1] = y;
  172. }
  173. for (; i < 4; i++)
  174. s->sprite_traj[i][0] = s->sprite_traj[i][1] = 0;
  175. while ((1 << alpha) < w)
  176. alpha++;
  177. while ((1 << beta) < h)
  178. beta++; /* typo in the mpeg4 std for the definition of w' and h' */
  179. w2 = 1 << alpha;
  180. h2 = 1 << beta;
  181. // Note, the 4th point isn't used for GMC
  182. if (s->divx_version == 500 && s->divx_build == 413) {
  183. sprite_ref[0][0] = a * vop_ref[0][0] + d[0][0];
  184. sprite_ref[0][1] = a * vop_ref[0][1] + d[0][1];
  185. sprite_ref[1][0] = a * vop_ref[1][0] + d[0][0] + d[1][0];
  186. sprite_ref[1][1] = a * vop_ref[1][1] + d[0][1] + d[1][1];
  187. sprite_ref[2][0] = a * vop_ref[2][0] + d[0][0] + d[2][0];
  188. sprite_ref[2][1] = a * vop_ref[2][1] + d[0][1] + d[2][1];
  189. } else {
  190. sprite_ref[0][0] = (a >> 1) * (2 * vop_ref[0][0] + d[0][0]);
  191. sprite_ref[0][1] = (a >> 1) * (2 * vop_ref[0][1] + d[0][1]);
  192. sprite_ref[1][0] = (a >> 1) * (2 * vop_ref[1][0] + d[0][0] + d[1][0]);
  193. sprite_ref[1][1] = (a >> 1) * (2 * vop_ref[1][1] + d[0][1] + d[1][1]);
  194. sprite_ref[2][0] = (a >> 1) * (2 * vop_ref[2][0] + d[0][0] + d[2][0]);
  195. sprite_ref[2][1] = (a >> 1) * (2 * vop_ref[2][1] + d[0][1] + d[2][1]);
  196. }
  197. /* sprite_ref[3][0] = (a >> 1) * (2 * vop_ref[3][0] + d[0][0] + d[1][0] + d[2][0] + d[3][0]);
  198. * sprite_ref[3][1] = (a >> 1) * (2 * vop_ref[3][1] + d[0][1] + d[1][1] + d[2][1] + d[3][1]); */
  199. /* this is mostly identical to the mpeg4 std (and is totally unreadable
  200. * because of that...). Perhaps it should be reordered to be more readable.
  201. * The idea behind this virtual_ref mess is to be able to use shifts later
  202. * per pixel instead of divides so the distance between points is converted
  203. * from w&h based to w2&h2 based which are of the 2^x form. */
  204. virtual_ref[0][0] = 16 * (vop_ref[0][0] + w2) +
  205. ROUNDED_DIV(((w - w2) *
  206. (r * sprite_ref[0][0] - 16 * vop_ref[0][0]) +
  207. w2 * (r * sprite_ref[1][0] - 16 * vop_ref[1][0])), w);
  208. virtual_ref[0][1] = 16 * vop_ref[0][1] +
  209. ROUNDED_DIV(((w - w2) *
  210. (r * sprite_ref[0][1] - 16 * vop_ref[0][1]) +
  211. w2 * (r * sprite_ref[1][1] - 16 * vop_ref[1][1])), w);
  212. virtual_ref[1][0] = 16 * vop_ref[0][0] +
  213. ROUNDED_DIV(((h - h2) * (r * sprite_ref[0][0] - 16 * vop_ref[0][0]) +
  214. h2 * (r * sprite_ref[2][0] - 16 * vop_ref[2][0])), h);
  215. virtual_ref[1][1] = 16 * (vop_ref[0][1] + h2) +
  216. ROUNDED_DIV(((h - h2) * (r * sprite_ref[0][1] - 16 * vop_ref[0][1]) +
  217. h2 * (r * sprite_ref[2][1] - 16 * vop_ref[2][1])), h);
  218. switch (s->num_sprite_warping_points) {
  219. case 0:
  220. s->sprite_offset[0][0] =
  221. s->sprite_offset[0][1] =
  222. s->sprite_offset[1][0] =
  223. s->sprite_offset[1][1] = 0;
  224. s->sprite_delta[0][0] = a;
  225. s->sprite_delta[0][1] =
  226. s->sprite_delta[1][0] = 0;
  227. s->sprite_delta[1][1] = a;
  228. s->sprite_shift[0] =
  229. s->sprite_shift[1] = 0;
  230. break;
  231. case 1: // GMC only
  232. s->sprite_offset[0][0] = sprite_ref[0][0] - a * vop_ref[0][0];
  233. s->sprite_offset[0][1] = sprite_ref[0][1] - a * vop_ref[0][1];
  234. s->sprite_offset[1][0] = ((sprite_ref[0][0] >> 1) | (sprite_ref[0][0] & 1)) -
  235. a * (vop_ref[0][0] / 2);
  236. s->sprite_offset[1][1] = ((sprite_ref[0][1] >> 1) | (sprite_ref[0][1] & 1)) -
  237. a * (vop_ref[0][1] / 2);
  238. s->sprite_delta[0][0] = a;
  239. s->sprite_delta[0][1] =
  240. s->sprite_delta[1][0] = 0;
  241. s->sprite_delta[1][1] = a;
  242. s->sprite_shift[0] =
  243. s->sprite_shift[1] = 0;
  244. break;
  245. case 2:
  246. s->sprite_offset[0][0] = (sprite_ref[0][0] << (alpha + rho)) +
  247. (-r * sprite_ref[0][0] + virtual_ref[0][0]) *
  248. (-vop_ref[0][0]) +
  249. (r * sprite_ref[0][1] - virtual_ref[0][1]) *
  250. (-vop_ref[0][1]) + (1 << (alpha + rho - 1));
  251. s->sprite_offset[0][1] = (sprite_ref[0][1] << (alpha + rho)) +
  252. (-r * sprite_ref[0][1] + virtual_ref[0][1]) *
  253. (-vop_ref[0][0]) +
  254. (-r * sprite_ref[0][0] + virtual_ref[0][0]) *
  255. (-vop_ref[0][1]) + (1 << (alpha + rho - 1));
  256. s->sprite_offset[1][0] = ((-r * sprite_ref[0][0] + virtual_ref[0][0]) *
  257. (-2 * vop_ref[0][0] + 1) +
  258. (r * sprite_ref[0][1] - virtual_ref[0][1]) *
  259. (-2 * vop_ref[0][1] + 1) + 2 * w2 * r *
  260. sprite_ref[0][0] - 16 * w2 + (1 << (alpha + rho + 1)));
  261. s->sprite_offset[1][1] = ((-r * sprite_ref[0][1] + virtual_ref[0][1]) *
  262. (-2 * vop_ref[0][0] + 1) +
  263. (-r * sprite_ref[0][0] + virtual_ref[0][0]) *
  264. (-2 * vop_ref[0][1] + 1) + 2 * w2 * r *
  265. sprite_ref[0][1] - 16 * w2 + (1 << (alpha + rho + 1)));
  266. s->sprite_delta[0][0] = (-r * sprite_ref[0][0] + virtual_ref[0][0]);
  267. s->sprite_delta[0][1] = (+r * sprite_ref[0][1] - virtual_ref[0][1]);
  268. s->sprite_delta[1][0] = (-r * sprite_ref[0][1] + virtual_ref[0][1]);
  269. s->sprite_delta[1][1] = (-r * sprite_ref[0][0] + virtual_ref[0][0]);
  270. s->sprite_shift[0] = alpha + rho;
  271. s->sprite_shift[1] = alpha + rho + 2;
  272. break;
  273. case 3:
  274. min_ab = FFMIN(alpha, beta);
  275. w3 = w2 >> min_ab;
  276. h3 = h2 >> min_ab;
  277. s->sprite_offset[0][0] = (sprite_ref[0][0] << (alpha + beta + rho - min_ab)) +
  278. (-r * sprite_ref[0][0] + virtual_ref[0][0]) *
  279. h3 * (-vop_ref[0][0]) +
  280. (-r * sprite_ref[0][0] + virtual_ref[1][0]) *
  281. w3 * (-vop_ref[0][1]) +
  282. (1 << (alpha + beta + rho - min_ab - 1));
  283. s->sprite_offset[0][1] = (sprite_ref[0][1] << (alpha + beta + rho - min_ab)) +
  284. (-r * sprite_ref[0][1] + virtual_ref[0][1]) *
  285. h3 * (-vop_ref[0][0]) +
  286. (-r * sprite_ref[0][1] + virtual_ref[1][1]) *
  287. w3 * (-vop_ref[0][1]) +
  288. (1 << (alpha + beta + rho - min_ab - 1));
  289. s->sprite_offset[1][0] = (-r * sprite_ref[0][0] + virtual_ref[0][0]) *
  290. h3 * (-2 * vop_ref[0][0] + 1) +
  291. (-r * sprite_ref[0][0] + virtual_ref[1][0]) *
  292. w3 * (-2 * vop_ref[0][1] + 1) + 2 * w2 * h3 *
  293. r * sprite_ref[0][0] - 16 * w2 * h3 +
  294. (1 << (alpha + beta + rho - min_ab + 1));
  295. s->sprite_offset[1][1] = (-r * sprite_ref[0][1] + virtual_ref[0][1]) *
  296. h3 * (-2 * vop_ref[0][0] + 1) +
  297. (-r * sprite_ref[0][1] + virtual_ref[1][1]) *
  298. w3 * (-2 * vop_ref[0][1] + 1) + 2 * w2 * h3 *
  299. r * sprite_ref[0][1] - 16 * w2 * h3 +
  300. (1 << (alpha + beta + rho - min_ab + 1));
  301. s->sprite_delta[0][0] = (-r * sprite_ref[0][0] + virtual_ref[0][0]) * h3;
  302. s->sprite_delta[0][1] = (-r * sprite_ref[0][0] + virtual_ref[1][0]) * w3;
  303. s->sprite_delta[1][0] = (-r * sprite_ref[0][1] + virtual_ref[0][1]) * h3;
  304. s->sprite_delta[1][1] = (-r * sprite_ref[0][1] + virtual_ref[1][1]) * w3;
  305. s->sprite_shift[0] = alpha + beta + rho - min_ab;
  306. s->sprite_shift[1] = alpha + beta + rho - min_ab + 2;
  307. break;
  308. }
  309. /* try to simplify the situation */
  310. if (s->sprite_delta[0][0] == a << s->sprite_shift[0] &&
  311. s->sprite_delta[0][1] == 0 &&
  312. s->sprite_delta[1][0] == 0 &&
  313. s->sprite_delta[1][1] == a << s->sprite_shift[0]) {
  314. s->sprite_offset[0][0] >>= s->sprite_shift[0];
  315. s->sprite_offset[0][1] >>= s->sprite_shift[0];
  316. s->sprite_offset[1][0] >>= s->sprite_shift[1];
  317. s->sprite_offset[1][1] >>= s->sprite_shift[1];
  318. s->sprite_delta[0][0] = a;
  319. s->sprite_delta[0][1] = 0;
  320. s->sprite_delta[1][0] = 0;
  321. s->sprite_delta[1][1] = a;
  322. s->sprite_shift[0] = 0;
  323. s->sprite_shift[1] = 0;
  324. s->real_sprite_warping_points = 1;
  325. } else {
  326. int shift_y = 16 - s->sprite_shift[0];
  327. int shift_c = 16 - s->sprite_shift[1];
  328. for (i = 0; i < 2; i++) {
  329. s->sprite_offset[0][i] <<= shift_y;
  330. s->sprite_offset[1][i] <<= shift_c;
  331. s->sprite_delta[0][i] <<= shift_y;
  332. s->sprite_delta[1][i] <<= shift_y;
  333. s->sprite_shift[i] = 16;
  334. }
  335. s->real_sprite_warping_points = s->num_sprite_warping_points;
  336. }
  337. return 0;
  338. }
  339. static int decode_new_pred(MpegEncContext *s, GetBitContext *gb) {
  340. int len = FFMIN(s->time_increment_bits + 3, 15);
  341. get_bits(gb, len);
  342. if (get_bits1(gb))
  343. get_bits(gb, len);
  344. check_marker(gb, "after new_pred");
  345. return 0;
  346. }
  347. /**
  348. * Decode the next video packet.
  349. * @return <0 if something went wrong
  350. */
  351. int ff_mpeg4_decode_video_packet_header(MpegEncContext *s)
  352. {
  353. int mb_num_bits = av_log2(s->mb_num - 1) + 1;
  354. int header_extension = 0, mb_num, len;
  355. /* is there enough space left for a video packet + header */
  356. if (get_bits_count(&s->gb) > s->gb.size_in_bits - 20)
  357. return -1;
  358. for (len = 0; len < 32; len++)
  359. if (get_bits1(&s->gb))
  360. break;
  361. if (len != ff_mpeg4_get_video_packet_prefix_length(s)) {
  362. av_log(s->avctx, AV_LOG_ERROR, "marker does not match f_code\n");
  363. return -1;
  364. }
  365. if (s->shape != RECT_SHAPE) {
  366. header_extension = get_bits1(&s->gb);
  367. // FIXME more stuff here
  368. }
  369. mb_num = get_bits(&s->gb, mb_num_bits);
  370. if (mb_num >= s->mb_num) {
  371. av_log(s->avctx, AV_LOG_ERROR,
  372. "illegal mb_num in video packet (%d %d) \n", mb_num, s->mb_num);
  373. return -1;
  374. }
  375. s->mb_x = mb_num % s->mb_width;
  376. s->mb_y = mb_num / s->mb_width;
  377. if (s->shape != BIN_ONLY_SHAPE) {
  378. int qscale = get_bits(&s->gb, s->quant_precision);
  379. if (qscale)
  380. s->chroma_qscale = s->qscale = qscale;
  381. }
  382. if (s->shape == RECT_SHAPE)
  383. header_extension = get_bits1(&s->gb);
  384. if (header_extension) {
  385. int time_incr = 0;
  386. while (get_bits1(&s->gb) != 0)
  387. time_incr++;
  388. check_marker(&s->gb, "before time_increment in video packed header");
  389. skip_bits(&s->gb, s->time_increment_bits); /* time_increment */
  390. check_marker(&s->gb, "before vop_coding_type in video packed header");
  391. skip_bits(&s->gb, 2); /* vop coding type */
  392. // FIXME not rect stuff here
  393. if (s->shape != BIN_ONLY_SHAPE) {
  394. skip_bits(&s->gb, 3); /* intra dc vlc threshold */
  395. // FIXME don't just ignore everything
  396. if (s->pict_type == AV_PICTURE_TYPE_S &&
  397. s->vol_sprite_usage == GMC_SPRITE) {
  398. if (mpeg4_decode_sprite_trajectory(s, &s->gb) < 0)
  399. return AVERROR_INVALIDDATA;
  400. av_log(s->avctx, AV_LOG_ERROR, "untested\n");
  401. }
  402. // FIXME reduced res stuff here
  403. if (s->pict_type != AV_PICTURE_TYPE_I) {
  404. int f_code = get_bits(&s->gb, 3); /* fcode_for */
  405. if (f_code == 0)
  406. av_log(s->avctx, AV_LOG_ERROR,
  407. "Error, video packet header damaged (f_code=0)\n");
  408. }
  409. if (s->pict_type == AV_PICTURE_TYPE_B) {
  410. int b_code = get_bits(&s->gb, 3);
  411. if (b_code == 0)
  412. av_log(s->avctx, AV_LOG_ERROR,
  413. "Error, video packet header damaged (b_code=0)\n");
  414. }
  415. }
  416. }
  417. if (s->new_pred)
  418. decode_new_pred(s, &s->gb);
  419. return 0;
  420. }
  421. /**
  422. * Get the average motion vector for a GMC MB.
  423. * @param n either 0 for the x component or 1 for y
  424. * @return the average MV for a GMC MB
  425. */
  426. static inline int get_amv(MpegEncContext *s, int n)
  427. {
  428. int x, y, mb_v, sum, dx, dy, shift;
  429. int len = 1 << (s->f_code + 4);
  430. const int a = s->sprite_warping_accuracy;
  431. if (s->workaround_bugs & FF_BUG_AMV)
  432. len >>= s->quarter_sample;
  433. if (s->real_sprite_warping_points == 1) {
  434. if (s->divx_version == 500 && s->divx_build == 413)
  435. sum = s->sprite_offset[0][n] / (1 << (a - s->quarter_sample));
  436. else
  437. sum = RSHIFT(s->sprite_offset[0][n] << s->quarter_sample, a);
  438. } else {
  439. dx = s->sprite_delta[n][0];
  440. dy = s->sprite_delta[n][1];
  441. shift = s->sprite_shift[0];
  442. if (n)
  443. dy -= 1 << (shift + a + 1);
  444. else
  445. dx -= 1 << (shift + a + 1);
  446. mb_v = s->sprite_offset[0][n] + dx * s->mb_x * 16 + dy * s->mb_y * 16;
  447. sum = 0;
  448. for (y = 0; y < 16; y++) {
  449. int v;
  450. v = mb_v + dy * y;
  451. // FIXME optimize
  452. for (x = 0; x < 16; x++) {
  453. sum += v >> shift;
  454. v += dx;
  455. }
  456. }
  457. sum = RSHIFT(sum, a + 8 - s->quarter_sample);
  458. }
  459. if (sum < -len)
  460. sum = -len;
  461. else if (sum >= len)
  462. sum = len - 1;
  463. return sum;
  464. }
  465. /**
  466. * Decode the dc value.
  467. * @param n block index (0-3 are luma, 4-5 are chroma)
  468. * @param dir_ptr the prediction direction will be stored here
  469. * @return the quantized dc
  470. */
  471. static inline int mpeg4_decode_dc(MpegEncContext *s, int n, int *dir_ptr)
  472. {
  473. int level, code;
  474. if (n < 4)
  475. code = get_vlc2(&s->gb, dc_lum.table, DC_VLC_BITS, 1);
  476. else
  477. code = get_vlc2(&s->gb, dc_chrom.table, DC_VLC_BITS, 1);
  478. if (code < 0 || code > 9 /* && s->nbit < 9 */) {
  479. av_log(s->avctx, AV_LOG_ERROR, "illegal dc vlc\n");
  480. return -1;
  481. }
  482. if (code == 0) {
  483. level = 0;
  484. } else {
  485. if (IS_3IV1) {
  486. if (code == 1)
  487. level = 2 * get_bits1(&s->gb) - 1;
  488. else {
  489. if (get_bits1(&s->gb))
  490. level = get_bits(&s->gb, code - 1) + (1 << (code - 1));
  491. else
  492. level = -get_bits(&s->gb, code - 1) - (1 << (code - 1));
  493. }
  494. } else {
  495. level = get_xbits(&s->gb, code);
  496. }
  497. if (code > 8) {
  498. if (get_bits1(&s->gb) == 0) { /* marker */
  499. if (s->err_recognition & (AV_EF_BITSTREAM|AV_EF_COMPLIANT)) {
  500. av_log(s->avctx, AV_LOG_ERROR, "dc marker bit missing\n");
  501. return -1;
  502. }
  503. }
  504. }
  505. }
  506. return ff_mpeg4_pred_dc(s, n, level, dir_ptr, 0);
  507. }
  508. /**
  509. * Decode first partition.
  510. * @return number of MBs decoded or <0 if an error occurred
  511. */
  /* Parses macroblocks starting at the current s->mb_x / s->mb_y until the
   * partition marker (DC_MARKER for I pictures, MOTION_MARKER otherwise) is
   * seen or the end of the picture is reached. For I pictures this reads the
   * MCBPC, optional dquant and the six DC values of each macroblock; for
   * other pictures it reads the skip flag, MCBPC and the motion vectors.
   * Results go into cbp_table, mb_type, qscale_table, mbintra_table,
   * pred_dir_table and motion_val of the current picture.
   * Returns the number of macroblocks parsed, or -1 on a corrupted code. */
  512. static int mpeg4_decode_partition_a(MpegEncContext *s)
  513. {
  /* counts macroblocks visited; incremented before each one is parsed */
  514. int mb_num = 0;
  /* qscale change selected by the 2-bit dquant field */
  515. static const int8_t quant_tab[4] = { -1, -2, 1, 2 };
  516. /* decode first partition */
  517. s->first_slice_line = 1;
  518. for (; s->mb_y < s->mb_height; s->mb_y++) {
  519. ff_init_block_index(s);
  520. for (; s->mb_x < s->mb_width; s->mb_x++) {
  521. const int xy = s->mb_x + s->mb_y * s->mb_stride;
  522. int cbpc;
  523. int dir = 0;
  524. mb_num++;
  525. ff_update_block_index(s);
  /* the first slice line ends once we are directly below the position
   * where this packet started */
  526. if (s->mb_x == s->resync_mb_x && s->mb_y == s->resync_mb_y + 1)
  527. s->first_slice_line = 0;
  528. if (s->pict_type == AV_PICTURE_TYPE_I) {
  529. int i;
  /* read the MCBPC, stopping at the DC marker; a value of 8 is read again
   * (NOTE(review): presumably the stuffing code - confirm against the
   * intra MCBPC table) */
  530. do {
  /* mb_num was already incremented for this position, hence the - 1 */
  531. if (show_bits_long(&s->gb, 19) == DC_MARKER)
  532. return mb_num - 1;
  533. cbpc = get_vlc2(&s->gb, ff_h263_intra_MCBPC_vlc.table, INTRA_MCBPC_VLC_BITS, 2);
  534. if (cbpc < 0) {
  535. av_log(s->avctx, AV_LOG_ERROR,
  536. "cbpc corrupted at %d %d\n", s->mb_x, s->mb_y);
  537. return -1;
  538. }
  539. } while (cbpc == 8);
  /* the low two bits are stored as the chroma part of the cbp; the luma
   * part is merged in by mpeg4_decode_partition_b() */
  540. s->cbp_table[xy] = cbpc & 3;
  541. s->current_picture.mb_type[xy] = MB_TYPE_INTRA;
  542. s->mb_intra = 1;
  /* bit 2 of the MCBPC signals that a dquant field follows */
  543. if (cbpc & 4)
  544. ff_set_qscale(s, s->qscale + quant_tab[get_bits(&s->gb, 2)]);
  545. s->current_picture.qscale_table[xy] = s->qscale;
  546. s->mbintra_table[xy] = 1;
  /* decode the six DC values and collect one prediction direction bit per
   * block; block 0 ends up in bit 5 of dir, block 5 in bit 0 */
  547. for (i = 0; i < 6; i++) {
  548. int dc_pred_dir;
  549. int dc = mpeg4_decode_dc(s, i, &dc_pred_dir);
  550. if (dc < 0) {
  551. av_log(s->avctx, AV_LOG_ERROR,
  552. "DC corrupted at %d %d\n", s->mb_x, s->mb_y);
  553. return -1;
  554. }
  555. dir <<= 1;
  556. if (dc_pred_dir)
  557. dir |= 1;
  558. }
  559. s->pred_dir_table[xy] = dir;
  560. } else { /* P/S_TYPE */
  561. int mx, my, pred_x, pred_y, bits;
  /* motion vectors of the first 8x8 block of this macroblock; the other
   * three are reached at offsets 2, stride and 2 + stride */
  562. int16_t *const mot_val = s->current_picture.motion_val[0][s->block_index[0]];
  563. const int stride = s->b8_stride * 2;
  564. try_again:
  /* peek far enough to recognize the motion marker ending the partition */
  565. bits = show_bits(&s->gb, 17);
  566. if (bits == MOTION_MARKER)
  567. return mb_num - 1;
  /* consume the first of the peeked bits; it is tested via bits below */
  568. skip_bits1(&s->gb);
  569. if (bits & 0x10000) {
  570. /* skip mb */
  571. if (s->pict_type == AV_PICTURE_TYPE_S &&
  572. s->vol_sprite_usage == GMC_SPRITE) {
  573. s->current_picture.mb_type[xy] = MB_TYPE_SKIP |
  574. MB_TYPE_16x16 |
  575. MB_TYPE_GMC |
  576. MB_TYPE_L0;
  /* skipped GMC macroblocks get the average global motion vector */
  577. mx = get_amv(s, 0);
  578. my = get_amv(s, 1);
  579. } else {
  580. s->current_picture.mb_type[xy] = MB_TYPE_SKIP |
  581. MB_TYPE_16x16 |
  582. MB_TYPE_L0;
  583. mx = my = 0;
  584. }
  /* store the same vector for all four 8x8 blocks */
  585. mot_val[0] =
  586. mot_val[2] =
  587. mot_val[0 + stride] =
  588. mot_val[2 + stride] = mx;
  589. mot_val[1] =
  590. mot_val[3] =
  591. mot_val[1 + stride] =
  592. mot_val[3 + stride] = my;
  593. if (s->mbintra_table[xy])
  594. ff_clean_intra_table_entries(s);
  595. continue;
  596. }
  597. cbpc = get_vlc2(&s->gb, ff_h263_inter_MCBPC_vlc.table, INTER_MCBPC_VLC_BITS, 2);
  598. if (cbpc < 0) {
  599. av_log(s->avctx, AV_LOG_ERROR,
  600. "cbpc corrupted at %d %d\n", s->mb_x, s->mb_y);
  601. return -1;
  602. }
  /* a value of 20 restarts the parsing of this macroblock
   * (NOTE(review): presumably the stuffing code - confirm against the
   * inter MCBPC table) */
  603. if (cbpc == 20)
  604. goto try_again;
  605. s->cbp_table[xy] = cbpc & (8 + 3); // 8 is dquant
  606. s->mb_intra = ((cbpc & 4) != 0);
  607. if (s->mb_intra) {
  608. s->current_picture.mb_type[xy] = MB_TYPE_INTRA;
  609. s->mbintra_table[xy] = 1;
  /* intra macroblocks store zero motion vectors */
  610. mot_val[0] =
  611. mot_val[2] =
  612. mot_val[0 + stride] =
  613. mot_val[2 + stride] = 0;
  614. mot_val[1] =
  615. mot_val[3] =
  616. mot_val[1 + stride] =
  617. mot_val[3 + stride] = 0;
  618. } else {
  619. if (s->mbintra_table[xy])
  620. ff_clean_intra_table_entries(s);
  /* the mcsel flag is only coded for 16x16 macroblocks of GMC sprite
   * pictures; bit 4 of the MCBPC selects four motion vectors instead */
  621. if (s->pict_type == AV_PICTURE_TYPE_S &&
  622. s->vol_sprite_usage == GMC_SPRITE &&
  623. (cbpc & 16) == 0)
  624. s->mcsel = get_bits1(&s->gb);
  625. else
  626. s->mcsel = 0;
  627. if ((cbpc & 16) == 0) {
  628. /* 16x16 motion prediction */
  629. ff_h263_pred_motion(s, 0, 0, &pred_x, &pred_y);
  630. if (!s->mcsel) {
  /* NOTE(review): values >= 0xffff are treated as a decoding failure of
   * ff_h263_decode_motion() - confirm against its definition */
  631. mx = ff_h263_decode_motion(s, pred_x, s->f_code);
  632. if (mx >= 0xffff)
  633. return -1;
  634. my = ff_h263_decode_motion(s, pred_y, s->f_code);
  635. if (my >= 0xffff)
  636. return -1;
  637. s->current_picture.mb_type[xy] = MB_TYPE_16x16 |
  638. MB_TYPE_L0;
  639. } else {
  640. mx = get_amv(s, 0);
  641. my = get_amv(s, 1);
  642. s->current_picture.mb_type[xy] = MB_TYPE_16x16 |
  643. MB_TYPE_GMC |
  644. MB_TYPE_L0;
  645. }
  646. mot_val[0] =
  647. mot_val[2] =
  648. mot_val[0 + stride] =
  649. mot_val[2 + stride] = mx;
  650. mot_val[1] =
  651. mot_val[3] =
  652. mot_val[1 + stride] =
  653. mot_val[3 + stride] = my;
  654. } else {
  655. int i;
  656. s->current_picture.mb_type[xy] = MB_TYPE_8x8 |
  657. MB_TYPE_L0;
  /* one vector per 8x8 block; this mot_val shadows the outer one and is
   * the pointer returned by ff_h263_pred_motion() for block i */
  658. for (i = 0; i < 4; i++) {
  659. int16_t *mot_val = ff_h263_pred_motion(s, i, 0, &pred_x, &pred_y);
  660. mx = ff_h263_decode_motion(s, pred_x, s->f_code);
  661. if (mx >= 0xffff)
  662. return -1;
  663. my = ff_h263_decode_motion(s, pred_y, s->f_code);
  664. if (my >= 0xffff)
  665. return -1;
  666. mot_val[0] = mx;
  667. mot_val[1] = my;
  668. }
  669. }
  670. }
  671. }
  672. }
  /* continue at the start of the next macroblock row */
  673. s->mb_x = 0;
  674. }
  /* reached the end of the picture without seeing a marker */
  675. return mb_num;
  676. }
  677. /**
  678. * decode second partition.
  679. * @return <0 if an error occurred
  680. */
  681. static int mpeg4_decode_partition_b(MpegEncContext *s, int mb_count)
  682. {
  683. int mb_num = 0;
  684. static const int8_t quant_tab[4] = { -1, -2, 1, 2 };
  685. s->mb_x = s->resync_mb_x;
  686. s->first_slice_line = 1;
  687. for (s->mb_y = s->resync_mb_y; mb_num < mb_count; s->mb_y++) {
  688. ff_init_block_index(s);
  689. for (; mb_num < mb_count && s->mb_x < s->mb_width; s->mb_x++) {
  690. const int xy = s->mb_x + s->mb_y * s->mb_stride;
  691. mb_num++;
  692. ff_update_block_index(s);
  693. if (s->mb_x == s->resync_mb_x && s->mb_y == s->resync_mb_y + 1)
  694. s->first_slice_line = 0;
  695. if (s->pict_type == AV_PICTURE_TYPE_I) {
  696. int ac_pred = get_bits1(&s->gb);
  697. int cbpy = get_vlc2(&s->gb, ff_h263_cbpy_vlc.table, CBPY_VLC_BITS, 1);
  698. if (cbpy < 0) {
  699. av_log(s->avctx, AV_LOG_ERROR,
  700. "cbpy corrupted at %d %d\n", s->mb_x, s->mb_y);
  701. return -1;
  702. }
  703. s->cbp_table[xy] |= cbpy << 2;
  704. s->current_picture.mb_type[xy] |= ac_pred * MB_TYPE_ACPRED;
  705. } else { /* P || S_TYPE */
  706. if (IS_INTRA(s->current_picture.mb_type[xy])) {
  707. int i;
  708. int dir = 0;
  709. int ac_pred = get_bits1(&s->gb);
  710. int cbpy = get_vlc2(&s->gb, ff_h263_cbpy_vlc.table, CBPY_VLC_BITS, 1);
  711. if (cbpy < 0) {
  712. av_log(s->avctx, AV_LOG_ERROR,
  713. "I cbpy corrupted at %d %d\n", s->mb_x, s->mb_y);
  714. return -1;
  715. }
  716. if (s->cbp_table[xy] & 8)
  717. ff_set_qscale(s, s->qscale + quant_tab[get_bits(&s->gb, 2)]);
  718. s->current_picture.qscale_table[xy] = s->qscale;
  719. for (i = 0; i < 6; i++) {
  720. int dc_pred_dir;
  721. int dc = mpeg4_decode_dc(s, i, &dc_pred_dir);
  722. if (dc < 0) {
  723. av_log(s->avctx, AV_LOG_ERROR,
  724. "DC corrupted at %d %d\n", s->mb_x, s->mb_y);
  725. return -1;
  726. }
  727. dir <<= 1;
  728. if (dc_pred_dir)
  729. dir |= 1;
  730. }
  731. s->cbp_table[xy] &= 3; // remove dquant
  732. s->cbp_table[xy] |= cbpy << 2;
  733. s->current_picture.mb_type[xy] |= ac_pred * MB_TYPE_ACPRED;
  734. s->pred_dir_table[xy] = dir;
  735. } else if (IS_SKIP(s->current_picture.mb_type[xy])) {
  736. s->current_picture.qscale_table[xy] = s->qscale;
  737. s->cbp_table[xy] = 0;
  738. } else {
  739. int cbpy = get_vlc2(&s->gb, ff_h263_cbpy_vlc.table, CBPY_VLC_BITS, 1);
  740. if (cbpy < 0) {
  741. av_log(s->avctx, AV_LOG_ERROR,
  742. "P cbpy corrupted at %d %d\n", s->mb_x, s->mb_y);
  743. return -1;
  744. }
  745. if (s->cbp_table[xy] & 8)
  746. ff_set_qscale(s, s->qscale + quant_tab[get_bits(&s->gb, 2)]);
  747. s->current_picture.qscale_table[xy] = s->qscale;
  748. s->cbp_table[xy] &= 3; // remove dquant
  749. s->cbp_table[xy] |= (cbpy ^ 0xf) << 2;
  750. }
  751. }
  752. }
  753. if (mb_num >= mb_count)
  754. return 0;
  755. s->mb_x = 0;
  756. }
  757. return 0;
  758. }
  759. /**
  760. * Decode the first and second partition.
  761. * @return <0 if error (and sets error type in the error_status_table)
  762. */
  763. int ff_mpeg4_decode_partitions(MpegEncContext *s)
  764. {
  765. int mb_num;
  766. const int part_a_error = s->pict_type == AV_PICTURE_TYPE_I ? (ER_DC_ERROR | ER_MV_ERROR) : ER_MV_ERROR;
  767. const int part_a_end = s->pict_type == AV_PICTURE_TYPE_I ? (ER_DC_END | ER_MV_END) : ER_MV_END;
  768. mb_num = mpeg4_decode_partition_a(s);
  769. if (mb_num < 0) {
  770. ff_er_add_slice(&s->er, s->resync_mb_x, s->resync_mb_y,
  771. s->mb_x, s->mb_y, part_a_error);
  772. return -1;
  773. }
  774. if (s->resync_mb_x + s->resync_mb_y * s->mb_width + mb_num > s->mb_num) {
  775. av_log(s->avctx, AV_LOG_ERROR, "slice below monitor ...\n");
  776. ff_er_add_slice(&s->er, s->resync_mb_x, s->resync_mb_y,
  777. s->mb_x, s->mb_y, part_a_error);
  778. return -1;
  779. }
  780. s->mb_num_left = mb_num;
  781. if (s->pict_type == AV_PICTURE_TYPE_I) {
  782. while (show_bits(&s->gb, 9) == 1)
  783. skip_bits(&s->gb, 9);
  784. if (get_bits_long(&s->gb, 19) != DC_MARKER) {
  785. av_log(s->avctx, AV_LOG_ERROR,
  786. "marker missing after first I partition at %d %d\n",
  787. s->mb_x, s->mb_y);
  788. return -1;
  789. }
  790. } else {
  791. while (show_bits(&s->gb, 10) == 1)
  792. skip_bits(&s->gb, 10);
  793. if (get_bits(&s->gb, 17) != MOTION_MARKER) {
  794. av_log(s->avctx, AV_LOG_ERROR,
  795. "marker missing after first P partition at %d %d\n",
  796. s->mb_x, s->mb_y);
  797. return -1;
  798. }
  799. }
  800. ff_er_add_slice(&s->er, s->resync_mb_x, s->resync_mb_y,
  801. s->mb_x - 1, s->mb_y, part_a_end);
  802. if (mpeg4_decode_partition_b(s, mb_num) < 0) {
  803. if (s->pict_type == AV_PICTURE_TYPE_P)
  804. ff_er_add_slice(&s->er, s->resync_mb_x, s->resync_mb_y,
  805. s->mb_x, s->mb_y, ER_DC_ERROR);
  806. return -1;
  807. } else {
  808. if (s->pict_type == AV_PICTURE_TYPE_P)
  809. ff_er_add_slice(&s->er, s->resync_mb_x, s->resync_mb_y,
  810. s->mb_x - 1, s->mb_y, ER_DC_END);
  811. }
  812. return 0;
  813. }
  814. /**
  815. * Decode a block.
  816. * @return <0 if an error occurred
  817. */
  818. static inline int mpeg4_decode_block(MpegEncContext *s, int16_t *block,
  819. int n, int coded, int intra, int rvlc)
  820. {
  821. int level, i, last, run, qmul, qadd;
  822. int av_uninit(dc_pred_dir);
  823. RLTable *rl;
  824. RL_VLC_ELEM *rl_vlc;
  825. const uint8_t *scan_table;
  826. // Note intra & rvlc should be optimized away if this is inlined
  827. if (intra) {
  828. if (s->use_intra_dc_vlc) {
  829. /* DC coef */
  830. if (s->partitioned_frame) {
  831. level = s->dc_val[0][s->block_index[n]];
  832. if (n < 4)
  833. level = FASTDIV((level + (s->y_dc_scale >> 1)), s->y_dc_scale);
  834. else
  835. level = FASTDIV((level + (s->c_dc_scale >> 1)), s->c_dc_scale);
  836. dc_pred_dir = (s->pred_dir_table[s->mb_x + s->mb_y * s->mb_stride] << n) & 32;
  837. } else {
  838. level = mpeg4_decode_dc(s, n, &dc_pred_dir);
  839. if (level < 0)
  840. return -1;
  841. }
  842. block[0] = level;
  843. i = 0;
  844. } else {
  845. i = -1;
  846. ff_mpeg4_pred_dc(s, n, 0, &dc_pred_dir, 0);
  847. }
  848. if (!coded)
  849. goto not_coded;
  850. if (rvlc) {
  851. rl = &ff_rvlc_rl_intra;
  852. rl_vlc = ff_rvlc_rl_intra.rl_vlc[0];
  853. } else {
  854. rl = &ff_mpeg4_rl_intra;
  855. rl_vlc = ff_mpeg4_rl_intra.rl_vlc[0];
  856. }
  857. if (s->ac_pred) {
  858. if (dc_pred_dir == 0)
  859. scan_table = s->intra_v_scantable.permutated; /* left */
  860. else
  861. scan_table = s->intra_h_scantable.permutated; /* top */
  862. } else {
  863. scan_table = s->intra_scantable.permutated;
  864. }
  865. qmul = 1;
  866. qadd = 0;
  867. } else {
  868. i = -1;
  869. if (!coded) {
  870. s->block_last_index[n] = i;
  871. return 0;
  872. }
  873. if (rvlc)
  874. rl = &ff_rvlc_rl_inter;
  875. else
  876. rl = &ff_h263_rl_inter;
  877. scan_table = s->intra_scantable.permutated;
  878. if (s->mpeg_quant) {
  879. qmul = 1;
  880. qadd = 0;
  881. if (rvlc)
  882. rl_vlc = ff_rvlc_rl_inter.rl_vlc[0];
  883. else
  884. rl_vlc = ff_h263_rl_inter.rl_vlc[0];
  885. } else {
  886. qmul = s->qscale << 1;
  887. qadd = (s->qscale - 1) | 1;
  888. if (rvlc)
  889. rl_vlc = ff_rvlc_rl_inter.rl_vlc[s->qscale];
  890. else
  891. rl_vlc = ff_h263_rl_inter.rl_vlc[s->qscale];
  892. }
  893. }
  894. {
  895. OPEN_READER(re, &s->gb);
  896. for (;;) {
  897. UPDATE_CACHE(re, &s->gb);
  898. GET_RL_VLC(level, run, re, &s->gb, rl_vlc, TEX_VLC_BITS, 2, 0);
  899. if (level == 0) {
  900. /* escape */
  901. if (rvlc) {
  902. if (SHOW_UBITS(re, &s->gb, 1) == 0) {
  903. av_log(s->avctx, AV_LOG_ERROR,
  904. "1. marker bit missing in rvlc esc\n");
  905. return -1;
  906. }
  907. SKIP_CACHE(re, &s->gb, 1);
  908. last = SHOW_UBITS(re, &s->gb, 1);
  909. SKIP_CACHE(re, &s->gb, 1);
  910. run = SHOW_UBITS(re, &s->gb, 6);
  911. SKIP_COUNTER(re, &s->gb, 1 + 1 + 6);
  912. UPDATE_CACHE(re, &s->gb);
  913. if (SHOW_UBITS(re, &s->gb, 1) == 0) {
  914. av_log(s->avctx, AV_LOG_ERROR,
  915. "2. marker bit missing in rvlc esc\n");
  916. return -1;
  917. }
  918. SKIP_CACHE(re, &s->gb, 1);
  919. level = SHOW_UBITS(re, &s->gb, 11);
  920. SKIP_CACHE(re, &s->gb, 11);
  921. if (SHOW_UBITS(re, &s->gb, 5) != 0x10) {
  922. av_log(s->avctx, AV_LOG_ERROR, "reverse esc missing\n");
  923. return -1;
  924. }
  925. SKIP_CACHE(re, &s->gb, 5);
  926. level = level * qmul + qadd;
  927. level = (level ^ SHOW_SBITS(re, &s->gb, 1)) - SHOW_SBITS(re, &s->gb, 1);
  928. SKIP_COUNTER(re, &s->gb, 1 + 11 + 5 + 1);
  929. i += run + 1;
  930. if (last)
  931. i += 192;
  932. } else {
  933. int cache;
  934. cache = GET_CACHE(re, &s->gb);
  935. if (IS_3IV1)
  936. cache ^= 0xC0000000;
  937. if (cache & 0x80000000) {
  938. if (cache & 0x40000000) {
  939. /* third escape */
  940. SKIP_CACHE(re, &s->gb, 2);
  941. last = SHOW_UBITS(re, &s->gb, 1);
  942. SKIP_CACHE(re, &s->gb, 1);
  943. run = SHOW_UBITS(re, &s->gb, 6);
  944. SKIP_COUNTER(re, &s->gb, 2 + 1 + 6);
  945. UPDATE_CACHE(re, &s->gb);
  946. if (IS_3IV1) {
  947. level = SHOW_SBITS(re, &s->gb, 12);
  948. LAST_SKIP_BITS(re, &s->gb, 12);
  949. } else {
  950. if (SHOW_UBITS(re, &s->gb, 1) == 0) {
  951. av_log(s->avctx, AV_LOG_ERROR,
  952. "1. marker bit missing in 3. esc\n");
  953. return -1;
  954. }
  955. SKIP_CACHE(re, &s->gb, 1);
  956. level = SHOW_SBITS(re, &s->gb, 12);
  957. SKIP_CACHE(re, &s->gb, 12);
  958. if (SHOW_UBITS(re, &s->gb, 1) == 0) {
  959. av_log(s->avctx, AV_LOG_ERROR,
  960. "2. marker bit missing in 3. esc\n");
  961. return -1;
  962. }
  963. SKIP_COUNTER(re, &s->gb, 1 + 12 + 1);
  964. }
  965. #if 0
  966. if (s->error_recognition >= FF_ER_COMPLIANT) {
  967. const int abs_level= FFABS(level);
  968. if (abs_level<=MAX_LEVEL && run<=MAX_RUN) {
  969. const int run1= run - rl->max_run[last][abs_level] - 1;
  970. if (abs_level <= rl->max_level[last][run]) {
  971. av_log(s->avctx, AV_LOG_ERROR, "illegal 3. esc, vlc encoding possible\n");
  972. return -1;
  973. }
  974. if (s->error_recognition > FF_ER_COMPLIANT) {
  975. if (abs_level <= rl->max_level[last][run]*2) {
  976. av_log(s->avctx, AV_LOG_ERROR, "illegal 3. esc, esc 1 encoding possible\n");
  977. return -1;
  978. }
  979. if (run1 >= 0 && abs_level <= rl->max_level[last][run1]) {
  980. av_log(s->avctx, AV_LOG_ERROR, "illegal 3. esc, esc 2 encoding possible\n");
  981. return -1;
  982. }
  983. }
  984. }
  985. }
  986. #endif
  987. if (level > 0)
  988. level = level * qmul + qadd;
  989. else
  990. level = level * qmul - qadd;
  991. if ((unsigned)(level + 2048) > 4095) {
  992. if (s->err_recognition & (AV_EF_BITSTREAM|AV_EF_AGGRESSIVE)) {
  993. if (level > 2560 || level < -2560) {
  994. av_log(s->avctx, AV_LOG_ERROR,
  995. "|level| overflow in 3. esc, qp=%d\n",
  996. s->qscale);
  997. return -1;
  998. }
  999. }
  1000. level = level < 0 ? -2048 : 2047;
  1001. }
  1002. i += run + 1;
  1003. if (last)
  1004. i += 192;
  1005. } else {
  1006. /* second escape */
  1007. SKIP_BITS(re, &s->gb, 2);
  1008. GET_RL_VLC(level, run, re, &s->gb, rl_vlc, TEX_VLC_BITS, 2, 1);
  1009. i += run + rl->max_run[run >> 7][level / qmul] + 1; // FIXME opt indexing
  1010. level = (level ^ SHOW_SBITS(re, &s->gb, 1)) - SHOW_SBITS(re, &s->gb, 1);
  1011. LAST_SKIP_BITS(re, &s->gb, 1);
  1012. }
  1013. } else {
  1014. /* first escape */
  1015. SKIP_BITS(re, &s->gb, 1);
  1016. GET_RL_VLC(level, run, re, &s->gb, rl_vlc, TEX_VLC_BITS, 2, 1);
  1017. i += run;
  1018. level = level + rl->max_level[run >> 7][(run - 1) & 63] * qmul; // FIXME opt indexing
  1019. level = (level ^ SHOW_SBITS(re, &s->gb, 1)) - SHOW_SBITS(re, &s->gb, 1);
  1020. LAST_SKIP_BITS(re, &s->gb, 1);
  1021. }
  1022. }
  1023. } else {
  1024. i += run;
  1025. level = (level ^ SHOW_SBITS(re, &s->gb, 1)) - SHOW_SBITS(re, &s->gb, 1);
  1026. LAST_SKIP_BITS(re, &s->gb, 1);
  1027. }
  1028. if (i > 62) {
  1029. i -= 192;
  1030. if (i & (~63)) {
  1031. av_log(s->avctx, AV_LOG_ERROR,
  1032. "ac-tex damaged at %d %d\n", s->mb_x, s->mb_y);
  1033. return -1;
  1034. }
  1035. block[scan_table[i]] = level;
  1036. break;
  1037. }
  1038. block[scan_table[i]] = level;
  1039. }
  1040. CLOSE_READER(re, &s->gb);
  1041. }
  1042. not_coded:
  1043. if (intra) {
  1044. if (!s->use_intra_dc_vlc) {
  1045. block[0] = ff_mpeg4_pred_dc(s, n, block[0], &dc_pred_dir, 0);
  1046. i -= i >> 31; // if (i == -1) i = 0;
  1047. }
  1048. ff_mpeg4_pred_ac(s, block, n, dc_pred_dir);
  1049. if (s->ac_pred)
  1050. i = 63; // FIXME not optimal
  1051. }
  1052. s->block_last_index[n] = i;
  1053. return 0;
  1054. }
  1055. /**
  1056. * decode partition C of one MB.
  1057. * @return <0 if an error occurred
  1058. */
  1059. static int mpeg4_decode_partitioned_mb(MpegEncContext *s, int16_t block[6][64])
  1060. {
  1061. int cbp, mb_type;
  1062. const int xy = s->mb_x + s->mb_y * s->mb_stride;
  1063. mb_type = s->current_picture.mb_type[xy];
  1064. cbp = s->cbp_table[xy];
  1065. s->use_intra_dc_vlc = s->qscale < s->intra_dc_threshold;
  1066. if (s->current_picture.qscale_table[xy] != s->qscale)
  1067. ff_set_qscale(s, s->current_picture.qscale_table[xy]);
  1068. if (s->pict_type == AV_PICTURE_TYPE_P ||
  1069. s->pict_type == AV_PICTURE_TYPE_S) {
  1070. int i;
  1071. for (i = 0; i < 4; i++) {
  1072. s->mv[0][i][0] = s->current_picture.motion_val[0][s->block_index[i]][0];
  1073. s->mv[0][i][1] = s->current_picture.motion_val[0][s->block_index[i]][1];
  1074. }
  1075. s->mb_intra = IS_INTRA(mb_type);
  1076. if (IS_SKIP(mb_type)) {
  1077. /* skip mb */
  1078. for (i = 0; i < 6; i++)
  1079. s->block_last_index[i] = -1;
  1080. s->mv_dir = MV_DIR_FORWARD;
  1081. s->mv_type = MV_TYPE_16X16;
  1082. if (s->pict_type == AV_PICTURE_TYPE_S
  1083. && s->vol_sprite_usage == GMC_SPRITE) {
  1084. s->mcsel = 1;
  1085. s->mb_skipped = 0;
  1086. } else {
  1087. s->mcsel = 0;
  1088. s->mb_skipped = 1;
  1089. }
  1090. } else if (s->mb_intra) {
  1091. s->ac_pred = IS_ACPRED(s->current_picture.mb_type[xy]);
  1092. } else if (!s->mb_intra) {
  1093. // s->mcsel = 0; // FIXME do we need to init that?
  1094. s->mv_dir = MV_DIR_FORWARD;
  1095. if (IS_8X8(mb_type)) {
  1096. s->mv_type = MV_TYPE_8X8;
  1097. } else {
  1098. s->mv_type = MV_TYPE_16X16;
  1099. }
  1100. }
  1101. } else { /* I-Frame */
  1102. s->mb_intra = 1;
  1103. s->ac_pred = IS_ACPRED(s->current_picture.mb_type[xy]);
  1104. }
  1105. if (!IS_SKIP(mb_type)) {
  1106. int i;
  1107. s->dsp.clear_blocks(s->block[0]);
  1108. /* decode each block */
  1109. for (i = 0; i < 6; i++) {
  1110. if (mpeg4_decode_block(s, block[i], i, cbp & 32, s->mb_intra, s->rvlc) < 0) {
  1111. av_log(s->avctx, AV_LOG_ERROR,
  1112. "texture corrupted at %d %d %d\n",
  1113. s->mb_x, s->mb_y, s->mb_intra);
  1114. return -1;
  1115. }
  1116. cbp += cbp;
  1117. }
  1118. }
  1119. /* per-MB end of slice check */
  1120. if (--s->mb_num_left <= 0) {
  1121. if (mpeg4_is_resync(s))
  1122. return SLICE_END;
  1123. else
  1124. return SLICE_NOEND;
  1125. } else {
  1126. if (mpeg4_is_resync(s)) {
  1127. const int delta = s->mb_x + 1 == s->mb_width ? 2 : 1;
  1128. if (s->cbp_table[xy + delta])
  1129. return SLICE_END;
  1130. }
  1131. return SLICE_OK;
  1132. }
  1133. }
  1134. static int mpeg4_decode_mb(MpegEncContext *s, int16_t block[6][64])
  1135. {
  1136. int cbpc, cbpy, i, cbp, pred_x, pred_y, mx, my, dquant;
  1137. int16_t *mot_val;
  1138. static int8_t quant_tab[4] = { -1, -2, 1, 2 };
  1139. const int xy = s->mb_x + s->mb_y * s->mb_stride;
  1140. av_assert2(s->h263_pred);
  1141. if (s->pict_type == AV_PICTURE_TYPE_P ||
  1142. s->pict_type == AV_PICTURE_TYPE_S) {
  1143. do {
  1144. if (get_bits1(&s->gb)) {
  1145. /* skip mb */
  1146. s->mb_intra = 0;
  1147. for (i = 0; i < 6; i++)
  1148. s->block_last_index[i] = -1;
  1149. s->mv_dir = MV_DIR_FORWARD;
  1150. s->mv_type = MV_TYPE_16X16;
  1151. if (s->pict_type == AV_PICTURE_TYPE_S &&
  1152. s->vol_sprite_usage == GMC_SPRITE) {
  1153. s->current_picture.mb_type[xy] = MB_TYPE_SKIP |
  1154. MB_TYPE_GMC |
  1155. MB_TYPE_16x16 |
  1156. MB_TYPE_L0;
  1157. s->mcsel = 1;
  1158. s->mv[0][0][0] = get_amv(s, 0);
  1159. s->mv[0][0][1] = get_amv(s, 1);
  1160. s->mb_skipped = 0;
  1161. } else {
  1162. s->current_picture.mb_type[xy] = MB_TYPE_SKIP |
  1163. MB_TYPE_16x16 |
  1164. MB_TYPE_L0;
  1165. s->mcsel = 0;
  1166. s->mv[0][0][0] = 0;
  1167. s->mv[0][0][1] = 0;
  1168. s->mb_skipped = 1;
  1169. }
  1170. goto end;
  1171. }
  1172. cbpc = get_vlc2(&s->gb, ff_h263_inter_MCBPC_vlc.table, INTER_MCBPC_VLC_BITS, 2);
  1173. if (cbpc < 0) {
  1174. av_log(s->avctx, AV_LOG_ERROR,
  1175. "cbpc damaged at %d %d\n", s->mb_x, s->mb_y);
  1176. return -1;
  1177. }
  1178. } while (cbpc == 20);
  1179. s->dsp.clear_blocks(s->block[0]);
  1180. dquant = cbpc & 8;
  1181. s->mb_intra = ((cbpc & 4) != 0);
  1182. if (s->mb_intra)
  1183. goto intra;
  1184. if (s->pict_type == AV_PICTURE_TYPE_S &&
  1185. s->vol_sprite_usage == GMC_SPRITE && (cbpc & 16) == 0)
  1186. s->mcsel = get_bits1(&s->gb);
  1187. else
  1188. s->mcsel = 0;
  1189. cbpy = get_vlc2(&s->gb, ff_h263_cbpy_vlc.table, CBPY_VLC_BITS, 1) ^ 0x0F;
  1190. cbp = (cbpc & 3) | (cbpy << 2);
  1191. if (dquant)
  1192. ff_set_qscale(s, s->qscale + quant_tab[get_bits(&s->gb, 2)]);
  1193. if ((!s->progressive_sequence) &&
  1194. (cbp || (s->workaround_bugs & FF_BUG_XVID_ILACE)))
  1195. s->interlaced_dct = get_bits1(&s->gb);
  1196. s->mv_dir = MV_DIR_FORWARD;
  1197. if ((cbpc & 16) == 0) {
  1198. if (s->mcsel) {
  1199. s->current_picture.mb_type[xy] = MB_TYPE_GMC |
  1200. MB_TYPE_16x16 |
  1201. MB_TYPE_L0;
  1202. /* 16x16 global motion prediction */
  1203. s->mv_type = MV_TYPE_16X16;
  1204. mx = get_amv(s, 0);
  1205. my = get_amv(s, 1);
  1206. s->mv[0][0][0] = mx;
  1207. s->mv[0][0][1] = my;
  1208. } else if ((!s->progressive_sequence) && get_bits1(&s->gb)) {
  1209. s->current_picture.mb_type[xy] = MB_TYPE_16x8 |
  1210. MB_TYPE_L0 |
  1211. MB_TYPE_INTERLACED;
  1212. /* 16x8 field motion prediction */
  1213. s->mv_type = MV_TYPE_FIELD;
  1214. s->field_select[0][0] = get_bits1(&s->gb);
  1215. s->field_select[0][1] = get_bits1(&s->gb);
  1216. ff_h263_pred_motion(s, 0, 0, &pred_x, &pred_y);
  1217. for (i = 0; i < 2; i++) {
  1218. mx = ff_h263_decode_motion(s, pred_x, s->f_code);
  1219. if (mx >= 0xffff)
  1220. return -1;
  1221. my = ff_h263_decode_motion(s, pred_y / 2, s->f_code);
  1222. if (my >= 0xffff)
  1223. return -1;
  1224. s->mv[0][i][0] = mx;
  1225. s->mv[0][i][1] = my;
  1226. }
  1227. } else {
  1228. s->current_picture.mb_type[xy] = MB_TYPE_16x16 | MB_TYPE_L0;
  1229. /* 16x16 motion prediction */
  1230. s->mv_type = MV_TYPE_16X16;
  1231. ff_h263_pred_motion(s, 0, 0, &pred_x, &pred_y);
  1232. mx = ff_h263_decode_motion(s, pred_x, s->f_code);
  1233. if (mx >= 0xffff)
  1234. return -1;
  1235. my = ff_h263_decode_motion(s, pred_y, s->f_code);
  1236. if (my >= 0xffff)
  1237. return -1;
  1238. s->mv[0][0][0] = mx;
  1239. s->mv[0][0][1] = my;
  1240. }
  1241. } else {
  1242. s->current_picture.mb_type[xy] = MB_TYPE_8x8 | MB_TYPE_L0;
  1243. s->mv_type = MV_TYPE_8X8;
  1244. for (i = 0; i < 4; i++) {
  1245. mot_val = ff_h263_pred_motion(s, i, 0, &pred_x, &pred_y);
  1246. mx = ff_h263_decode_motion(s, pred_x, s->f_code);
  1247. if (mx >= 0xffff)
  1248. return -1;
  1249. my = ff_h263_decode_motion(s, pred_y, s->f_code);
  1250. if (my >= 0xffff)
  1251. return -1;
  1252. s->mv[0][i][0] = mx;
  1253. s->mv[0][i][1] = my;
  1254. mot_val[0] = mx;
  1255. mot_val[1] = my;
  1256. }
  1257. }
  1258. } else if (s->pict_type == AV_PICTURE_TYPE_B) {
  1259. int modb1; // first bit of modb
  1260. int modb2; // second bit of modb
  1261. int mb_type;
  1262. s->mb_intra = 0; // B-frames never contain intra blocks
  1263. s->mcsel = 0; // ... true gmc blocks
  1264. if (s->mb_x == 0) {
  1265. for (i = 0; i < 2; i++) {
  1266. s->last_mv[i][0][0] =
  1267. s->last_mv[i][0][1] =
  1268. s->last_mv[i][1][0] =
  1269. s->last_mv[i][1][1] = 0;
  1270. }
  1271. ff_thread_await_progress(&s->next_picture_ptr->tf, s->mb_y, 0);
  1272. }
  1273. /* if we skipped it in the future P Frame than skip it now too */
  1274. s->mb_skipped = s->next_picture.mbskip_table[s->mb_y * s->mb_stride + s->mb_x]; // Note, skiptab=0 if last was GMC
  1275. if (s->mb_skipped) {
  1276. /* skip mb */
  1277. for (i = 0; i < 6; i++)
  1278. s->block_last_index[i] = -1;
  1279. s->mv_dir = MV_DIR_FORWARD;
  1280. s->mv_type = MV_TYPE_16X16;
  1281. s->mv[0][0][0] =
  1282. s->mv[0][0][1] =
  1283. s->mv[1][0][0] =
  1284. s->mv[1][0][1] = 0;
  1285. s->current_picture.mb_type[xy] = MB_TYPE_SKIP |
  1286. MB_TYPE_16x16 |
  1287. MB_TYPE_L0;
  1288. goto end;
  1289. }
  1290. modb1 = get_bits1(&s->gb);
  1291. if (modb1) {
  1292. // like MB_TYPE_B_DIRECT but no vectors coded
  1293. mb_type = MB_TYPE_DIRECT2 | MB_TYPE_SKIP | MB_TYPE_L0L1;
  1294. cbp = 0;
  1295. } else {
  1296. modb2 = get_bits1(&s->gb);
  1297. mb_type = get_vlc2(&s->gb, mb_type_b_vlc.table, MB_TYPE_B_VLC_BITS, 1);
  1298. if (mb_type < 0) {
  1299. av_log(s->avctx, AV_LOG_ERROR, "illegal MB_type\n");
  1300. return -1;
  1301. }
  1302. mb_type = mb_type_b_map[mb_type];
  1303. if (modb2) {
  1304. cbp = 0;
  1305. } else {
  1306. s->dsp.clear_blocks(s->block[0]);
  1307. cbp = get_bits(&s->gb, 6);
  1308. }
  1309. if ((!IS_DIRECT(mb_type)) && cbp) {
  1310. if (get_bits1(&s->gb))
  1311. ff_set_qscale(s, s->qscale + get_bits1(&s->gb) * 4 - 2);
  1312. }
  1313. if (!s->progressive_sequence) {
  1314. if (cbp)
  1315. s->interlaced_dct = get_bits1(&s->gb);
  1316. if (!IS_DIRECT(mb_type) && get_bits1(&s->gb)) {
  1317. mb_type |= MB_TYPE_16x8 | MB_TYPE_INTERLACED;
  1318. mb_type &= ~MB_TYPE_16x16;
  1319. if (USES_LIST(mb_type, 0)) {
  1320. s->field_select[0][0] = get_bits1(&s->gb);
  1321. s->field_select[0][1] = get_bits1(&s->gb);
  1322. }
  1323. if (USES_LIST(mb_type, 1)) {
  1324. s->field_select[1][0] = get_bits1(&s->gb);
  1325. s->field_select[1][1] = get_bits1(&s->gb);
  1326. }
  1327. }
  1328. }
  1329. s->mv_dir = 0;
  1330. if ((mb_type & (MB_TYPE_DIRECT2 | MB_TYPE_INTERLACED)) == 0) {
  1331. s->mv_type = MV_TYPE_16X16;
  1332. if (USES_LIST(mb_type, 0)) {
  1333. s->mv_dir = MV_DIR_FORWARD;
  1334. mx = ff_h263_decode_motion(s, s->last_mv[0][0][0], s->f_code);
  1335. my = ff_h263_decode_motion(s, s->last_mv[0][0][1], s->f_code);
  1336. s->last_mv[0][1][0] =
  1337. s->last_mv[0][0][0] =
  1338. s->mv[0][0][0] = mx;
  1339. s->last_mv[0][1][1] =
  1340. s->last_mv[0][0][1] =
  1341. s->mv[0][0][1] = my;
  1342. }
  1343. if (USES_LIST(mb_type, 1)) {
  1344. s->mv_dir |= MV_DIR_BACKWARD;
  1345. mx = ff_h263_decode_motion(s, s->last_mv[1][0][0], s->b_code);
  1346. my = ff_h263_decode_motion(s, s->last_mv[1][0][1], s->b_code);
  1347. s->last_mv[1][1][0] =
  1348. s->last_mv[1][0][0] =
  1349. s->mv[1][0][0] = mx;
  1350. s->last_mv[1][1][1] =
  1351. s->last_mv[1][0][1] =
  1352. s->mv[1][0][1] = my;
  1353. }
  1354. } else if (!IS_DIRECT(mb_type)) {
  1355. s->mv_type = MV_TYPE_FIELD;
  1356. if (USES_LIST(mb_type, 0)) {
  1357. s->mv_dir = MV_DIR_FORWARD;
  1358. for (i = 0; i < 2; i++) {
  1359. mx = ff_h263_decode_motion(s, s->last_mv[0][i][0], s->f_code);
  1360. my = ff_h263_decode_motion(s, s->last_mv[0][i][1] / 2, s->f_code);
  1361. s->last_mv[0][i][0] =
  1362. s->mv[0][i][0] = mx;
  1363. s->last_mv[0][i][1] = (s->mv[0][i][1] = my) * 2;
  1364. }
  1365. }
  1366. if (USES_LIST(mb_type, 1)) {
  1367. s->mv_dir |= MV_DIR_BACKWARD;
  1368. for (i = 0; i < 2; i++) {
  1369. mx = ff_h263_decode_motion(s, s->last_mv[1][i][0], s->b_code);
  1370. my = ff_h263_decode_motion(s, s->last_mv[1][i][1] / 2, s->b_code);
  1371. s->last_mv[1][i][0] =
  1372. s->mv[1][i][0] = mx;
  1373. s->last_mv[1][i][1] = (s->mv[1][i][1] = my) * 2;
  1374. }
  1375. }
  1376. }
  1377. }
  1378. if (IS_DIRECT(mb_type)) {
  1379. if (IS_SKIP(mb_type)) {
  1380. mx =
  1381. my = 0;
  1382. } else {
  1383. mx = ff_h263_decode_motion(s, 0, 1);
  1384. my = ff_h263_decode_motion(s, 0, 1);
  1385. }
  1386. s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD | MV_DIRECT;
  1387. mb_type |= ff_mpeg4_set_direct_mv(s, mx, my);
  1388. }
  1389. s->current_picture.mb_type[xy] = mb_type;
  1390. } else { /* I-Frame */
  1391. do {
  1392. cbpc = get_vlc2(&s->gb, ff_h263_intra_MCBPC_vlc.table, INTRA_MCBPC_VLC_BITS, 2);
  1393. if (cbpc < 0) {
  1394. av_log(s->avctx, AV_LOG_ERROR,
  1395. "I cbpc damaged at %d %d\n", s->mb_x, s->mb_y);
  1396. return -1;
  1397. }
  1398. } while (cbpc == 8);
  1399. dquant = cbpc & 4;
  1400. s->mb_intra = 1;
  1401. intra:
  1402. s->ac_pred = get_bits1(&s->gb);
  1403. if (s->ac_pred)
  1404. s->current_picture.mb_type[xy] = MB_TYPE_INTRA | MB_TYPE_ACPRED;
  1405. else
  1406. s->current_picture.mb_type[xy] = MB_TYPE_INTRA;
  1407. cbpy = get_vlc2(&s->gb, ff_h263_cbpy_vlc.table, CBPY_VLC_BITS, 1);
  1408. if (cbpy < 0) {
  1409. av_log(s->avctx, AV_LOG_ERROR,
  1410. "I cbpy damaged at %d %d\n", s->mb_x, s->mb_y);
  1411. return -1;
  1412. }
  1413. cbp = (cbpc & 3) | (cbpy << 2);
  1414. s->use_intra_dc_vlc = s->qscale < s->intra_dc_threshold;
  1415. if (dquant)
  1416. ff_set_qscale(s, s->qscale + quant_tab[get_bits(&s->gb, 2)]);
  1417. if (!s->progressive_sequence)
  1418. s->interlaced_dct = get_bits1(&s->gb);
  1419. s->dsp.clear_blocks(s->block[0]);
  1420. /* decode each block */
  1421. for (i = 0; i < 6; i++) {
  1422. if (mpeg4_decode_block(s, block[i], i, cbp & 32, 1, 0) < 0)
  1423. return -1;
  1424. cbp += cbp;
  1425. }
  1426. goto end;
  1427. }
  1428. /* decode each block */
  1429. for (i = 0; i < 6; i++) {
  1430. if (mpeg4_decode_block(s, block[i], i, cbp & 32, 0, 0) < 0)
  1431. return -1;
  1432. cbp += cbp;
  1433. }
  1434. end:
  1435. /* per-MB end of slice check */
  1436. if (s->codec_id == AV_CODEC_ID_MPEG4) {
  1437. int next = mpeg4_is_resync(s);
  1438. if (next) {
  1439. if (s->mb_x + s->mb_y*s->mb_width + 1 > next && (s->avctx->err_recognition & AV_EF_AGGRESSIVE)) {
  1440. return -1;
  1441. } else if (s->mb_x + s->mb_y*s->mb_width + 1 >= next)
  1442. return SLICE_END;
  1443. if (s->pict_type == AV_PICTURE_TYPE_B) {
  1444. const int delta= s->mb_x + 1 == s->mb_width ? 2 : 1;
  1445. ff_thread_await_progress(&s->next_picture_ptr->tf,
  1446. (s->mb_x + delta >= s->mb_width)
  1447. ? FFMIN(s->mb_y + 1, s->mb_height - 1)
  1448. : s->mb_y, 0);
  1449. if (s->next_picture.mbskip_table[xy + delta])
  1450. return SLICE_OK;
  1451. }
  1452. return SLICE_END;
  1453. }
  1454. }
  1455. return SLICE_OK;
  1456. }
  1457. static int mpeg4_decode_gop_header(MpegEncContext *s, GetBitContext *gb)
  1458. {
  1459. int hours, minutes, seconds;
  1460. if (!show_bits(gb, 23)) {
  1461. av_log(s->avctx, AV_LOG_WARNING, "GOP header invalid\n");
  1462. return -1;
  1463. }
  1464. hours = get_bits(gb, 5);
  1465. minutes = get_bits(gb, 6);
  1466. skip_bits1(gb);
  1467. seconds = get_bits(gb, 6);
  1468. s->time_base = seconds + 60*(minutes + 60*hours);
  1469. skip_bits1(gb);
  1470. skip_bits1(gb);
  1471. return 0;
  1472. }
  1473. static int mpeg4_decode_profile_level(MpegEncContext *s, GetBitContext *gb)
  1474. {
  1475. s->avctx->profile = get_bits(gb, 4);
  1476. s->avctx->level = get_bits(gb, 4);
  1477. // for Simple profile, level 0
  1478. if (s->avctx->profile == 0 && s->avctx->level == 8) {
  1479. s->avctx->level = 0;
  1480. }
  1481. return 0;
  1482. }
  1483. static int decode_vol_header(MpegEncContext *s, GetBitContext *gb)
  1484. {
  1485. int width, height, vo_ver_id;
  1486. /* vol header */
  1487. skip_bits(gb, 1); /* random access */
  1488. s->vo_type = get_bits(gb, 8);
  1489. if (get_bits1(gb) != 0) { /* is_ol_id */
  1490. vo_ver_id = get_bits(gb, 4); /* vo_ver_id */
  1491. skip_bits(gb, 3); /* vo_priority */
  1492. } else {
  1493. vo_ver_id = 1;
  1494. }
  1495. s->aspect_ratio_info = get_bits(gb, 4);
  1496. if (s->aspect_ratio_info == FF_ASPECT_EXTENDED) {
  1497. s->avctx->sample_aspect_ratio.num = get_bits(gb, 8); // par_width
  1498. s->avctx->sample_aspect_ratio.den = get_bits(gb, 8); // par_height
  1499. } else {
  1500. s->avctx->sample_aspect_ratio = ff_h263_pixel_aspect[s->aspect_ratio_info];
  1501. }
  1502. if ((s->vol_control_parameters = get_bits1(gb))) { /* vol control parameter */
  1503. int chroma_format = get_bits(gb, 2);
  1504. if (chroma_format != CHROMA_420)
  1505. av_log(s->avctx, AV_LOG_ERROR, "illegal chroma format\n");
  1506. s->low_delay = get_bits1(gb);
  1507. if (get_bits1(gb)) { /* vbv parameters */
  1508. get_bits(gb, 15); /* first_half_bitrate */
  1509. skip_bits1(gb); /* marker */
  1510. get_bits(gb, 15); /* latter_half_bitrate */
  1511. skip_bits1(gb); /* marker */
  1512. get_bits(gb, 15); /* first_half_vbv_buffer_size */
  1513. skip_bits1(gb); /* marker */
  1514. get_bits(gb, 3); /* latter_half_vbv_buffer_size */
  1515. get_bits(gb, 11); /* first_half_vbv_occupancy */
  1516. skip_bits1(gb); /* marker */
  1517. get_bits(gb, 15); /* latter_half_vbv_occupancy */
  1518. skip_bits1(gb); /* marker */
  1519. }
  1520. } else {
  1521. /* is setting low delay flag only once the smartest thing to do?
  1522. * low delay detection won't be overriden. */
  1523. if (s->picture_number == 0)
  1524. s->low_delay = 0;
  1525. }
  1526. s->shape = get_bits(gb, 2); /* vol shape */
  1527. if (s->shape != RECT_SHAPE)
  1528. av_log(s->avctx, AV_LOG_ERROR, "only rectangular vol supported\n");
  1529. if (s->shape == GRAY_SHAPE && vo_ver_id != 1) {
  1530. av_log(s->avctx, AV_LOG_ERROR, "Gray shape not supported\n");
  1531. skip_bits(gb, 4); /* video_object_layer_shape_extension */
  1532. }
  1533. check_marker(gb, "before time_increment_resolution");
  1534. s->avctx->time_base.den = get_bits(gb, 16);
  1535. if (!s->avctx->time_base.den) {
  1536. av_log(s->avctx, AV_LOG_ERROR, "time_base.den==0\n");
  1537. s->avctx->time_base.num = 0;
  1538. return -1;
  1539. }
  1540. s->time_increment_bits = av_log2(s->avctx->time_base.den - 1) + 1;
  1541. if (s->time_increment_bits < 1)
  1542. s->time_increment_bits = 1;
  1543. check_marker(gb, "before fixed_vop_rate");
  1544. if (get_bits1(gb) != 0) /* fixed_vop_rate */
  1545. s->avctx->time_base.num = get_bits(gb, s->time_increment_bits);
  1546. else
  1547. s->avctx->time_base.num = 1;
  1548. s->t_frame = 0;
  1549. if (s->shape != BIN_ONLY_SHAPE) {
  1550. if (s->shape == RECT_SHAPE) {
  1551. check_marker(gb, "before width");
  1552. width = get_bits(gb, 13);
  1553. check_marker(gb, "before height");
  1554. height = get_bits(gb, 13);
  1555. check_marker(gb, "after height");
  1556. if (width && height && /* they should be non zero but who knows */
  1557. !(s->width && s->codec_tag == AV_RL32("MP4S"))) {
  1558. if (s->width && s->height &&
  1559. (s->width != width || s->height != height))
  1560. s->context_reinit = 1;
  1561. s->width = width;
  1562. s->height = height;
  1563. }
  1564. }
  1565. s->progressive_sequence =
  1566. s->progressive_frame = get_bits1(gb) ^ 1;
  1567. s->interlaced_dct = 0;
  1568. if (!get_bits1(gb) && (s->avctx->debug & FF_DEBUG_PICT_INFO))
  1569. av_log(s->avctx, AV_LOG_INFO, /* OBMC Disable */
  1570. "MPEG4 OBMC not supported (very likely buggy encoder)\n");
  1571. if (vo_ver_id == 1)
  1572. s->vol_sprite_usage = get_bits1(gb); /* vol_sprite_usage */
  1573. else
  1574. s->vol_sprite_usage = get_bits(gb, 2); /* vol_sprite_usage */
  1575. if (s->vol_sprite_usage == STATIC_SPRITE)
  1576. av_log(s->avctx, AV_LOG_ERROR, "Static Sprites not supported\n");
  1577. if (s->vol_sprite_usage == STATIC_SPRITE ||
  1578. s->vol_sprite_usage == GMC_SPRITE) {
  1579. if (s->vol_sprite_usage == STATIC_SPRITE) {
  1580. s->sprite_width = get_bits(gb, 13);
  1581. skip_bits1(gb); /* marker */
  1582. s->sprite_height = get_bits(gb, 13);
  1583. skip_bits1(gb); /* marker */
  1584. s->sprite_left = get_bits(gb, 13);
  1585. skip_bits1(gb); /* marker */
  1586. s->sprite_top = get_bits(gb, 13);
  1587. skip_bits1(gb); /* marker */
  1588. }
  1589. s->num_sprite_warping_points = get_bits(gb, 6);
  1590. if (s->num_sprite_warping_points > 3) {
  1591. av_log(s->avctx, AV_LOG_ERROR,
  1592. "%d sprite_warping_points\n",
  1593. s->num_sprite_warping_points);
  1594. s->num_sprite_warping_points = 0;
  1595. return -1;
  1596. }
  1597. s->sprite_warping_accuracy = get_bits(gb, 2);
  1598. s->sprite_brightness_change = get_bits1(gb);
  1599. if (s->vol_sprite_usage == STATIC_SPRITE)
  1600. s->low_latency_sprite = get_bits1(gb);
  1601. }
  1602. // FIXME sadct disable bit if verid!=1 && shape not rect
  1603. if (get_bits1(gb) == 1) { /* not_8_bit */
  1604. s->quant_precision = get_bits(gb, 4); /* quant_precision */
  1605. if (get_bits(gb, 4) != 8) /* bits_per_pixel */
  1606. av_log(s->avctx, AV_LOG_ERROR, "N-bit not supported\n");
  1607. if (s->quant_precision != 5)
  1608. av_log(s->avctx, AV_LOG_ERROR,
  1609. "quant precision %d\n", s->quant_precision);
  1610. if (s->quant_precision<3 || s->quant_precision>9) {
  1611. s->quant_precision = 5;
  1612. }
  1613. } else {
  1614. s->quant_precision = 5;
  1615. }
  1616. // FIXME a bunch of grayscale shape things
  1617. if ((s->mpeg_quant = get_bits1(gb))) { /* vol_quant_type */
  1618. int i, v;
  1619. /* load default matrixes */
  1620. for (i = 0; i < 64; i++) {
  1621. int j = s->dsp.idct_permutation[i];
  1622. v = ff_mpeg4_default_intra_matrix[i];
  1623. s->intra_matrix[j] = v;
  1624. s->chroma_intra_matrix[j] = v;
  1625. v = ff_mpeg4_default_non_intra_matrix[i];
  1626. s->inter_matrix[j] = v;
  1627. s->chroma_inter_matrix[j] = v;
  1628. }
  1629. /* load custom intra matrix */
  1630. if (get_bits1(gb)) {
  1631. int last = 0;
  1632. for (i = 0; i < 64; i++) {
  1633. int j;
  1634. v = get_bits(gb, 8);
  1635. if (v == 0)
  1636. break;
  1637. last = v;
  1638. j = s->dsp.idct_permutation[ff_zigzag_direct[i]];
  1639. s->intra_matrix[j] = last;
  1640. s->chroma_intra_matrix[j] = last;
  1641. }
  1642. /* replicate last value */
  1643. for (; i < 64; i++) {
  1644. int j = s->dsp.idct_permutation[ff_zigzag_direct[i]];
  1645. s->intra_matrix[j] = last;
  1646. s->chroma_intra_matrix[j] = last;
  1647. }
  1648. }
  1649. /* load custom non intra matrix */
  1650. if (get_bits1(gb)) {
  1651. int last = 0;
  1652. for (i = 0; i < 64; i++) {
  1653. int j;
  1654. v = get_bits(gb, 8);
  1655. if (v == 0)
  1656. break;
  1657. last = v;
  1658. j = s->dsp.idct_permutation[ff_zigzag_direct[i]];
  1659. s->inter_matrix[j] = v;
  1660. s->chroma_inter_matrix[j] = v;
  1661. }
  1662. /* replicate last value */
  1663. for (; i < 64; i++) {
  1664. int j = s->dsp.idct_permutation[ff_zigzag_direct[i]];
  1665. s->inter_matrix[j] = last;
  1666. s->chroma_inter_matrix[j] = last;
  1667. }
  1668. }
  1669. // FIXME a bunch of grayscale shape things
  1670. }
  1671. if (vo_ver_id != 1)
  1672. s->quarter_sample = get_bits1(gb);
  1673. else
  1674. s->quarter_sample = 0;
  1675. if (!get_bits1(gb)) {
  1676. int pos = get_bits_count(gb);
  1677. int estimation_method = get_bits(gb, 2);
  1678. if (estimation_method < 2) {
  1679. if (!get_bits1(gb)) {
  1680. s->cplx_estimation_trash_i += 8 * get_bits1(gb); /* opaque */
  1681. s->cplx_estimation_trash_i += 8 * get_bits1(gb); /* transparent */
  1682. s->cplx_estimation_trash_i += 8 * get_bits1(gb); /* intra_cae */
  1683. s->cplx_estimation_trash_i += 8 * get_bits1(gb); /* inter_cae */
  1684. s->cplx_estimation_trash_i += 8 * get_bits1(gb); /* no_update */
  1685. s->cplx_estimation_trash_i += 8 * get_bits1(gb); /* upampling */
  1686. }
  1687. if (!get_bits1(gb)) {
  1688. s->cplx_estimation_trash_i += 8 * get_bits1(gb); /* intra_blocks */
  1689. s->cplx_estimation_trash_p += 8 * get_bits1(gb); /* inter_blocks */
  1690. s->cplx_estimation_trash_p += 8 * get_bits1(gb); /* inter4v_blocks */
  1691. s->cplx_estimation_trash_i += 8 * get_bits1(gb); /* not coded blocks */
  1692. }
  1693. if (!check_marker(gb, "in complexity estimation part 1")) {
  1694. skip_bits_long(gb, pos - get_bits_count(gb));
  1695. goto no_cplx_est;
  1696. }
  1697. if (!get_bits1(gb)) {
  1698. s->cplx_estimation_trash_i += 8 * get_bits1(gb); /* dct_coeffs */
  1699. s->cplx_estimation_trash_i += 8 * get_bits1(gb); /* dct_lines */
  1700. s->cplx_estimation_trash_i += 8 * get_bits1(gb); /* vlc_syms */
  1701. s->cplx_estimation_trash_i += 4 * get_bits1(gb); /* vlc_bits */
  1702. }
  1703. if (!get_bits1(gb)) {
  1704. s->cplx_estimation_trash_p += 8 * get_bits1(gb); /* apm */
  1705. s->cplx_estimation_trash_p += 8 * get_bits1(gb); /* npm */
  1706. s->cplx_estimation_trash_b += 8 * get_bits1(gb); /* interpolate_mc_q */
  1707. s->cplx_estimation_trash_p += 8 * get_bits1(gb); /* forwback_mc_q */
  1708. s->cplx_estimation_trash_p += 8 * get_bits1(gb); /* halfpel2 */
  1709. s->cplx_estimation_trash_p += 8 * get_bits1(gb); /* halfpel4 */
  1710. }
  1711. if (!check_marker(gb, "in complexity estimation part 2")) {
  1712. skip_bits_long(gb, pos - get_bits_count(gb));
  1713. goto no_cplx_est;
  1714. }
  1715. if (estimation_method == 1) {
  1716. s->cplx_estimation_trash_i += 8 * get_bits1(gb); /* sadct */
  1717. s->cplx_estimation_trash_p += 8 * get_bits1(gb); /* qpel */
  1718. }
  1719. } else
  1720. av_log(s->avctx, AV_LOG_ERROR,
  1721. "Invalid Complexity estimation method %d\n",
  1722. estimation_method);
  1723. } else {
  1724. no_cplx_est:
  1725. s->cplx_estimation_trash_i =
  1726. s->cplx_estimation_trash_p =
  1727. s->cplx_estimation_trash_b = 0;
  1728. }
  1729. s->resync_marker = !get_bits1(gb); /* resync_marker_disabled */
  1730. s->data_partitioning = get_bits1(gb);
  1731. if (s->data_partitioning)
  1732. s->rvlc = get_bits1(gb);
  1733. if (vo_ver_id != 1) {
  1734. s->new_pred = get_bits1(gb);
  1735. if (s->new_pred) {
  1736. av_log(s->avctx, AV_LOG_ERROR, "new pred not supported\n");
  1737. skip_bits(gb, 2); /* requested upstream message type */
  1738. skip_bits1(gb); /* newpred segment type */
  1739. }
  1740. s->reduced_res_vop = get_bits1(gb);
  1741. if (s->reduced_res_vop)
  1742. av_log(s->avctx, AV_LOG_ERROR,
  1743. "reduced resolution VOP not supported\n");
  1744. } else {
  1745. s->new_pred = 0;
  1746. s->reduced_res_vop = 0;
  1747. }
  1748. s->scalability = get_bits1(gb);
  1749. if (s->scalability) {
  1750. GetBitContext bak = *gb;
  1751. int h_sampling_factor_n;
  1752. int h_sampling_factor_m;
  1753. int v_sampling_factor_n;
  1754. int v_sampling_factor_m;
  1755. s->hierachy_type = get_bits1(gb);
  1756. skip_bits(gb, 4); /* ref_layer_id */
  1757. skip_bits1(gb); /* ref_layer_sampling_dir */
  1758. h_sampling_factor_n = get_bits(gb, 5);
  1759. h_sampling_factor_m = get_bits(gb, 5);
  1760. v_sampling_factor_n = get_bits(gb, 5);
  1761. v_sampling_factor_m = get_bits(gb, 5);
  1762. s->enhancement_type = get_bits1(gb);
  1763. if (h_sampling_factor_n == 0 || h_sampling_factor_m == 0 ||
  1764. v_sampling_factor_n == 0 || v_sampling_factor_m == 0) {
  1765. /* illegal scalability header (VERY broken encoder),
  1766. * trying to workaround */
  1767. s->scalability = 0;
  1768. *gb = bak;
  1769. } else
  1770. av_log(s->avctx, AV_LOG_ERROR, "scalability not supported\n");
  1771. // bin shape stuff FIXME
  1772. }
  1773. }
  1774. if (s->avctx->debug&FF_DEBUG_PICT_INFO) {
  1775. av_log(s->avctx, AV_LOG_DEBUG, "tb %d/%d, tincrbits:%d, qp_prec:%d, ps:%d, %s%s%s%s\n",
  1776. s->avctx->time_base.num, s->avctx->time_base.den,
  1777. s->time_increment_bits,
  1778. s->quant_precision,
  1779. s->progressive_sequence,
  1780. s->scalability ? "scalability " :"" , s->quarter_sample ? "qpel " : "",
  1781. s->data_partitioning ? "partition " : "", s->rvlc ? "rvlc " : ""
  1782. );
  1783. }
  1784. return 0;
  1785. }
  1786. /**
  1787. * Decode the user data stuff in the header.
  1788. * Also initializes divx/xvid/lavc_version/build.
  1789. */
  1790. static int decode_user_data(MpegEncContext *s, GetBitContext *gb)
  1791. {
  1792. char buf[256];
  1793. int i;
  1794. int e;
  1795. int ver = 0, build = 0, ver2 = 0, ver3 = 0;
  1796. char last;
  1797. for (i = 0; i < 255 && get_bits_count(gb) < gb->size_in_bits; i++) {
  1798. if (show_bits(gb, 23) == 0)
  1799. break;
  1800. buf[i] = get_bits(gb, 8);
  1801. }
  1802. buf[i] = 0;
  1803. /* divx detection */
  1804. e = sscanf(buf, "DivX%dBuild%d%c", &ver, &build, &last);
  1805. if (e < 2)
  1806. e = sscanf(buf, "DivX%db%d%c", &ver, &build, &last);
  1807. if (e >= 2) {
  1808. s->divx_version = ver;
  1809. s->divx_build = build;
  1810. s->divx_packed = e == 3 && last == 'p';
  1811. if (s->divx_packed && !s->showed_packed_warning) {
  1812. av_log(s->avctx, AV_LOG_INFO, "Video uses a non-standard and "
  1813. "wasteful way to store B-frames ('packed B-frames'). "
  1814. "Consider using a tool like VirtualDub or avidemux to fix it.\n");
  1815. s->showed_packed_warning = 1;
  1816. }
  1817. }
  1818. /* libavcodec detection */
  1819. e = sscanf(buf, "FFmpe%*[^b]b%d", &build) + 3;
  1820. if (e != 4)
  1821. e = sscanf(buf, "FFmpeg v%d.%d.%d / libavcodec build: %d", &ver, &ver2, &ver3, &build);
  1822. if (e != 4) {
  1823. e = sscanf(buf, "Lavc%d.%d.%d", &ver, &ver2, &ver3) + 1;
  1824. if (e > 1)
  1825. build = (ver << 16) + (ver2 << 8) + ver3;
  1826. }
  1827. if (e != 4) {
  1828. if (strcmp(buf, "ffmpeg") == 0)
  1829. s->lavc_build = 4600;
  1830. }
  1831. if (e == 4)
  1832. s->lavc_build = build;
  1833. /* Xvid detection */
  1834. e = sscanf(buf, "XviD%d", &build);
  1835. if (e == 1)
  1836. s->xvid_build = build;
  1837. return 0;
  1838. }
/**
 * Parse one VOP header from gb and update the decoder context accordingly.
 *
 * The fields are read strictly in bitstream order, so the statement order
 * in this function must not be changed. Besides the picture type and
 * timing values, this sets up the macroblock decode callback, the scan
 * tables, qscale, f_code/b_code and several workaround-related fields.
 *
 * @param s  decoder context to update
 * @param gb bit reader positioned right after the VOP start code
 * @return 0 on success, FRAME_SKIPPED when the VOP is not coded or a
 *         B-frame has inconsistent timing, -1 or AVERROR_INVALIDDATA when
 *         the header is damaged or truncated
 */
static int decode_vop_header(MpegEncContext *s, GetBitContext *gb)
{
    int time_incr, time_increment;
    int64_t pts;

    s->pict_type = get_bits(gb, 2) + AV_PICTURE_TYPE_I;        /* pict type: I = 0 , P = 1 */
    /* A B-frame contradicts low_delay; unless low delay was explicitly
     * requested or signalled through the VOL control parameters, drop it. */
    if (s->pict_type == AV_PICTURE_TYPE_B && s->low_delay &&
        s->vol_control_parameters == 0 && !(s->flags & CODEC_FLAG_LOW_DELAY)) {
        av_log(s->avctx, AV_LOG_ERROR, "low_delay flag incorrectly, clearing it\n");
        s->low_delay = 0;
    }

    /* B-frames are never treated as partitioned, even with data partitioning on */
    s->partitioned_frame = s->data_partitioning && s->pict_type != AV_PICTURE_TYPE_B;
    if (s->partitioned_frame)
        s->decode_mb = mpeg4_decode_partitioned_mb;
    else
        s->decode_mb = mpeg4_decode_mb;

    /* count the run of 1 bits that precedes the time increment; the
     * terminating 0 bit is consumed as well */
    time_incr = 0;
    while (get_bits1(gb) != 0)
        time_incr++;

    check_marker(gb, "before time_increment");

    /* If no width is known, or the bit right after the time increment field
     * (read as a marker further down) is not set, the configured width is
     * assumed to be wrong and a plausible one is searched for. */
    if (s->time_increment_bits == 0 ||
        !(show_bits(gb, s->time_increment_bits + 1) & 1)) {
        av_log(s->avctx, AV_LOG_ERROR,
               "hmm, seems the headers are not complete, trying to guess time_increment_bits\n");

        /* try widths 1..15 and stop at the first one for which the bits
         * following the candidate field match the expected pattern; the
         * pattern is one bit longer for P and GMC S pictures */
        for (s->time_increment_bits = 1;
             s->time_increment_bits < 16;
             s->time_increment_bits++) {
            if (s->pict_type == AV_PICTURE_TYPE_P ||
                (s->pict_type == AV_PICTURE_TYPE_S &&
                 s->vol_sprite_usage == GMC_SPRITE)) {
                if ((show_bits(gb, s->time_increment_bits + 6) & 0x37) == 0x30)
                    break;
            } else if ((show_bits(gb, s->time_increment_bits + 5) & 0x1F) == 0x18)
                break;
        }

        av_log(s->avctx, AV_LOG_ERROR,
               "my guess is %d bits ;)\n", s->time_increment_bits);
        /* enlarge the time base denominator when it is much smaller than
         * the range implied by the guessed width */
        if (s->avctx->time_base.den && 4*s->avctx->time_base.den < 1<<s->time_increment_bits) {
            s->avctx->time_base.den = 1<<s->time_increment_bits;
        }
    }

    if (IS_3IV1)
        time_increment = get_bits1(gb);        // FIXME investigate further
    else
        time_increment = get_bits(gb, s->time_increment_bits);

    if (s->pict_type != AV_PICTURE_TYPE_B) {
        /* non-B picture: advance the running time base and remember the
         * distance to the previous non-B picture in pp_time */
        s->last_time_base = s->time_base;
        s->time_base     += time_incr;
        s->time = s->time_base * s->avctx->time_base.den + time_increment;
        if (s->workaround_bugs & FF_BUG_UMP4) {
            if (s->time < s->last_non_b_time) {
                /* header is not mpeg-4-compatible, broken encoder,
                 * trying to workaround */
                s->time_base++;
                s->time += s->avctx->time_base.den;
            }
        }
        s->pp_time         = s->time - s->last_non_b_time;
        s->last_non_b_time = s->time;
    } else {
        /* B picture: its time is relative to last_time_base and must lie
         * strictly between the two surrounding non-B pictures */
        s->time    = (s->last_time_base + time_incr) * s->avctx->time_base.den + time_increment;
        s->pb_time = s->pp_time - (s->last_non_b_time - s->time);
        if (s->pp_time <= s->pb_time ||
            s->pp_time <= s->pp_time - s->pb_time ||
            s->pp_time <= 0) {
            /* messed up order, maybe after seeking? skipping current b-frame */
            return FRAME_SKIPPED;
        }
        ff_mpeg4_init_direct_mv(s);

        /* t_frame is set once, from the first B picture's pb_time */
        if (s->t_frame == 0)
            s->t_frame = s->pb_time;
        if (s->t_frame == 0)
            s->t_frame = 1;  // 1/0 protection
        s->pp_field_time = (ROUNDED_DIV(s->last_non_b_time, s->t_frame) -
                            ROUNDED_DIV(s->last_non_b_time - s->pp_time, s->t_frame)) * 2;
        s->pb_field_time = (ROUNDED_DIV(s->time, s->t_frame) -
                            ROUNDED_DIV(s->last_non_b_time - s->pp_time, s->t_frame)) * 2;
        if (!s->progressive_sequence) {
            if (s->pp_field_time <= s->pb_field_time || s->pb_field_time <= 1)
                return FRAME_SKIPPED;
        }
    }

    /* pts is only used for the debug message below */
    if (s->avctx->time_base.num)
        pts = ROUNDED_DIV(s->time, s->avctx->time_base.num);
    else
        pts = AV_NOPTS_VALUE;
    if (s->avctx->debug&FF_DEBUG_PTS)
        av_log(s->avctx, AV_LOG_DEBUG, "MPEG4 PTS: %"PRId64"\n",
               pts);

    check_marker(gb, "before vop_coded");

    /* vop coded */
    if (get_bits1(gb) != 1) {
        if (s->avctx->debug & FF_DEBUG_PICT_INFO)
            av_log(s->avctx, AV_LOG_ERROR, "vop not coded\n");
        return FRAME_SKIPPED;
    }
    if (s->new_pred)
        decode_new_pred(s, gb);

    if (s->shape != BIN_ONLY_SHAPE &&
        (s->pict_type == AV_PICTURE_TYPE_P ||
         (s->pict_type == AV_PICTURE_TYPE_S &&
          s->vol_sprite_usage == GMC_SPRITE))) {
        /* rounding type for motion estimation */
        s->no_rounding = get_bits1(gb);
    } else {
        s->no_rounding = 0;
    }
    // FIXME reduced res stuff

    /* non-rectangular shapes carry extra geometry fields; they are skipped */
    if (s->shape != RECT_SHAPE) {
        if (s->vol_sprite_usage != 1 || s->pict_type != AV_PICTURE_TYPE_I) {
            skip_bits(gb, 13);  /* width */
            skip_bits1(gb);     /* marker */
            skip_bits(gb, 13);  /* height */
            skip_bits1(gb);     /* marker */
            skip_bits(gb, 13);  /* hor_spat_ref */
            skip_bits1(gb);     /* marker */
            skip_bits(gb, 13);  /* ver_spat_ref */
        }
        skip_bits1(gb);         /* change_CR_disable */

        if (get_bits1(gb) != 0)
            skip_bits(gb, 8);   /* constant_alpha_value */
    }

    // FIXME complexity estimation stuff

    if (s->shape != BIN_ONLY_SHAPE) {
        /* skip the per-picture-type complexity estimation bit counts
         * stored in the context */
        skip_bits_long(gb, s->cplx_estimation_trash_i);
        if (s->pict_type != AV_PICTURE_TYPE_I)
            skip_bits_long(gb, s->cplx_estimation_trash_p);
        if (s->pict_type == AV_PICTURE_TYPE_B)
            skip_bits_long(gb, s->cplx_estimation_trash_b);

        /* make sure the 3-bit threshold index read below is available */
        if (get_bits_left(gb) < 3) {
            av_log(s->avctx, AV_LOG_ERROR, "Header truncated\n");
            return -1;
        }
        s->intra_dc_threshold = ff_mpeg4_dc_threshold[get_bits(gb, 3)];
        if (!s->progressive_sequence) {
            s->top_field_first = get_bits1(gb);
            s->alternate_scan  = get_bits1(gb);
        } else
            s->alternate_scan = 0;
    }

    /* (re)build all four scan tables according to alternate_scan */
    if (s->alternate_scan) {
        ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable,   ff_alternate_vertical_scan);
        ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable,   ff_alternate_vertical_scan);
        ff_init_scantable(s->dsp.idct_permutation, &s->intra_h_scantable, ff_alternate_vertical_scan);
        ff_init_scantable(s->dsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
    } else {
        ff_init_scantable(s->dsp.idct_permutation, &s->inter_scantable,   ff_zigzag_direct);
        ff_init_scantable(s->dsp.idct_permutation, &s->intra_scantable,   ff_zigzag_direct);
        ff_init_scantable(s->dsp.idct_permutation, &s->intra_h_scantable, ff_alternate_horizontal_scan);
        ff_init_scantable(s->dsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
    }

    if (s->pict_type == AV_PICTURE_TYPE_S &&
        (s->vol_sprite_usage == STATIC_SPRITE ||
         s->vol_sprite_usage == GMC_SPRITE)) {
        if (mpeg4_decode_sprite_trajectory(s, gb) < 0)
            return AVERROR_INVALIDDATA;
        /* the two conditions below are only reported, decoding continues */
        if (s->sprite_brightness_change)
            av_log(s->avctx, AV_LOG_ERROR,
                   "sprite_brightness_change not supported\n");
        if (s->vol_sprite_usage == STATIC_SPRITE)
            av_log(s->avctx, AV_LOG_ERROR, "static sprite not supported\n");
    }

    if (s->shape != BIN_ONLY_SHAPE) {
        s->chroma_qscale = s->qscale = get_bits(gb, s->quant_precision);
        if (s->qscale == 0) {
            av_log(s->avctx, AV_LOG_ERROR,
                   "Error, header damaged or not MPEG4 header (qscale=0)\n");
            return -1;  // makes no sense to continue, as there is nothing left from the image then
        }

        if (s->pict_type != AV_PICTURE_TYPE_I) {
            s->f_code = get_bits(gb, 3);        /* fcode_for */
            if (s->f_code == 0) {
                av_log(s->avctx, AV_LOG_ERROR,
                       "Error, header damaged or not MPEG4 header (f_code=0)\n");
                /* leave a non-zero value in the context before failing */
                s->f_code = 1;
                return -1;  // makes no sense to continue, as there is nothing left from the image then
            }
        } else
            s->f_code = 1;

        if (s->pict_type == AV_PICTURE_TYPE_B) {
            s->b_code = get_bits(gb, 3);
            if (s->b_code == 0) {
                av_log(s->avctx, AV_LOG_ERROR,
                       "Error, header damaged or not MPEG4 header (b_code=0)\n");
                /* leave a non-zero value in the context before failing */
                s->b_code=1;
                return -1; // makes no sense to continue, as the MV decoding will break very quickly
            }
        } else
            s->b_code = 1;

        if (s->avctx->debug & FF_DEBUG_PICT_INFO) {
            av_log(s->avctx, AV_LOG_DEBUG,
                   "qp:%d fc:%d,%d %s size:%d pro:%d alt:%d top:%d %spel part:%d resync:%d w:%d a:%d rnd:%d vot:%d%s dc:%d ce:%d/%d/%d time:%"PRId64" tincr:%d\n",
                   s->qscale, s->f_code, s->b_code,
                   s->pict_type == AV_PICTURE_TYPE_I ? "I" : (s->pict_type == AV_PICTURE_TYPE_P ? "P" : (s->pict_type == AV_PICTURE_TYPE_B ? "B" : "S")),
                   gb->size_in_bits,s->progressive_sequence, s->alternate_scan,
                   s->top_field_first, s->quarter_sample ? "q" : "h",
                   s->data_partitioning, s->resync_marker,
                   s->num_sprite_warping_points, s->sprite_warping_accuracy,
                   1 - s->no_rounding, s->vo_type,
                   s->vol_control_parameters ? " VOLC" : " ", s->intra_dc_threshold,
                   s->cplx_estimation_trash_i, s->cplx_estimation_trash_p,
                   s->cplx_estimation_trash_b,
                   s->time,
                   time_increment
                  );
        }

        if (!s->scalability) {
            if (s->shape != RECT_SHAPE && s->pict_type != AV_PICTURE_TYPE_I)
                skip_bits1(gb);  // vop shape coding type
        } else {
            if (s->enhancement_type) {
                int load_backward_shape = get_bits1(gb);
                if (load_backward_shape)
                    av_log(s->avctx, AV_LOG_ERROR,
                           "load backward shape isn't supported\n");
            }
            skip_bits(gb, 2);  // ref_select_code
        }
    }
    /* detect buggy encoders which don't set the low_delay flag
     * (divx4/xvid/opendivx). Note we cannot detect divx5 without b-frames
     * easily (although it's buggy too) */
    if (s->vo_type == 0 && s->vol_control_parameters == 0 &&
        s->divx_version == -1 && s->picture_number == 0) {
        av_log(s->avctx, AV_LOG_WARNING,
               "looks like this file was encoded with (divx4/(old)xvid/opendivx) -> forcing low_delay flag\n");
        s->low_delay = 1;
    }

    s->picture_number++;  // better than pic number==0 always ;)

    // FIXME add short header support
    s->y_dc_scale_table = ff_mpeg4_y_dc_scale_table;
    s->c_dc_scale_table = ff_mpeg4_c_dc_scale_table;

    /* with the EDGE workaround the edge positions are the plain picture
     * dimensions */
    if (s->workaround_bugs & FF_BUG_EDGE) {
        s->h_edge_pos = s->width;
        s->v_edge_pos = s->height;
    }
    return 0;
}
  2076. /**
  2077. * Decode mpeg4 headers.
  2078. * @return <0 if no VOP found (or a damaged one)
  2079. * FRAME_SKIPPED if a not coded VOP is found
  2080. * 0 if a VOP is found
  2081. */
  2082. int ff_mpeg4_decode_picture_header(MpegEncContext *s, GetBitContext *gb)
  2083. {
  2084. unsigned startcode, v;
  2085. /* search next start code */
  2086. align_get_bits(gb);
  2087. if (s->codec_tag == AV_RL32("WV1F") && show_bits(gb, 24) == 0x575630) {
  2088. skip_bits(gb, 24);
  2089. if (get_bits(gb, 8) == 0xF0)
  2090. goto end;
  2091. }
  2092. startcode = 0xff;
  2093. for (;;) {
  2094. if (get_bits_count(gb) >= gb->size_in_bits) {
  2095. if (gb->size_in_bits == 8 &&
  2096. (s->divx_version >= 0 || s->xvid_build >= 0) || s->codec_tag == AV_RL32("QMP4")) {
  2097. av_log(s->avctx, AV_LOG_VERBOSE, "frame skip %d\n", gb->size_in_bits);
  2098. return FRAME_SKIPPED; // divx bug
  2099. } else
  2100. return -1; // end of stream
  2101. }
  2102. /* use the bits after the test */
  2103. v = get_bits(gb, 8);
  2104. startcode = ((startcode << 8) | v) & 0xffffffff;
  2105. if ((startcode & 0xFFFFFF00) != 0x100)
  2106. continue; // no startcode
  2107. if (s->avctx->debug & FF_DEBUG_STARTCODE) {
  2108. av_log(s->avctx, AV_LOG_DEBUG, "startcode: %3X ", startcode);
  2109. if (startcode <= 0x11F)
  2110. av_log(s->avctx, AV_LOG_DEBUG, "Video Object Start");
  2111. else if (startcode <= 0x12F)
  2112. av_log(s->avctx, AV_LOG_DEBUG, "Video Object Layer Start");
  2113. else if (startcode <= 0x13F)
  2114. av_log(s->avctx, AV_LOG_DEBUG, "Reserved");
  2115. else if (startcode <= 0x15F)
  2116. av_log(s->avctx, AV_LOG_DEBUG, "FGS bp start");
  2117. else if (startcode <= 0x1AF)
  2118. av_log(s->avctx, AV_LOG_DEBUG, "Reserved");
  2119. else if (startcode == 0x1B0)
  2120. av_log(s->avctx, AV_LOG_DEBUG, "Visual Object Seq Start");
  2121. else if (startcode == 0x1B1)
  2122. av_log(s->avctx, AV_LOG_DEBUG, "Visual Object Seq End");
  2123. else if (startcode == 0x1B2)
  2124. av_log(s->avctx, AV_LOG_DEBUG, "User Data");
  2125. else if (startcode == 0x1B3)
  2126. av_log(s->avctx, AV_LOG_DEBUG, "Group of VOP start");
  2127. else if (startcode == 0x1B4)
  2128. av_log(s->avctx, AV_LOG_DEBUG, "Video Session Error");
  2129. else if (startcode == 0x1B5)
  2130. av_log(s->avctx, AV_LOG_DEBUG, "Visual Object Start");
  2131. else if (startcode == 0x1B6)
  2132. av_log(s->avctx, AV_LOG_DEBUG, "Video Object Plane start");
  2133. else if (startcode == 0x1B7)
  2134. av_log(s->avctx, AV_LOG_DEBUG, "slice start");
  2135. else if (startcode == 0x1B8)
  2136. av_log(s->avctx, AV_LOG_DEBUG, "extension start");
  2137. else if (startcode == 0x1B9)
  2138. av_log(s->avctx, AV_LOG_DEBUG, "fgs start");
  2139. else if (startcode == 0x1BA)
  2140. av_log(s->avctx, AV_LOG_DEBUG, "FBA Object start");
  2141. else if (startcode == 0x1BB)
  2142. av_log(s->avctx, AV_LOG_DEBUG, "FBA Object Plane start");
  2143. else if (startcode == 0x1BC)
  2144. av_log(s->avctx, AV_LOG_DEBUG, "Mesh Object start");
  2145. else if (startcode == 0x1BD)
  2146. av_log(s->avctx, AV_LOG_DEBUG, "Mesh Object Plane start");
  2147. else if (startcode == 0x1BE)
  2148. av_log(s->avctx, AV_LOG_DEBUG, "Still Texture Object start");
  2149. else if (startcode == 0x1BF)
  2150. av_log(s->avctx, AV_LOG_DEBUG, "Texture Spatial Layer start");
  2151. else if (startcode == 0x1C0)
  2152. av_log(s->avctx, AV_LOG_DEBUG, "Texture SNR Layer start");
  2153. else if (startcode == 0x1C1)
  2154. av_log(s->avctx, AV_LOG_DEBUG, "Texture Tile start");
  2155. else if (startcode == 0x1C2)
  2156. av_log(s->avctx, AV_LOG_DEBUG, "Texture Shape Layer start");
  2157. else if (startcode == 0x1C3)
  2158. av_log(s->avctx, AV_LOG_DEBUG, "stuffing start");
  2159. else if (startcode <= 0x1C5)
  2160. av_log(s->avctx, AV_LOG_DEBUG, "reserved");
  2161. else if (startcode <= 0x1FF)
  2162. av_log(s->avctx, AV_LOG_DEBUG, "System start");
  2163. av_log(s->avctx, AV_LOG_DEBUG, " at %d\n", get_bits_count(gb));
  2164. }
  2165. if (startcode >= 0x120 && startcode <= 0x12F) {
  2166. if (decode_vol_header(s, gb) < 0)
  2167. return -1;
  2168. } else if (startcode == USER_DATA_STARTCODE) {
  2169. decode_user_data(s, gb);
  2170. } else if (startcode == GOP_STARTCODE) {
  2171. mpeg4_decode_gop_header(s, gb);
  2172. } else if (startcode == VOS_STARTCODE) {
  2173. mpeg4_decode_profile_level(s, gb);
  2174. } else if (startcode == VOP_STARTCODE) {
  2175. break;
  2176. }
  2177. align_get_bits(gb);
  2178. startcode = 0xff;
  2179. }
  2180. end:
  2181. if (s->flags & CODEC_FLAG_LOW_DELAY)
  2182. s->low_delay = 1;
  2183. s->avctx->has_b_frames = !s->low_delay;
  2184. return decode_vop_header(s, gb);
  2185. }
  2186. av_cold void ff_mpeg4videodec_static_init(void) {
  2187. static int done = 0;
  2188. if (!done) {
  2189. ff_init_rl(&ff_mpeg4_rl_intra, ff_mpeg4_static_rl_table_store[0]);
  2190. ff_init_rl(&ff_rvlc_rl_inter, ff_mpeg4_static_rl_table_store[1]);
  2191. ff_init_rl(&ff_rvlc_rl_intra, ff_mpeg4_static_rl_table_store[2]);
  2192. INIT_VLC_RL(ff_mpeg4_rl_intra, 554);
  2193. INIT_VLC_RL(ff_rvlc_rl_inter, 1072);
  2194. INIT_VLC_RL(ff_rvlc_rl_intra, 1072);
  2195. INIT_VLC_STATIC(&dc_lum, DC_VLC_BITS, 10 /* 13 */,
  2196. &ff_mpeg4_DCtab_lum[0][1], 2, 1,
  2197. &ff_mpeg4_DCtab_lum[0][0], 2, 1, 512);
  2198. INIT_VLC_STATIC(&dc_chrom, DC_VLC_BITS, 10 /* 13 */,
  2199. &ff_mpeg4_DCtab_chrom[0][1], 2, 1,
  2200. &ff_mpeg4_DCtab_chrom[0][0], 2, 1, 512);
  2201. INIT_VLC_STATIC(&sprite_trajectory, SPRITE_TRAJ_VLC_BITS, 15,
  2202. &ff_sprite_trajectory_tab[0][1], 4, 2,
  2203. &ff_sprite_trajectory_tab[0][0], 4, 2, 128);
  2204. INIT_VLC_STATIC(&mb_type_b_vlc, MB_TYPE_B_VLC_BITS, 4,
  2205. &ff_mb_type_b_tab[0][1], 2, 1,
  2206. &ff_mb_type_b_tab[0][0], 2, 1, 16);
  2207. done = 1;
  2208. }
  2209. }
  2210. static int mpeg4_update_thread_context(AVCodecContext *dst,
  2211. const AVCodecContext *src)
  2212. {
  2213. Mpeg4DecContext *s = dst->priv_data;
  2214. const Mpeg4DecContext *s1 = src->priv_data;
  2215. int ret = ff_mpeg_update_thread_context(dst, src);
  2216. if (ret < 0)
  2217. return ret;
  2218. return 0;
  2219. }
  2220. static av_cold int decode_init(AVCodecContext *avctx)
  2221. {
  2222. Mpeg4DecContext *ctx = avctx->priv_data;
  2223. MpegEncContext *s = &ctx->m;
  2224. int ret;
  2225. s->divx_version =
  2226. s->divx_build =
  2227. s->xvid_build =
  2228. s->lavc_build = -1;
  2229. if ((ret = ff_h263_decode_init(avctx)) < 0)
  2230. return ret;
  2231. ff_mpeg4videodec_static_init();
  2232. s->h263_pred = 1;
  2233. s->low_delay = 0; /* default, might be overridden in the vol header during header parsing */
  2234. s->decode_mb = mpeg4_decode_mb;
  2235. s->time_increment_bits = 4; /* default value for broken headers */
  2236. avctx->chroma_sample_location = AVCHROMA_LOC_LEFT;
  2237. avctx->internal->allocate_progress = 1;
  2238. return 0;
  2239. }
  2240. static const AVProfile mpeg4_video_profiles[] = {
  2241. { FF_PROFILE_MPEG4_SIMPLE, "Simple Profile" },
  2242. { FF_PROFILE_MPEG4_SIMPLE_SCALABLE, "Simple Scalable Profile" },
  2243. { FF_PROFILE_MPEG4_CORE, "Core Profile" },
  2244. { FF_PROFILE_MPEG4_MAIN, "Main Profile" },
  2245. { FF_PROFILE_MPEG4_N_BIT, "N-bit Profile" },
  2246. { FF_PROFILE_MPEG4_SCALABLE_TEXTURE, "Scalable Texture Profile" },
  2247. { FF_PROFILE_MPEG4_SIMPLE_FACE_ANIMATION, "Simple Face Animation Profile" },
  2248. { FF_PROFILE_MPEG4_BASIC_ANIMATED_TEXTURE, "Basic Animated Texture Profile" },
  2249. { FF_PROFILE_MPEG4_HYBRID, "Hybrid Profile" },
  2250. { FF_PROFILE_MPEG4_ADVANCED_REAL_TIME, "Advanced Real Time Simple Profile" },
  2251. { FF_PROFILE_MPEG4_CORE_SCALABLE, "Code Scalable Profile" },
  2252. { FF_PROFILE_MPEG4_ADVANCED_CODING, "Advanced Coding Profile" },
  2253. { FF_PROFILE_MPEG4_ADVANCED_CORE, "Advanced Core Profile" },
  2254. { FF_PROFILE_MPEG4_ADVANCED_SCALABLE_TEXTURE, "Advanced Scalable Texture Profile" },
  2255. { FF_PROFILE_MPEG4_SIMPLE_STUDIO, "Simple Studio Profile" },
  2256. { FF_PROFILE_MPEG4_ADVANCED_SIMPLE, "Advanced Simple Profile" },
  2257. { FF_PROFILE_UNKNOWN },
  2258. };
  2259. static const AVOption mpeg4_options[] = {
  2260. {"quarter_sample", "1/4 subpel MC", offsetof(MpegEncContext, quarter_sample), FF_OPT_TYPE_INT, {.i64 = 0}, 0, 1, 0},
  2261. {"divx_packed", "divx style packed b frames", offsetof(MpegEncContext, divx_packed), FF_OPT_TYPE_INT, {.i64 = 0}, 0, 1, 0},
  2262. {NULL}
  2263. };
  2264. static const AVClass mpeg4_class = {
  2265. "MPEG4 Video Decoder",
  2266. av_default_item_name,
  2267. mpeg4_options,
  2268. LIBAVUTIL_VERSION_INT,
  2269. };
  2270. static const AVClass mpeg4_vdpau_class = {
  2271. "MPEG4 Video VDPAU Decoder",
  2272. av_default_item_name,
  2273. mpeg4_options,
  2274. LIBAVUTIL_VERSION_INT,
  2275. };
  2276. AVCodec ff_mpeg4_decoder = {
  2277. .name = "mpeg4",
  2278. .long_name = NULL_IF_CONFIG_SMALL("MPEG-4 part 2"),
  2279. .type = AVMEDIA_TYPE_VIDEO,
  2280. .id = AV_CODEC_ID_MPEG4,
  2281. .priv_data_size = sizeof(Mpeg4DecContext),
  2282. .init = decode_init,
  2283. .close = ff_h263_decode_end,
  2284. .decode = ff_h263_decode_frame,
  2285. .capabilities = CODEC_CAP_DRAW_HORIZ_BAND | CODEC_CAP_DR1 |
  2286. CODEC_CAP_TRUNCATED | CODEC_CAP_DELAY |
  2287. CODEC_CAP_FRAME_THREADS,
  2288. .flush = ff_mpeg_flush,
  2289. .max_lowres = 3,
  2290. .pix_fmts = ff_h263_hwaccel_pixfmt_list_420,
  2291. .profiles = NULL_IF_CONFIG_SMALL(mpeg4_video_profiles),
  2292. .update_thread_context = ONLY_IF_THREADS_ENABLED(mpeg4_update_thread_context),
  2293. .priv_class = &mpeg4_class,
  2294. };
  2295. #if CONFIG_MPEG4_VDPAU_DECODER
  2296. AVCodec ff_mpeg4_vdpau_decoder = {
  2297. .name = "mpeg4_vdpau",
  2298. .long_name = NULL_IF_CONFIG_SMALL("MPEG-4 part 2 (VDPAU)"),
  2299. .type = AVMEDIA_TYPE_VIDEO,
  2300. .id = AV_CODEC_ID_MPEG4,
  2301. .priv_data_size = sizeof(MpegEncContext),
  2302. .init = decode_init,
  2303. .close = ff_h263_decode_end,
  2304. .decode = ff_h263_decode_frame,
  2305. .capabilities = CODEC_CAP_DR1 | CODEC_CAP_TRUNCATED | CODEC_CAP_DELAY |
  2306. CODEC_CAP_HWACCEL_VDPAU,
  2307. .pix_fmts = (const enum AVPixelFormat[]) { AV_PIX_FMT_VDPAU_MPEG4,
  2308. AV_PIX_FMT_NONE },
  2309. .priv_class = &mpeg4_vdpau_class,
  2310. };
  2311. #endif