You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

3605 lines
136KB

  1. /*
  2. * MPEG-4 decoder
  3. * Copyright (c) 2000,2001 Fabrice Bellard
  4. * Copyright (c) 2002-2010 Michael Niedermayer <michaelni@gmx.at>
  5. *
  6. * This file is part of FFmpeg.
  7. *
  8. * FFmpeg is free software; you can redistribute it and/or
  9. * modify it under the terms of the GNU Lesser General Public
  10. * License as published by the Free Software Foundation; either
  11. * version 2.1 of the License, or (at your option) any later version.
  12. *
  13. * FFmpeg is distributed in the hope that it will be useful,
  14. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  16. * Lesser General Public License for more details.
  17. *
  18. * You should have received a copy of the GNU Lesser General Public
  19. * License along with FFmpeg; if not, write to the Free Software
  20. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21. */
  22. #define UNCHECKED_BITSTREAM_READER 1
  23. #include "libavutil/internal.h"
  24. #include "libavutil/opt.h"
  25. #include "libavutil/pixdesc.h"
  26. #include "libavutil/thread.h"
  27. #include "error_resilience.h"
  28. #include "hwconfig.h"
  29. #include "idctdsp.h"
  30. #include "internal.h"
  31. #include "mpegutils.h"
  32. #include "mpegvideo.h"
  33. #include "mpegvideodata.h"
  34. #include "mpeg4video.h"
  35. #include "h263.h"
  36. #include "profiles.h"
  37. #include "thread.h"
  38. #include "xvididct.h"
  39. #include "unary.h"
  40. /* The defines below set the number of bits that are read at once when
  41. * reading VLC values. Changing them may improve speed and data-cache usage;
  42. * be aware, though, that decreasing them may require increasing the number
  43. * of stages that is passed to get_vlc*. */
  44. #define SPRITE_TRAJ_VLC_BITS 6
  45. #define DC_VLC_BITS 9
  46. #define MB_TYPE_B_VLC_BITS 4
  47. #define STUDIO_INTRA_BITS 9
  /* VLC tables for the luma and chroma DC codes, read in mpeg4_decode_dc()
   * with DC_VLC_BITS. */
  48. static VLC dc_lum, dc_chrom;
  /* VLC table for the bit length of each sprite trajectory component, read in
   * mpeg4_decode_sprite_trajectory() with SPRITE_TRAJ_VLC_BITS. */
  49. static VLC sprite_trajectory;
  /* The tables below are not referenced in the part of the file visible here;
   * presumably they are initialised and used further down -- TODO confirm. */
  50. static VLC mb_type_b_vlc;
  51. static VLC studio_intra_tab[12];
  52. static VLC studio_luma_dc;
  53. static VLC studio_chroma_dc;
  /* Macroblock type flags for four B-frame macroblock modes; presumably indexed
   * by the code read through mb_type_b_vlc -- TODO confirm against the user. */
  54. static const int mb_type_b_map[4] = {
  55. MB_TYPE_DIRECT2 | MB_TYPE_L0L1,
  56. MB_TYPE_L0L1 | MB_TYPE_16x16,
  57. MB_TYPE_L1 | MB_TYPE_16x16,
  58. MB_TYPE_L0 | MB_TYPE_16x16,
  59. };
  60. /**
  61. * Predict the ac.
  62. * @param n block index (0-3 are luma, 4-5 are chroma)
  63. * @param dir the ac prediction direction
  64. */
  65. void ff_mpeg4_pred_ac(MpegEncContext *s, int16_t *block, int n, int dir)
  66. {
  67. int i;
  68. int16_t *ac_val, *ac_val1;
  69. int8_t *const qscale_table = s->current_picture.qscale_table;
  70. /* find prediction */
  71. ac_val = &s->ac_val[0][0][0] + s->block_index[n] * 16;
  72. ac_val1 = ac_val;
  73. if (s->ac_pred) {
  74. if (dir == 0) {
  75. const int xy = s->mb_x - 1 + s->mb_y * s->mb_stride;
  76. /* left prediction */
  77. ac_val -= 16;
  78. if (s->mb_x == 0 || s->qscale == qscale_table[xy] ||
  79. n == 1 || n == 3) {
  80. /* same qscale */
  81. for (i = 1; i < 8; i++)
  82. block[s->idsp.idct_permutation[i << 3]] += ac_val[i];
  83. } else {
  84. /* different qscale, we must rescale */
  85. for (i = 1; i < 8; i++)
  86. block[s->idsp.idct_permutation[i << 3]] += ROUNDED_DIV(ac_val[i] * qscale_table[xy], s->qscale);
  87. }
  88. } else {
  89. const int xy = s->mb_x + s->mb_y * s->mb_stride - s->mb_stride;
  90. /* top prediction */
  91. ac_val -= 16 * s->block_wrap[n];
  92. if (s->mb_y == 0 || s->qscale == qscale_table[xy] ||
  93. n == 2 || n == 3) {
  94. /* same qscale */
  95. for (i = 1; i < 8; i++)
  96. block[s->idsp.idct_permutation[i]] += ac_val[i + 8];
  97. } else {
  98. /* different qscale, we must rescale */
  99. for (i = 1; i < 8; i++)
  100. block[s->idsp.idct_permutation[i]] += ROUNDED_DIV(ac_val[i + 8] * qscale_table[xy], s->qscale);
  101. }
  102. }
  103. }
  104. /* left copy */
  105. for (i = 1; i < 8; i++)
  106. ac_val1[i] = block[s->idsp.idct_permutation[i << 3]];
  107. /* top copy */
  108. for (i = 1; i < 8; i++)
  109. ac_val1[8 + i] = block[s->idsp.idct_permutation[i]];
  110. }
  111. /**
  112. * check if the next stuff is a resync marker or the end.
  113. * @return 0 if not
  114. */
  115. static inline int mpeg4_is_resync(Mpeg4DecContext *ctx)
  116. {
  117. MpegEncContext *s = &ctx->m;
  118. int bits_count = get_bits_count(&s->gb);
  119. int v = show_bits(&s->gb, 16);
  120. if (s->workaround_bugs & FF_BUG_NO_PADDING && !ctx->resync_marker)
  121. return 0;
  122. while (v <= 0xFF) {
  123. if (s->pict_type == AV_PICTURE_TYPE_B ||
  124. (v >> (8 - s->pict_type) != 1) || s->partitioned_frame)
  125. break;
  126. skip_bits(&s->gb, 8 + s->pict_type);
  127. bits_count += 8 + s->pict_type;
  128. v = show_bits(&s->gb, 16);
  129. }
  130. if (bits_count + 8 >= s->gb.size_in_bits) {
  131. v >>= 8;
  132. v |= 0x7F >> (7 - (bits_count & 7));
  133. if (v == 0x7F)
  134. return s->mb_num;
  135. } else {
  136. if (v == ff_mpeg4_resync_prefix[bits_count & 7]) {
  137. int len, mb_num;
  138. int mb_num_bits = av_log2(s->mb_num - 1) + 1;
  139. GetBitContext gb = s->gb;
  140. skip_bits(&s->gb, 1);
  141. align_get_bits(&s->gb);
  142. for (len = 0; len < 32; len++)
  143. if (get_bits1(&s->gb))
  144. break;
  145. mb_num = get_bits(&s->gb, mb_num_bits);
  146. if (!mb_num || mb_num > s->mb_num || get_bits_count(&s->gb)+6 > s->gb.size_in_bits)
  147. mb_num= -1;
  148. s->gb = gb;
  149. if (len >= ff_mpeg4_get_video_packet_prefix_length(s))
  150. return mb_num;
  151. }
  152. }
  153. return 0;
  154. }
  /**
   * Read the sprite trajectory points from the bitstream and derive the
   * sprite offset, delta and shift values from them.
   *
   * ctx->sprite_traj and ctx->sprite_shift are written while decoding. On
   * success s->sprite_offset, s->sprite_delta and
   * s->real_sprite_warping_points are set as well.
   *
   * @param ctx decoder context; num_sprite_warping_points, divx_version and
   *            divx_build are read from it
   * @param gb  bit reader to take the trajectory points from
   * @return 0 on success, AVERROR_INVALIDDATA if the picture width or height
   *         is not positive, AVERROR_PATCHWELCOME (with s->sprite_offset and
   *         s->sprite_delta zeroed) if the derived values would overflow
   */
  155. static int mpeg4_decode_sprite_trajectory(Mpeg4DecContext *ctx, GetBitContext *gb)
  156. {
  157. MpegEncContext *s = &ctx->m;
  158. int a = 2 << s->sprite_warping_accuracy;
  159. int rho = 3 - s->sprite_warping_accuracy;
  160. int r = 16 / a;
  161. int alpha = 1;
  162. int beta = 0;
  163. int w = s->width;
  164. int h = s->height;
  165. int min_ab, i, w2, h2, w3, h3;
  166. int sprite_ref[4][2];
  167. int virtual_ref[2][2];
  168. int64_t sprite_offset[2][2];
  169. int64_t sprite_delta[2][2];
  170. // only true for rectangle shapes
  171. const int vop_ref[4][2] = { { 0, 0 }, { s->width, 0 },
  172. { 0, s->height }, { s->width, s->height } };
  173. int d[4][2] = { { 0, 0 }, { 0, 0 }, { 0, 0 }, { 0, 0 } };
  174. if (w <= 0 || h <= 0)
  175. return AVERROR_INVALIDDATA;
  /* Each warping point is coded as an x and a y component; each component is
   * a VLC giving a bit length followed by that many bits read with
   * get_xbits(). A marker is checked after each component, except that the
   * marker after x is not read for DivX version 500 build 413.
   * NOTE(review): d[] and ctx->sprite_traj are indexed by i, so this assumes
   * num_sprite_warping_points <= 4 -- confirm it is validated by the caller. */
  176. for (i = 0; i < ctx->num_sprite_warping_points; i++) {
  177. int length;
  178. int x = 0, y = 0;
  179. length = get_vlc2(gb, sprite_trajectory.table, SPRITE_TRAJ_VLC_BITS, 2);
  180. if (length > 0)
  181. x = get_xbits(gb, length);
  182. if (!(ctx->divx_version == 500 && ctx->divx_build == 413))
  183. check_marker(s->avctx, gb, "before sprite_trajectory");
  184. length = get_vlc2(gb, sprite_trajectory.table, SPRITE_TRAJ_VLC_BITS, 2);
  185. if (length > 0)
  186. y = get_xbits(gb, length);
  187. check_marker(s->avctx, gb, "after sprite_trajectory");
  188. ctx->sprite_traj[i][0] = d[i][0] = x;
  189. ctx->sprite_traj[i][1] = d[i][1] = y;
  190. }
  /* clear the trajectory entries that were not coded */
  191. for (; i < 4; i++)
  192. ctx->sprite_traj[i][0] = ctx->sprite_traj[i][1] = 0;
  /* alpha (>= 1) and beta (>= 0) are the smallest exponents for which
   * 2^alpha >= w and 2^beta >= h; w2 and h2 are those powers of two */
  193. while ((1 << alpha) < w)
  194. alpha++;
  195. while ((1 << beta) < h)
  196. beta++; /* typo in the MPEG-4 std for the definition of w' and h' */
  197. w2 = 1 << alpha;
  198. h2 = 1 << beta;
  199. // Note, the 4th point isn't used for GMC
  /* DivX 500 build 413 gets its own sprite_ref formula (a * vop_ref + d
   * instead of (a >> 1) * (2 * vop_ref + d)) */
  200. if (ctx->divx_version == 500 && ctx->divx_build == 413) {
  201. sprite_ref[0][0] = a * vop_ref[0][0] + d[0][0];
  202. sprite_ref[0][1] = a * vop_ref[0][1] + d[0][1];
  203. sprite_ref[1][0] = a * vop_ref[1][0] + d[0][0] + d[1][0];
  204. sprite_ref[1][1] = a * vop_ref[1][1] + d[0][1] + d[1][1];
  205. sprite_ref[2][0] = a * vop_ref[2][0] + d[0][0] + d[2][0];
  206. sprite_ref[2][1] = a * vop_ref[2][1] + d[0][1] + d[2][1];
  207. } else {
  208. sprite_ref[0][0] = (a >> 1) * (2 * vop_ref[0][0] + d[0][0]);
  209. sprite_ref[0][1] = (a >> 1) * (2 * vop_ref[0][1] + d[0][1]);
  210. sprite_ref[1][0] = (a >> 1) * (2 * vop_ref[1][0] + d[0][0] + d[1][0]);
  211. sprite_ref[1][1] = (a >> 1) * (2 * vop_ref[1][1] + d[0][1] + d[1][1]);
  212. sprite_ref[2][0] = (a >> 1) * (2 * vop_ref[2][0] + d[0][0] + d[2][0]);
  213. sprite_ref[2][1] = (a >> 1) * (2 * vop_ref[2][1] + d[0][1] + d[2][1]);
  214. }
  215. /* sprite_ref[3][0] = (a >> 1) * (2 * vop_ref[3][0] + d[0][0] + d[1][0] + d[2][0] + d[3][0]);
  216. * sprite_ref[3][1] = (a >> 1) * (2 * vop_ref[3][1] + d[0][1] + d[1][1] + d[2][1] + d[3][1]); */
  217. /* This is mostly identical to the MPEG-4 std (and is totally unreadable
  218. * because of that...). Perhaps it should be reordered to be more readable.
  219. * The idea behind this virtual_ref mess is to be able to use shifts later
  220. * per pixel instead of divides so the distance between points is converted
  221. * from w&h based to w2&h2 based which are of the 2^x form. */
  222. virtual_ref[0][0] = 16 * (vop_ref[0][0] + w2) +
  223. ROUNDED_DIV(((w - w2) *
  224. (r * sprite_ref[0][0] - 16LL * vop_ref[0][0]) +
  225. w2 * (r * sprite_ref[1][0] - 16LL * vop_ref[1][0])), w);
  226. virtual_ref[0][1] = 16 * vop_ref[0][1] +
  227. ROUNDED_DIV(((w - w2) *
  228. (r * sprite_ref[0][1] - 16LL * vop_ref[0][1]) +
  229. w2 * (r * sprite_ref[1][1] - 16LL * vop_ref[1][1])), w);
  230. virtual_ref[1][0] = 16 * vop_ref[0][0] +
  231. ROUNDED_DIV(((h - h2) * (r * sprite_ref[0][0] - 16LL * vop_ref[0][0]) +
  232. h2 * (r * sprite_ref[2][0] - 16LL * vop_ref[2][0])), h);
  233. virtual_ref[1][1] = 16 * (vop_ref[0][1] + h2) +
  234. ROUNDED_DIV(((h - h2) * (r * sprite_ref[0][1] - 16LL * vop_ref[0][1]) +
  235. h2 * (r * sprite_ref[2][1] - 16LL * vop_ref[2][1])), h);
  /* NOTE(review): there is no default case, so for any point count other than
   * 0..3 sprite_offset and sprite_delta stay uninitialised before being read
   * below -- confirm that the caller restricts num_sprite_warping_points. */
  236. switch (ctx->num_sprite_warping_points) {
  237. case 0:
  238. sprite_offset[0][0] =
  239. sprite_offset[0][1] =
  240. sprite_offset[1][0] =
  241. sprite_offset[1][1] = 0;
  242. sprite_delta[0][0] = a;
  243. sprite_delta[0][1] =
  244. sprite_delta[1][0] = 0;
  245. sprite_delta[1][1] = a;
  246. ctx->sprite_shift[0] =
  247. ctx->sprite_shift[1] = 0;
  248. break;
  249. case 1: // GMC only
  250. sprite_offset[0][0] = sprite_ref[0][0] - a * vop_ref[0][0];
  251. sprite_offset[0][1] = sprite_ref[0][1] - a * vop_ref[0][1];
  252. sprite_offset[1][0] = ((sprite_ref[0][0] >> 1) | (sprite_ref[0][0] & 1)) -
  253. a * (vop_ref[0][0] / 2);
  254. sprite_offset[1][1] = ((sprite_ref[0][1] >> 1) | (sprite_ref[0][1] & 1)) -
  255. a * (vop_ref[0][1] / 2);
  256. sprite_delta[0][0] = a;
  257. sprite_delta[0][1] =
  258. sprite_delta[1][0] = 0;
  259. sprite_delta[1][1] = a;
  260. ctx->sprite_shift[0] =
  261. ctx->sprite_shift[1] = 0;
  262. break;
  263. case 2:
  /* '+' binds tighter than '<<', so "1 << alpha + rho" below is
   * 1 << (alpha + rho) */
  264. sprite_offset[0][0] = ((int64_t) sprite_ref[0][0] * (1 << alpha + rho)) +
  265. ((int64_t) -r * sprite_ref[0][0] + virtual_ref[0][0]) *
  266. ((int64_t) -vop_ref[0][0]) +
  267. ((int64_t) r * sprite_ref[0][1] - virtual_ref[0][1]) *
  268. ((int64_t) -vop_ref[0][1]) + (1 << (alpha + rho - 1));
  269. sprite_offset[0][1] = ((int64_t) sprite_ref[0][1] * (1 << alpha + rho)) +
  270. ((int64_t) -r * sprite_ref[0][1] + virtual_ref[0][1]) *
  271. ((int64_t) -vop_ref[0][0]) +
  272. ((int64_t) -r * sprite_ref[0][0] + virtual_ref[0][0]) *
  273. ((int64_t) -vop_ref[0][1]) + (1 << (alpha + rho - 1));
  274. sprite_offset[1][0] = (((int64_t)-r * sprite_ref[0][0] + virtual_ref[0][0]) *
  275. ((int64_t)-2 * vop_ref[0][0] + 1) +
  276. ((int64_t) r * sprite_ref[0][1] - virtual_ref[0][1]) *
  277. ((int64_t)-2 * vop_ref[0][1] + 1) + 2 * w2 * r *
  278. (int64_t) sprite_ref[0][0] - 16 * w2 + (1 << (alpha + rho + 1)));
  279. sprite_offset[1][1] = (((int64_t)-r * sprite_ref[0][1] + virtual_ref[0][1]) *
  280. ((int64_t)-2 * vop_ref[0][0] + 1) +
  281. ((int64_t)-r * sprite_ref[0][0] + virtual_ref[0][0]) *
  282. ((int64_t)-2 * vop_ref[0][1] + 1) + 2 * w2 * r *
  283. (int64_t) sprite_ref[0][1] - 16 * w2 + (1 << (alpha + rho + 1)));
  284. sprite_delta[0][0] = (-r * sprite_ref[0][0] + virtual_ref[0][0]);
  285. sprite_delta[0][1] = (+r * sprite_ref[0][1] - virtual_ref[0][1]);
  286. sprite_delta[1][0] = (-r * sprite_ref[0][1] + virtual_ref[0][1]);
  287. sprite_delta[1][1] = (-r * sprite_ref[0][0] + virtual_ref[0][0]);
  288. ctx->sprite_shift[0] = alpha + rho;
  289. ctx->sprite_shift[1] = alpha + rho + 2;
  290. break;
  291. case 3:
  /* w3/h3 are w2/h2 with their common power-of-two factor removed */
  292. min_ab = FFMIN(alpha, beta);
  293. w3 = w2 >> min_ab;
  294. h3 = h2 >> min_ab;
  295. sprite_offset[0][0] = ((int64_t)sprite_ref[0][0] * (1 << (alpha + beta + rho - min_ab))) +
  296. ((int64_t)-r * sprite_ref[0][0] + virtual_ref[0][0]) * h3 * (-vop_ref[0][0]) +
  297. ((int64_t)-r * sprite_ref[0][0] + virtual_ref[1][0]) * w3 * (-vop_ref[0][1]) +
  298. ((int64_t)1 << (alpha + beta + rho - min_ab - 1));
  299. sprite_offset[0][1] = ((int64_t)sprite_ref[0][1] * (1 << (alpha + beta + rho - min_ab))) +
  300. ((int64_t)-r * sprite_ref[0][1] + virtual_ref[0][1]) * h3 * (-vop_ref[0][0]) +
  301. ((int64_t)-r * sprite_ref[0][1] + virtual_ref[1][1]) * w3 * (-vop_ref[0][1]) +
  302. ((int64_t)1 << (alpha + beta + rho - min_ab - 1));
  303. sprite_offset[1][0] = ((int64_t)-r * sprite_ref[0][0] + virtual_ref[0][0]) * h3 * (-2 * vop_ref[0][0] + 1) +
  304. ((int64_t)-r * sprite_ref[0][0] + virtual_ref[1][0]) * w3 * (-2 * vop_ref[0][1] + 1) +
  305. (int64_t)2 * w2 * h3 * r * sprite_ref[0][0] - 16 * w2 * h3 +
  306. ((int64_t)1 << (alpha + beta + rho - min_ab + 1));
  307. sprite_offset[1][1] = ((int64_t)-r * sprite_ref[0][1] + virtual_ref[0][1]) * h3 * (-2 * vop_ref[0][0] + 1) +
  308. ((int64_t)-r * sprite_ref[0][1] + virtual_ref[1][1]) * w3 * (-2 * vop_ref[0][1] + 1) +
  309. (int64_t)2 * w2 * h3 * r * sprite_ref[0][1] - 16 * w2 * h3 +
  310. ((int64_t)1 << (alpha + beta + rho - min_ab + 1));
  311. sprite_delta[0][0] = (-r * (int64_t)sprite_ref[0][0] + virtual_ref[0][0]) * h3;
  312. sprite_delta[0][1] = (-r * (int64_t)sprite_ref[0][0] + virtual_ref[1][0]) * w3;
  313. sprite_delta[1][0] = (-r * (int64_t)sprite_ref[0][1] + virtual_ref[0][1]) * h3;
  314. sprite_delta[1][1] = (-r * (int64_t)sprite_ref[0][1] + virtual_ref[1][1]) * w3;
  315. ctx->sprite_shift[0] = alpha + beta + rho - min_ab;
  316. ctx->sprite_shift[1] = alpha + beta + rho - min_ab + 2;
  317. break;
  318. }
  319. /* try to simplify the situation */
  /* If the delta matrix is just the scaled identity, drop the shifts and treat
   * the warp as a single-point one (real_sprite_warping_points = 1). */
  320. if (sprite_delta[0][0] == a << ctx->sprite_shift[0] &&
  321. sprite_delta[0][1] == 0 &&
  322. sprite_delta[1][0] == 0 &&
  323. sprite_delta[1][1] == a << ctx->sprite_shift[0]) {
  324. sprite_offset[0][0] >>= ctx->sprite_shift[0];
  325. sprite_offset[0][1] >>= ctx->sprite_shift[0];
  326. sprite_offset[1][0] >>= ctx->sprite_shift[1];
  327. sprite_offset[1][1] >>= ctx->sprite_shift[1];
  328. sprite_delta[0][0] = a;
  329. sprite_delta[0][1] = 0;
  330. sprite_delta[1][0] = 0;
  331. sprite_delta[1][1] = a;
  332. ctx->sprite_shift[0] = 0;
  333. ctx->sprite_shift[1] = 0;
  334. s->real_sprite_warping_points = 1;
  335. } else {
  /* Otherwise rescale everything so that both shifts become 16, rejecting
   * inputs for which the rescaled values would not fit into an int. */
  336. int shift_y = 16 - ctx->sprite_shift[0];
  337. int shift_c = 16 - ctx->sprite_shift[1];
  338. for (i = 0; i < 2; i++) {
  339. if (shift_c < 0 || shift_y < 0 ||
  340. FFABS( sprite_offset[0][i]) >= INT_MAX >> shift_y ||
  341. FFABS( sprite_offset[1][i]) >= INT_MAX >> shift_c ||
  342. FFABS( sprite_delta[0][i]) >= INT_MAX >> shift_y ||
  343. FFABS( sprite_delta[1][i]) >= INT_MAX >> shift_y
  344. ) {
  345. avpriv_request_sample(s->avctx, "Too large sprite shift, delta or offset");
  346. goto overflow;
  347. }
  348. }
  349. for (i = 0; i < 2; i++) {
  350. sprite_offset[0][i] *= 1 << shift_y;
  351. sprite_offset[1][i] *= 1 << shift_c;
  352. sprite_delta[0][i] *= 1 << shift_y;
  353. sprite_delta[1][i] *= 1 << shift_y;
  354. ctx->sprite_shift[i] = 16;
  355. }
  /* Reject values whose products with (w + 16) and (h + 16), with and without
   * a * 2^16 subtracted from the deltas, would reach INT_MAX in magnitude. */
  356. for (i = 0; i < 2; i++) {
  357. int64_t sd[2] = {
  358. sprite_delta[i][0] - a * (1LL<<16),
  359. sprite_delta[i][1] - a * (1LL<<16)
  360. };
  361. if (llabs(sprite_offset[0][i] + sprite_delta[i][0] * (w+16LL)) >= INT_MAX ||
  362. llabs(sprite_offset[0][i] + sprite_delta[i][1] * (h+16LL)) >= INT_MAX ||
  363. llabs(sprite_offset[0][i] + sprite_delta[i][0] * (w+16LL) + sprite_delta[i][1] * (h+16LL)) >= INT_MAX ||
  364. llabs(sprite_delta[i][0] * (w+16LL)) >= INT_MAX ||
  365. llabs(sprite_delta[i][1] * (h+16LL)) >= INT_MAX ||
  366. llabs(sd[0]) >= INT_MAX ||
  367. llabs(sd[1]) >= INT_MAX ||
  368. llabs(sprite_offset[0][i] + sd[0] * (w+16LL)) >= INT_MAX ||
  369. llabs(sprite_offset[0][i] + sd[1] * (h+16LL)) >= INT_MAX ||
  370. llabs(sprite_offset[0][i] + sd[0] * (w+16LL) + sd[1] * (h+16LL)) >= INT_MAX
  371. ) {
  372. avpriv_request_sample(s->avctx, "Overflow on sprite points");
  373. goto overflow;
  374. }
  375. }
  376. s->real_sprite_warping_points = ctx->num_sprite_warping_points;
  377. }
  /* copy the 64-bit working values into the context (all four [i&1][i>>1]
   * index pairs of the 2x2 arrays are visited) */
  378. for (i = 0; i < 4; i++) {
  379. s->sprite_offset[i&1][i>>1] = sprite_offset[i&1][i>>1];
  380. s->sprite_delta [i&1][i>>1] = sprite_delta [i&1][i>>1];
  381. }
  382. return 0;
  383. overflow:
  384. memset(s->sprite_offset, 0, sizeof(s->sprite_offset));
  385. memset(s->sprite_delta, 0, sizeof(s->sprite_delta));
  386. return AVERROR_PATCHWELCOME;
  387. }
  388. static int decode_new_pred(Mpeg4DecContext *ctx, GetBitContext *gb) {
  389. MpegEncContext *s = &ctx->m;
  390. int len = FFMIN(ctx->time_increment_bits + 3, 15);
  391. get_bits(gb, len);
  392. if (get_bits1(gb))
  393. get_bits(gb, len);
  394. check_marker(s->avctx, gb, "after new_pred");
  395. return 0;
  396. }
  397. /**
  398. * Decode the next video packet.
  399. * @return <0 if something went wrong
  400. */
  401. int ff_mpeg4_decode_video_packet_header(Mpeg4DecContext *ctx)
  402. {
  403. MpegEncContext *s = &ctx->m;
  404. int mb_num_bits = av_log2(s->mb_num - 1) + 1;
  405. int header_extension = 0, mb_num, len;
  406. /* is there enough space left for a video packet + header */
  407. if (get_bits_count(&s->gb) > s->gb.size_in_bits - 20)
  408. return AVERROR_INVALIDDATA;
  409. for (len = 0; len < 32; len++)
  410. if (get_bits1(&s->gb))
  411. break;
  412. if (len != ff_mpeg4_get_video_packet_prefix_length(s)) {
  413. av_log(s->avctx, AV_LOG_ERROR, "marker does not match f_code\n");
  414. return AVERROR_INVALIDDATA;
  415. }
  416. if (ctx->shape != RECT_SHAPE) {
  417. header_extension = get_bits1(&s->gb);
  418. // FIXME more stuff here
  419. }
  420. mb_num = get_bits(&s->gb, mb_num_bits);
  421. if (mb_num >= s->mb_num || !mb_num) {
  422. av_log(s->avctx, AV_LOG_ERROR,
  423. "illegal mb_num in video packet (%d %d) \n", mb_num, s->mb_num);
  424. return AVERROR_INVALIDDATA;
  425. }
  426. s->mb_x = mb_num % s->mb_width;
  427. s->mb_y = mb_num / s->mb_width;
  428. if (ctx->shape != BIN_ONLY_SHAPE) {
  429. int qscale = get_bits(&s->gb, s->quant_precision);
  430. if (qscale)
  431. s->chroma_qscale = s->qscale = qscale;
  432. }
  433. if (ctx->shape == RECT_SHAPE)
  434. header_extension = get_bits1(&s->gb);
  435. if (header_extension) {
  436. int time_incr = 0;
  437. while (get_bits1(&s->gb) != 0)
  438. time_incr++;
  439. check_marker(s->avctx, &s->gb, "before time_increment in video packed header");
  440. skip_bits(&s->gb, ctx->time_increment_bits); /* time_increment */
  441. check_marker(s->avctx, &s->gb, "before vop_coding_type in video packed header");
  442. skip_bits(&s->gb, 2); /* vop coding type */
  443. // FIXME not rect stuff here
  444. if (ctx->shape != BIN_ONLY_SHAPE) {
  445. skip_bits(&s->gb, 3); /* intra dc vlc threshold */
  446. // FIXME don't just ignore everything
  447. if (s->pict_type == AV_PICTURE_TYPE_S &&
  448. ctx->vol_sprite_usage == GMC_SPRITE) {
  449. if (mpeg4_decode_sprite_trajectory(ctx, &s->gb) < 0)
  450. return AVERROR_INVALIDDATA;
  451. av_log(s->avctx, AV_LOG_ERROR, "untested\n");
  452. }
  453. // FIXME reduced res stuff here
  454. if (s->pict_type != AV_PICTURE_TYPE_I) {
  455. int f_code = get_bits(&s->gb, 3); /* fcode_for */
  456. if (f_code == 0)
  457. av_log(s->avctx, AV_LOG_ERROR,
  458. "Error, video packet header damaged (f_code=0)\n");
  459. }
  460. if (s->pict_type == AV_PICTURE_TYPE_B) {
  461. int b_code = get_bits(&s->gb, 3);
  462. if (b_code == 0)
  463. av_log(s->avctx, AV_LOG_ERROR,
  464. "Error, video packet header damaged (b_code=0)\n");
  465. }
  466. }
  467. }
  468. if (ctx->new_pred)
  469. decode_new_pred(ctx, &s->gb);
  470. return 0;
  471. }
  472. static void reset_studio_dc_predictors(MpegEncContext *s)
  473. {
  474. /* Reset DC Predictors */
  475. s->last_dc[0] =
  476. s->last_dc[1] =
  477. s->last_dc[2] = 1 << (s->avctx->bits_per_raw_sample + s->dct_precision + s->intra_dc_precision - 1);
  478. }
  479. /**
  480. * Decode the next video packet.
  481. * @return <0 if something went wrong
  482. */
  483. int ff_mpeg4_decode_studio_slice_header(Mpeg4DecContext *ctx)
  484. {
  485. MpegEncContext *s = &ctx->m;
  486. GetBitContext *gb = &s->gb;
  487. unsigned vlc_len;
  488. uint16_t mb_num;
  489. if (get_bits_left(gb) >= 32 && get_bits_long(gb, 32) == SLICE_START_CODE) {
  490. vlc_len = av_log2(s->mb_width * s->mb_height) + 1;
  491. mb_num = get_bits(gb, vlc_len);
  492. if (mb_num >= s->mb_num)
  493. return AVERROR_INVALIDDATA;
  494. s->mb_x = mb_num % s->mb_width;
  495. s->mb_y = mb_num / s->mb_width;
  496. if (ctx->shape != BIN_ONLY_SHAPE)
  497. s->qscale = mpeg_get_qscale(s);
  498. if (get_bits1(gb)) { /* slice_extension_flag */
  499. skip_bits1(gb); /* intra_slice */
  500. skip_bits1(gb); /* slice_VOP_id_enable */
  501. skip_bits(gb, 6); /* slice_VOP_id */
  502. while (get_bits1(gb)) /* extra_bit_slice */
  503. skip_bits(gb, 8); /* extra_information_slice */
  504. }
  505. reset_studio_dc_predictors(s);
  506. }
  507. else {
  508. return AVERROR_INVALIDDATA;
  509. }
  510. return 0;
  511. }
  512. /**
  513. * Get the average motion vector for a GMC MB.
  514. * @param n either 0 for the x component or 1 for y
  515. * @return the average MV for a GMC MB
  516. */
  517. static inline int get_amv(Mpeg4DecContext *ctx, int n)
  518. {
  519. MpegEncContext *s = &ctx->m;
  520. int x, y, mb_v, sum, dx, dy, shift;
  521. int len = 1 << (s->f_code + 4);
  522. const int a = s->sprite_warping_accuracy;
  523. if (s->workaround_bugs & FF_BUG_AMV)
  524. len >>= s->quarter_sample;
  525. if (s->real_sprite_warping_points == 1) {
  526. if (ctx->divx_version == 500 && ctx->divx_build == 413 && a >= s->quarter_sample)
  527. sum = s->sprite_offset[0][n] / (1 << (a - s->quarter_sample));
  528. else
  529. sum = RSHIFT(s->sprite_offset[0][n] * (1 << s->quarter_sample), a);
  530. } else {
  531. dx = s->sprite_delta[n][0];
  532. dy = s->sprite_delta[n][1];
  533. shift = ctx->sprite_shift[0];
  534. if (n)
  535. dy -= 1 << (shift + a + 1);
  536. else
  537. dx -= 1 << (shift + a + 1);
  538. mb_v = s->sprite_offset[0][n] + dx * s->mb_x * 16U + dy * s->mb_y * 16U;
  539. sum = 0;
  540. for (y = 0; y < 16; y++) {
  541. int v;
  542. v = mb_v + dy * y;
  543. // FIXME optimize
  544. for (x = 0; x < 16; x++) {
  545. sum += v >> shift;
  546. v += dx;
  547. }
  548. }
  549. sum = RSHIFT(sum, a + 8 - s->quarter_sample);
  550. }
  551. if (sum < -len)
  552. sum = -len;
  553. else if (sum >= len)
  554. sum = len - 1;
  555. return sum;
  556. }
  557. /**
  558. * Decode the dc value.
  559. * @param n block index (0-3 are luma, 4-5 are chroma)
  560. * @param dir_ptr the prediction direction will be stored here
  561. * @return the quantized dc
  562. */
  563. static inline int mpeg4_decode_dc(MpegEncContext *s, int n, int *dir_ptr)
  564. {
  565. int level, code;
  566. if (n < 4)
  567. code = get_vlc2(&s->gb, dc_lum.table, DC_VLC_BITS, 1);
  568. else
  569. code = get_vlc2(&s->gb, dc_chrom.table, DC_VLC_BITS, 1);
  570. if (code < 0 || code > 9 /* && s->nbit < 9 */) {
  571. av_log(s->avctx, AV_LOG_ERROR, "illegal dc vlc\n");
  572. return AVERROR_INVALIDDATA;
  573. }
  574. if (code == 0) {
  575. level = 0;
  576. } else {
  577. if (IS_3IV1) {
  578. if (code == 1)
  579. level = 2 * get_bits1(&s->gb) - 1;
  580. else {
  581. if (get_bits1(&s->gb))
  582. level = get_bits(&s->gb, code - 1) + (1 << (code - 1));
  583. else
  584. level = -get_bits(&s->gb, code - 1) - (1 << (code - 1));
  585. }
  586. } else {
  587. level = get_xbits(&s->gb, code);
  588. }
  589. if (code > 8) {
  590. if (get_bits1(&s->gb) == 0) { /* marker */
  591. if (s->avctx->err_recognition & (AV_EF_BITSTREAM|AV_EF_COMPLIANT)) {
  592. av_log(s->avctx, AV_LOG_ERROR, "dc marker bit missing\n");
  593. return AVERROR_INVALIDDATA;
  594. }
  595. }
  596. }
  597. }
  598. return ff_mpeg4_pred_dc(s, n, level, dir_ptr, 0);
  599. }
  600. /**
  601. * Decode first partition.
  *
  * Starting at the current s->mb_x / s->mb_y, macroblocks are decoded until
  * the partition marker is seen (DC_MARKER for I pictures, MOTION_MARKER
  * otherwise) or the bottom of the picture is reached.
  * For I pictures each macroblock contributes its MCBPC, an optional
  * quantiser change and six DC values; for P/S pictures the skip flag, the
  * MCBPC and the motion vectors. The results are stored in s->cbp_table,
  * s->mbintra_table, s->pred_dir_table and the mb_type, qscale_table and
  * motion_val arrays of s->current_picture.
  *
  * @param ctx decoder context
  602. * @return number of MBs decoded or <0 if an error occurred
  603. */
  604. static int mpeg4_decode_partition_a(Mpeg4DecContext *ctx)
  605. {
  606. MpegEncContext *s = &ctx->m;
  607. int mb_num = 0;
  /* quantiser deltas selected by the 2-bit dquant field */
  608. static const int8_t quant_tab[4] = { -1, -2, 1, 2 };
  609. /* decode first partition */
  610. s->first_slice_line = 1;
  611. for (; s->mb_y < s->mb_height; s->mb_y++) {
  612. ff_init_block_index(s);
  613. for (; s->mb_x < s->mb_width; s->mb_x++) {
  614. const int xy = s->mb_x + s->mb_y * s->mb_stride;
  615. int cbpc;
  616. int dir = 0;
  617. mb_num++;
  618. ff_update_block_index(s);
  /* one full row after the resync point the first slice line is over */
  619. if (s->mb_x == s->resync_mb_x && s->mb_y == s->resync_mb_y + 1)
  620. s->first_slice_line = 0;
  621. if (s->pict_type == AV_PICTURE_TYPE_I) {
  622. int i;
  /* cbpc == 8 is read again -- presumably a stuffing code, TODO confirm */
  623. do {
  /* marker reached: the current MB was counted above but not decoded */
  624. if (show_bits(&s->gb, 19) == DC_MARKER)
  625. return mb_num - 1;
  626. cbpc = get_vlc2(&s->gb, ff_h263_intra_MCBPC_vlc.table, INTRA_MCBPC_VLC_BITS, 2);
  627. if (cbpc < 0) {
  628. av_log(s->avctx, AV_LOG_ERROR,
  629. "mcbpc corrupted at %d %d\n", s->mb_x, s->mb_y);
  630. return AVERROR_INVALIDDATA;
  631. }
  632. } while (cbpc == 8);
  633. s->cbp_table[xy] = cbpc & 3;
  634. s->current_picture.mb_type[xy] = MB_TYPE_INTRA;
  635. s->mb_intra = 1;
  /* bit 2 of cbpc signals a quantiser change */
  636. if (cbpc & 4)
  637. ff_set_qscale(s, s->qscale + quant_tab[get_bits(&s->gb, 2)]);
  638. s->current_picture.qscale_table[xy] = s->qscale;
  639. s->mbintra_table[xy] = 1;
  /* decode the six DC values and pack their prediction directions into
   * dir, one bit per block with block 0 in the most significant position */
  640. for (i = 0; i < 6; i++) {
  641. int dc_pred_dir;
  642. int dc = mpeg4_decode_dc(s, i, &dc_pred_dir);
  643. if (dc < 0) {
  644. av_log(s->avctx, AV_LOG_ERROR,
  645. "DC corrupted at %d %d\n", s->mb_x, s->mb_y);
  646. return dc;
  647. }
  648. dir <<= 1;
  649. if (dc_pred_dir)
  650. dir |= 1;
  651. }
  652. s->pred_dir_table[xy] = dir;
  653. } else { /* P/S_TYPE */
  654. int mx, my, pred_x, pred_y, bits;
  655. int16_t *const mot_val = s->current_picture.motion_val[0][s->block_index[0]];
  656. const int stride = s->b8_stride * 2;
  657. try_again:
  658. bits = show_bits(&s->gb, 17);
  /* marker reached: the current MB was counted above but not decoded */
  659. if (bits == MOTION_MARKER)
  660. return mb_num - 1;
  /* the top bit of the 17 peeked bits is the skip flag consumed here */
  661. skip_bits1(&s->gb);
  662. if (bits & 0x10000) {
  663. /* skip mb */
  664. if (s->pict_type == AV_PICTURE_TYPE_S &&
  665. ctx->vol_sprite_usage == GMC_SPRITE) {
  666. s->current_picture.mb_type[xy] = MB_TYPE_SKIP |
  667. MB_TYPE_16x16 |
  668. MB_TYPE_GMC |
  669. MB_TYPE_L0;
  670. mx = get_amv(ctx, 0);
  671. my = get_amv(ctx, 1);
  672. } else {
  673. s->current_picture.mb_type[xy] = MB_TYPE_SKIP |
  674. MB_TYPE_16x16 |
  675. MB_TYPE_L0;
  676. mx = my = 0;
  677. }
  /* store the same vector for all four 8x8 blocks of the MB */
  678. mot_val[0] =
  679. mot_val[2] =
  680. mot_val[0 + stride] =
  681. mot_val[2 + stride] = mx;
  682. mot_val[1] =
  683. mot_val[3] =
  684. mot_val[1 + stride] =
  685. mot_val[3 + stride] = my;
  686. if (s->mbintra_table[xy])
  687. ff_clean_intra_table_entries(s);
  688. continue;
  689. }
  690. cbpc = get_vlc2(&s->gb, ff_h263_inter_MCBPC_vlc.table, INTER_MCBPC_VLC_BITS, 2);
  691. if (cbpc < 0) {
  692. av_log(s->avctx, AV_LOG_ERROR,
  693. "mcbpc corrupted at %d %d\n", s->mb_x, s->mb_y);
  694. return AVERROR_INVALIDDATA;
  695. }
  /* cbpc == 20 restarts the MB -- presumably a stuffing code, TODO confirm */
  696. if (cbpc == 20)
  697. goto try_again;
  698. s->cbp_table[xy] = cbpc & (8 + 3); // 8 is dquant
  699. s->mb_intra = ((cbpc & 4) != 0);
  700. if (s->mb_intra) {
  701. s->current_picture.mb_type[xy] = MB_TYPE_INTRA;
  702. s->mbintra_table[xy] = 1;
  /* intra MBs get zero motion vectors */
  703. mot_val[0] =
  704. mot_val[2] =
  705. mot_val[0 + stride] =
  706. mot_val[2 + stride] = 0;
  707. mot_val[1] =
  708. mot_val[3] =
  709. mot_val[1 + stride] =
  710. mot_val[3 + stride] = 0;
  711. } else {
  712. if (s->mbintra_table[xy])
  713. ff_clean_intra_table_entries(s);
  /* mcsel is only coded for 16x16 MBs of GMC sprite pictures */
  714. if (s->pict_type == AV_PICTURE_TYPE_S &&
  715. ctx->vol_sprite_usage == GMC_SPRITE &&
  716. (cbpc & 16) == 0)
  717. s->mcsel = get_bits1(&s->gb);
  718. else
  719. s->mcsel = 0;
  720. if ((cbpc & 16) == 0) {
  721. /* 16x16 motion prediction */
  722. ff_h263_pred_motion(s, 0, 0, &pred_x, &pred_y);
  723. if (!s->mcsel) {
  /* values >= 0xffff from ff_h263_decode_motion() are treated as errors */
  724. mx = ff_h263_decode_motion(s, pred_x, s->f_code);
  725. if (mx >= 0xffff)
  726. return AVERROR_INVALIDDATA;
  727. my = ff_h263_decode_motion(s, pred_y, s->f_code);
  728. if (my >= 0xffff)
  729. return AVERROR_INVALIDDATA;
  730. s->current_picture.mb_type[xy] = MB_TYPE_16x16 |
  731. MB_TYPE_L0;
  732. } else {
  733. mx = get_amv(ctx, 0);
  734. my = get_amv(ctx, 1);
  735. s->current_picture.mb_type[xy] = MB_TYPE_16x16 |
  736. MB_TYPE_GMC |
  737. MB_TYPE_L0;
  738. }
  739. mot_val[0] =
  740. mot_val[2] =
  741. mot_val[0 + stride] =
  742. mot_val[2 + stride] = mx;
  743. mot_val[1] =
  744. mot_val[3] =
  745. mot_val[1 + stride] =
  746. mot_val[3 + stride] = my;
  747. } else {
  /* four separate vectors, one per 8x8 block */
  748. int i;
  749. s->current_picture.mb_type[xy] = MB_TYPE_8x8 |
  750. MB_TYPE_L0;
  751. for (i = 0; i < 4; i++) {
  /* note: this mot_val shadows the outer one and points at the
   * entry returned by ff_h263_pred_motion() for block i */
  752. int16_t *mot_val = ff_h263_pred_motion(s, i, 0, &pred_x, &pred_y);
  753. mx = ff_h263_decode_motion(s, pred_x, s->f_code);
  754. if (mx >= 0xffff)
  755. return AVERROR_INVALIDDATA;
  756. my = ff_h263_decode_motion(s, pred_y, s->f_code);
  757. if (my >= 0xffff)
  758. return AVERROR_INVALIDDATA;
  759. mot_val[0] = mx;
  760. mot_val[1] = my;
  761. }
  762. }
  763. }
  764. }
  765. }
  /* continue at the left edge of the next row */
  766. s->mb_x = 0;
  767. }
  /* bottom of the picture reached without seeing a marker */
  768. return mb_num;
  769. }
  770. /**
  771. * decode second partition.
  772. * @return <0 if an error occurred
  773. */
  774. static int mpeg4_decode_partition_b(MpegEncContext *s, int mb_count)
  775. {
  776. int mb_num = 0;
  777. static const int8_t quant_tab[4] = { -1, -2, 1, 2 };
  778. s->mb_x = s->resync_mb_x;
  779. s->first_slice_line = 1;
  780. for (s->mb_y = s->resync_mb_y; mb_num < mb_count; s->mb_y++) {
  781. ff_init_block_index(s);
  782. for (; mb_num < mb_count && s->mb_x < s->mb_width; s->mb_x++) {
  783. const int xy = s->mb_x + s->mb_y * s->mb_stride;
  784. mb_num++;
  785. ff_update_block_index(s);
  786. if (s->mb_x == s->resync_mb_x && s->mb_y == s->resync_mb_y + 1)
  787. s->first_slice_line = 0;
  788. if (s->pict_type == AV_PICTURE_TYPE_I) {
  789. int ac_pred = get_bits1(&s->gb);
  790. int cbpy = get_vlc2(&s->gb, ff_h263_cbpy_vlc.table, CBPY_VLC_BITS, 1);
  791. if (cbpy < 0) {
  792. av_log(s->avctx, AV_LOG_ERROR,
  793. "cbpy corrupted at %d %d\n", s->mb_x, s->mb_y);
  794. return AVERROR_INVALIDDATA;
  795. }
  796. s->cbp_table[xy] |= cbpy << 2;
  797. s->current_picture.mb_type[xy] |= ac_pred * MB_TYPE_ACPRED;
  798. } else { /* P || S_TYPE */
  799. if (IS_INTRA(s->current_picture.mb_type[xy])) {
  800. int i;
  801. int dir = 0;
  802. int ac_pred = get_bits1(&s->gb);
  803. int cbpy = get_vlc2(&s->gb, ff_h263_cbpy_vlc.table, CBPY_VLC_BITS, 1);
  804. if (cbpy < 0) {
  805. av_log(s->avctx, AV_LOG_ERROR,
  806. "I cbpy corrupted at %d %d\n", s->mb_x, s->mb_y);
  807. return AVERROR_INVALIDDATA;
  808. }
  809. if (s->cbp_table[xy] & 8)
  810. ff_set_qscale(s, s->qscale + quant_tab[get_bits(&s->gb, 2)]);
  811. s->current_picture.qscale_table[xy] = s->qscale;
  812. for (i = 0; i < 6; i++) {
  813. int dc_pred_dir;
  814. int dc = mpeg4_decode_dc(s, i, &dc_pred_dir);
  815. if (dc < 0) {
  816. av_log(s->avctx, AV_LOG_ERROR,
  817. "DC corrupted at %d %d\n", s->mb_x, s->mb_y);
  818. return dc;
  819. }
  820. dir <<= 1;
  821. if (dc_pred_dir)
  822. dir |= 1;
  823. }
  824. s->cbp_table[xy] &= 3; // remove dquant
  825. s->cbp_table[xy] |= cbpy << 2;
  826. s->current_picture.mb_type[xy] |= ac_pred * MB_TYPE_ACPRED;
  827. s->pred_dir_table[xy] = dir;
  828. } else if (IS_SKIP(s->current_picture.mb_type[xy])) {
  829. s->current_picture.qscale_table[xy] = s->qscale;
  830. s->cbp_table[xy] = 0;
  831. } else {
  832. int cbpy = get_vlc2(&s->gb, ff_h263_cbpy_vlc.table, CBPY_VLC_BITS, 1);
  833. if (cbpy < 0) {
  834. av_log(s->avctx, AV_LOG_ERROR,
  835. "P cbpy corrupted at %d %d\n", s->mb_x, s->mb_y);
  836. return AVERROR_INVALIDDATA;
  837. }
  838. if (s->cbp_table[xy] & 8)
  839. ff_set_qscale(s, s->qscale + quant_tab[get_bits(&s->gb, 2)]);
  840. s->current_picture.qscale_table[xy] = s->qscale;
  841. s->cbp_table[xy] &= 3; // remove dquant
  842. s->cbp_table[xy] |= (cbpy ^ 0xf) << 2;
  843. }
  844. }
  845. }
  846. if (mb_num >= mb_count)
  847. return 0;
  848. s->mb_x = 0;
  849. }
  850. return 0;
  851. }
  852. /**
  853. * Decode the first and second partition.
  854. * @return <0 if error (and sets error type in the error_status_table)
  855. */
  856. int ff_mpeg4_decode_partitions(Mpeg4DecContext *ctx)
  857. {
  858. MpegEncContext *s = &ctx->m;
  859. int mb_num;
  860. int ret;
  861. const int part_a_error = s->pict_type == AV_PICTURE_TYPE_I ? (ER_DC_ERROR | ER_MV_ERROR) : ER_MV_ERROR;
  862. const int part_a_end = s->pict_type == AV_PICTURE_TYPE_I ? (ER_DC_END | ER_MV_END) : ER_MV_END;
  863. mb_num = mpeg4_decode_partition_a(ctx);
  864. if (mb_num <= 0) {
  865. ff_er_add_slice(&s->er, s->resync_mb_x, s->resync_mb_y,
  866. s->mb_x, s->mb_y, part_a_error);
  867. return mb_num ? mb_num : AVERROR_INVALIDDATA;
  868. }
  869. if (s->resync_mb_x + s->resync_mb_y * s->mb_width + mb_num > s->mb_num) {
  870. av_log(s->avctx, AV_LOG_ERROR, "slice below monitor ...\n");
  871. ff_er_add_slice(&s->er, s->resync_mb_x, s->resync_mb_y,
  872. s->mb_x, s->mb_y, part_a_error);
  873. return AVERROR_INVALIDDATA;
  874. }
  875. s->mb_num_left = mb_num;
  876. if (s->pict_type == AV_PICTURE_TYPE_I) {
  877. while (show_bits(&s->gb, 9) == 1)
  878. skip_bits(&s->gb, 9);
  879. if (get_bits(&s->gb, 19) != DC_MARKER) {
  880. av_log(s->avctx, AV_LOG_ERROR,
  881. "marker missing after first I partition at %d %d\n",
  882. s->mb_x, s->mb_y);
  883. return AVERROR_INVALIDDATA;
  884. }
  885. } else {
  886. while (show_bits(&s->gb, 10) == 1)
  887. skip_bits(&s->gb, 10);
  888. if (get_bits(&s->gb, 17) != MOTION_MARKER) {
  889. av_log(s->avctx, AV_LOG_ERROR,
  890. "marker missing after first P partition at %d %d\n",
  891. s->mb_x, s->mb_y);
  892. return AVERROR_INVALIDDATA;
  893. }
  894. }
  895. ff_er_add_slice(&s->er, s->resync_mb_x, s->resync_mb_y,
  896. s->mb_x - 1, s->mb_y, part_a_end);
  897. ret = mpeg4_decode_partition_b(s, mb_num);
  898. if (ret < 0) {
  899. if (s->pict_type == AV_PICTURE_TYPE_P)
  900. ff_er_add_slice(&s->er, s->resync_mb_x, s->resync_mb_y,
  901. s->mb_x, s->mb_y, ER_DC_ERROR);
  902. return ret;
  903. } else {
  904. if (s->pict_type == AV_PICTURE_TYPE_P)
  905. ff_er_add_slice(&s->er, s->resync_mb_x, s->resync_mb_y,
  906. s->mb_x - 1, s->mb_y, ER_DC_END);
  907. }
  908. return 0;
  909. }
/**
 * Decode a block.
 *
 * For intra blocks the DC coefficient is obtained first (read from the
 * bitstream, taken from s->dc_val[] for partitioned frames, or left to DC
 * prediction when the intra DC VLC is not in use). The run/level coded
 * coefficients are then read from s->gb into block[] following the selected
 * scan table, and the index of the last coefficient is stored in
 * s->block_last_index[n].
 *
 * @param ctx   decoder context
 * @param block coefficient array that receives the decoded values
 * @param n     block number; n < 4 selects the luma DC scale, other values
 *              the chroma DC scale
 * @param coded non-zero if run/level coded coefficients are present
 * @param intra non-zero for an intra block
 * @param rvlc  non-zero to use the reversible VLC tables and escape syntax
 * @return <0 if an error occurred
 */
static inline int mpeg4_decode_block(Mpeg4DecContext *ctx, int16_t *block,
                                     int n, int coded, int intra, int rvlc)
{
    MpegEncContext *s = &ctx->m;
    int level, i, last, run, qmul, qadd;
    int av_uninit(dc_pred_dir);
    RLTable *rl;
    RL_VLC_ELEM *rl_vlc;
    const uint8_t *scan_table;

    // Note intra & rvlc should be optimized away if this is inlined

    if (intra) {
        if (ctx->use_intra_dc_vlc) {
            /* DC coef */
            if (s->partitioned_frame) {
                /* The DC value is taken from s->dc_val[] instead of the
                 * bitstream; divide by the DC scale (with rounding) to get
                 * back the level. */
                level = s->dc_val[0][s->block_index[n]];
                if (n < 4)
                    level = FASTDIV((level + (s->y_dc_scale >> 1)), s->y_dc_scale);
                else
                    level = FASTDIV((level + (s->c_dc_scale >> 1)), s->c_dc_scale);
                /* pred_dir_table holds one direction bit per block with
                 * block 0 in bit 5; shifting by n moves block n's bit there */
                dc_pred_dir = (s->pred_dir_table[s->mb_x + s->mb_y * s->mb_stride] << n) & 32;
            } else {
                level = mpeg4_decode_dc(s, n, &dc_pred_dir);
                if (level < 0)
                    return level;
            }
            block[0] = level;
            i = 0;
        } else {
            /* DC is coded like an AC coefficient: start the scan before
             * position 0 and only fetch the prediction direction here */
            i = -1;
            ff_mpeg4_pred_dc(s, n, 0, &dc_pred_dir, 0);
        }
        if (!coded)
            goto not_coded;

        if (rvlc) {
            rl = &ff_rvlc_rl_intra;
            rl_vlc = ff_rvlc_rl_intra.rl_vlc[0];
        } else {
            rl = &ff_mpeg4_rl_intra;
            rl_vlc = ff_mpeg4_rl_intra.rl_vlc[0];
        }
        if (s->ac_pred) {
            if (dc_pred_dir == 0)
                scan_table = s->intra_v_scantable.permutated; /* left */
            else
                scan_table = s->intra_h_scantable.permutated; /* top */
        } else {
            scan_table = s->intra_scantable.permutated;
        }
        /* intra levels are stored unscaled here */
        qmul = 1;
        qadd = 0;
    } else {
        i = -1;
        if (!coded) {
            s->block_last_index[n] = i;
            return 0;
        }
        if (rvlc)
            rl = &ff_rvlc_rl_inter;
        else
            rl = &ff_h263_rl_inter;

        scan_table = s->intra_scantable.permutated;

        if (s->mpeg_quant) {
            qmul = 1;
            qadd = 0;
            if (rvlc)
                rl_vlc = ff_rvlc_rl_inter.rl_vlc[0];
            else
                rl_vlc = ff_h263_rl_inter.rl_vlc[0];
        } else {
            /* select the per-qscale table; qmul/qadd are applied to
             * escape-coded levels below */
            qmul = s->qscale << 1;
            qadd = (s->qscale - 1) | 1;
            if (rvlc)
                rl_vlc = ff_rvlc_rl_inter.rl_vlc[s->qscale];
            else
                rl_vlc = ff_h263_rl_inter.rl_vlc[s->qscale];
        }
    }
    {
        OPEN_READER(re, &s->gb);
        /* NOTE(review): the "last coefficient" flag is carried in i by
         * adding 192 (done explicitly in the escape paths; presumably folded
         * into run by the VLC tables otherwise, cf. the run >> 7 indexing).
         * The i > 62 test at the bottom of the loop detects it. */
        for (;;) {
            UPDATE_CACHE(re, &s->gb);
            GET_RL_VLC(level, run, re, &s->gb, rl_vlc, TEX_VLC_BITS, 2, 0);
            if (level == 0) {
                /* escape */
                if (rvlc) {
                    /* layout read here: marker(1) last(1) run(6) marker(1)
                     * level(11) 5-bit pattern 0x10 sign(1) */
                    if (SHOW_UBITS(re, &s->gb, 1) == 0) {
                        av_log(s->avctx, AV_LOG_ERROR,
                               "1. marker bit missing in rvlc esc\n");
                        return AVERROR_INVALIDDATA;
                    }
                    SKIP_CACHE(re, &s->gb, 1);

                    last = SHOW_UBITS(re, &s->gb, 1);
                    SKIP_CACHE(re, &s->gb, 1);
                    run = SHOW_UBITS(re, &s->gb, 6);
                    SKIP_COUNTER(re, &s->gb, 1 + 1 + 6);
                    UPDATE_CACHE(re, &s->gb);

                    if (SHOW_UBITS(re, &s->gb, 1) == 0) {
                        av_log(s->avctx, AV_LOG_ERROR,
                               "2. marker bit missing in rvlc esc\n");
                        return AVERROR_INVALIDDATA;
                    }
                    SKIP_CACHE(re, &s->gb, 1);

                    level = SHOW_UBITS(re, &s->gb, 11);
                    SKIP_CACHE(re, &s->gb, 11);

                    if (SHOW_UBITS(re, &s->gb, 5) != 0x10) {
                        av_log(s->avctx, AV_LOG_ERROR, "reverse esc missing\n");
                        return AVERROR_INVALIDDATA;
                    }
                    SKIP_CACHE(re, &s->gb, 5);

                    level = level * qmul + qadd;
                    /* apply the sign bit: negate level if the bit is set */
                    level = (level ^ SHOW_SBITS(re, &s->gb, 1)) - SHOW_SBITS(re, &s->gb, 1);
                    SKIP_COUNTER(re, &s->gb, 1 + 11 + 5 + 1);

                    i += run + 1;
                    if (last)
                        i += 192;
                } else {
                    int cache;
                    cache = GET_CACHE(re, &s->gb);

                    if (IS_3IV1)
                        cache ^= 0xC0000000;

                    /* the next two bits select the escape mode */
                    if (cache & 0x80000000) {
                        if (cache & 0x40000000) {
                            /* third escape */
                            SKIP_CACHE(re, &s->gb, 2);
                            last = SHOW_UBITS(re, &s->gb, 1);
                            SKIP_CACHE(re, &s->gb, 1);
                            run = SHOW_UBITS(re, &s->gb, 6);
                            SKIP_COUNTER(re, &s->gb, 2 + 1 + 6);
                            UPDATE_CACHE(re, &s->gb);

                            if (IS_3IV1) {
                                level = SHOW_SBITS(re, &s->gb, 12);
                                LAST_SKIP_BITS(re, &s->gb, 12);
                            } else {
                                /* marker(1) level(12, signed) marker(1);
                                 * missing markers are tolerated when
                                 * AV_EF_IGNORE_ERR is set */
                                if (SHOW_UBITS(re, &s->gb, 1) == 0) {
                                    av_log(s->avctx, AV_LOG_ERROR,
                                           "1. marker bit missing in 3. esc\n");
                                    if (!(s->avctx->err_recognition & AV_EF_IGNORE_ERR))
                                        return AVERROR_INVALIDDATA;
                                }
                                SKIP_CACHE(re, &s->gb, 1);

                                level = SHOW_SBITS(re, &s->gb, 12);
                                SKIP_CACHE(re, &s->gb, 12);

                                if (SHOW_UBITS(re, &s->gb, 1) == 0) {
                                    av_log(s->avctx, AV_LOG_ERROR,
                                           "2. marker bit missing in 3. esc\n");
                                    if (!(s->avctx->err_recognition & AV_EF_IGNORE_ERR))
                                        return AVERROR_INVALIDDATA;
                                }

                                SKIP_COUNTER(re, &s->gb, 1 + 12 + 1);
                            }

#if 0
                            if (s->error_recognition >= FF_ER_COMPLIANT) {
                                const int abs_level= FFABS(level);
                                if (abs_level<=MAX_LEVEL && run<=MAX_RUN) {
                                    const int run1= run - rl->max_run[last][abs_level] - 1;
                                    if (abs_level <= rl->max_level[last][run]) {
                                        av_log(s->avctx, AV_LOG_ERROR, "illegal 3. esc, vlc encoding possible\n");
                                        return AVERROR_INVALIDDATA;
                                    }
                                    if (s->error_recognition > FF_ER_COMPLIANT) {
                                        if (abs_level <= rl->max_level[last][run]*2) {
                                            av_log(s->avctx, AV_LOG_ERROR, "illegal 3. esc, esc 1 encoding possible\n");
                                            return AVERROR_INVALIDDATA;
                                        }
                                        if (run1 >= 0 && abs_level <= rl->max_level[last][run1]) {
                                            av_log(s->avctx, AV_LOG_ERROR, "illegal 3. esc, esc 2 encoding possible\n");
                                            return AVERROR_INVALIDDATA;
                                        }
                                    }
                                }
                            }
#endif
                            if (level > 0)
                                level = level * qmul + qadd;
                            else
                                level = level * qmul - qadd;

                            /* levels outside [-2048, 2047] are clamped; with
                             * AV_EF_BITSTREAM or AV_EF_AGGRESSIVE, anything
                             * beyond +-2560 is rejected instead */
                            if ((unsigned)(level + 2048) > 4095) {
                                if (s->avctx->err_recognition & (AV_EF_BITSTREAM|AV_EF_AGGRESSIVE)) {
                                    if (level > 2560 || level < -2560) {
                                        av_log(s->avctx, AV_LOG_ERROR,
                                               "|level| overflow in 3. esc, qp=%d\n",
                                               s->qscale);
                                        return AVERROR_INVALIDDATA;
                                    }
                                }
                                level = level < 0 ? -2048 : 2047;
                            }

                            i += run + 1;
                            if (last)
                                i += 192;
                        } else {
                            /* second escape */
                            SKIP_BITS(re, &s->gb, 2);
                            GET_RL_VLC(level, run, re, &s->gb, rl_vlc, TEX_VLC_BITS, 2, 1);
                            /* the run is extended by max_run for this level */
                            i += run + rl->max_run[run >> 7][level / qmul] + 1; // FIXME opt indexing
                            level = (level ^ SHOW_SBITS(re, &s->gb, 1)) - SHOW_SBITS(re, &s->gb, 1);
                            LAST_SKIP_BITS(re, &s->gb, 1);
                        }
                    } else {
                        /* first escape */
                        SKIP_BITS(re, &s->gb, 1);
                        GET_RL_VLC(level, run, re, &s->gb, rl_vlc, TEX_VLC_BITS, 2, 1);
                        i += run;
                        /* the level is extended by max_level for this run */
                        level = level + rl->max_level[run >> 7][(run - 1) & 63] * qmul; // FIXME opt indexing
                        level = (level ^ SHOW_SBITS(re, &s->gb, 1)) - SHOW_SBITS(re, &s->gb, 1);
                        LAST_SKIP_BITS(re, &s->gb, 1);
                    }
                }
            } else {
                /* regular code: advance by run and apply the sign bit */
                i += run;
                level = (level ^ SHOW_SBITS(re, &s->gb, 1)) - SHOW_SBITS(re, &s->gb, 1);
                LAST_SKIP_BITS(re, &s->gb, 1);
            }
            ff_tlog(s->avctx, "dct[%d][%d] = %- 4d end?:%d\n", scan_table[i&63]&7, scan_table[i&63] >> 3, level, i>62);
            if (i > 62) {
                /* either the last coefficient (192 was added) or an overrun:
                 * after removing the 192, i must be a valid index 0..63 */
                i -= 192;
                if (i & (~63)) {
                    av_log(s->avctx, AV_LOG_ERROR,
                           "ac-tex damaged at %d %d\n", s->mb_x, s->mb_y);
                    return AVERROR_INVALIDDATA;
                }

                block[scan_table[i]] = level;
                break;
            }

            block[scan_table[i]] = level;
        }
        CLOSE_READER(re, &s->gb);
    }

not_coded:
    if (intra) {
        if (!ctx->use_intra_dc_vlc) {
            /* block[0] currently holds what was decoded at scan position 0
             * (or 0); replace it with the result of DC prediction */
            block[0] = ff_mpeg4_pred_dc(s, n, block[0], &dc_pred_dir, 0);

            i -= i >> 31;  // if (i == -1) i = 0;
        }

        ff_mpeg4_pred_ac(s, block, n, dc_pred_dir);
        if (s->ac_pred)
            i = 63;  // FIXME not optimal
    }
    s->block_last_index[n] = i;
    return 0;
}
  1155. /**
  1156. * decode partition C of one MB.
  1157. * @return <0 if an error occurred
  1158. */
  1159. static int mpeg4_decode_partitioned_mb(MpegEncContext *s, int16_t block[6][64])
  1160. {
  1161. Mpeg4DecContext *ctx = s->avctx->priv_data;
  1162. int cbp, mb_type;
  1163. const int xy = s->mb_x + s->mb_y * s->mb_stride;
  1164. av_assert2(s == (void*)ctx);
  1165. mb_type = s->current_picture.mb_type[xy];
  1166. cbp = s->cbp_table[xy];
  1167. ctx->use_intra_dc_vlc = s->qscale < ctx->intra_dc_threshold;
  1168. if (s->current_picture.qscale_table[xy] != s->qscale)
  1169. ff_set_qscale(s, s->current_picture.qscale_table[xy]);
  1170. if (s->pict_type == AV_PICTURE_TYPE_P ||
  1171. s->pict_type == AV_PICTURE_TYPE_S) {
  1172. int i;
  1173. for (i = 0; i < 4; i++) {
  1174. s->mv[0][i][0] = s->current_picture.motion_val[0][s->block_index[i]][0];
  1175. s->mv[0][i][1] = s->current_picture.motion_val[0][s->block_index[i]][1];
  1176. }
  1177. s->mb_intra = IS_INTRA(mb_type);
  1178. if (IS_SKIP(mb_type)) {
  1179. /* skip mb */
  1180. for (i = 0; i < 6; i++)
  1181. s->block_last_index[i] = -1;
  1182. s->mv_dir = MV_DIR_FORWARD;
  1183. s->mv_type = MV_TYPE_16X16;
  1184. if (s->pict_type == AV_PICTURE_TYPE_S
  1185. && ctx->vol_sprite_usage == GMC_SPRITE) {
  1186. s->mcsel = 1;
  1187. s->mb_skipped = 0;
  1188. } else {
  1189. s->mcsel = 0;
  1190. s->mb_skipped = 1;
  1191. }
  1192. } else if (s->mb_intra) {
  1193. s->ac_pred = IS_ACPRED(s->current_picture.mb_type[xy]);
  1194. } else if (!s->mb_intra) {
  1195. // s->mcsel = 0; // FIXME do we need to init that?
  1196. s->mv_dir = MV_DIR_FORWARD;
  1197. if (IS_8X8(mb_type)) {
  1198. s->mv_type = MV_TYPE_8X8;
  1199. } else {
  1200. s->mv_type = MV_TYPE_16X16;
  1201. }
  1202. }
  1203. } else { /* I-Frame */
  1204. s->mb_intra = 1;
  1205. s->ac_pred = IS_ACPRED(s->current_picture.mb_type[xy]);
  1206. }
  1207. if (!IS_SKIP(mb_type)) {
  1208. int i;
  1209. s->bdsp.clear_blocks(s->block[0]);
  1210. /* decode each block */
  1211. for (i = 0; i < 6; i++) {
  1212. if (mpeg4_decode_block(ctx, block[i], i, cbp & 32, s->mb_intra, ctx->rvlc) < 0) {
  1213. av_log(s->avctx, AV_LOG_ERROR,
  1214. "texture corrupted at %d %d %d\n",
  1215. s->mb_x, s->mb_y, s->mb_intra);
  1216. return AVERROR_INVALIDDATA;
  1217. }
  1218. cbp += cbp;
  1219. }
  1220. }
  1221. /* per-MB end of slice check */
  1222. if (--s->mb_num_left <= 0) {
  1223. if (mpeg4_is_resync(ctx))
  1224. return SLICE_END;
  1225. else
  1226. return SLICE_NOEND;
  1227. } else {
  1228. if (mpeg4_is_resync(ctx)) {
  1229. const int delta = s->mb_x + 1 == s->mb_width ? 2 : 1;
  1230. if (s->cbp_table[xy + delta])
  1231. return SLICE_END;
  1232. }
  1233. return SLICE_OK;
  1234. }
  1235. }
/**
 * Decode one macroblock of a non-partitioned frame.
 *
 * Parses the macroblock header for the current s->pict_type (P/S, B or I),
 * sets up the motion vectors and macroblock type in the context, decodes
 * the six blocks and finally checks whether the slice ends here.
 *
 * @param s     decoder context
 * @param block coefficient storage for the six blocks of the macroblock
 * @return SLICE_OK or SLICE_END, <0 if an error occurred
 */
static int mpeg4_decode_mb(MpegEncContext *s, int16_t block[6][64])
{
    Mpeg4DecContext *ctx = s->avctx->priv_data;
    int cbpc, cbpy, i, cbp, pred_x, pred_y, mx, my, dquant;
    int16_t *mot_val;
    /* qscale delta selected by the 2-bit dquant code */
    static const int8_t quant_tab[4] = { -1, -2, 1, 2 };
    const int xy = s->mb_x + s->mb_y * s->mb_stride;

    av_assert2(s == (void*)ctx);
    av_assert2(s->h263_pred);

    if (s->pict_type == AV_PICTURE_TYPE_P ||
        s->pict_type == AV_PICTURE_TYPE_S) {
        do {
            if (get_bits1(&s->gb)) {
                /* skip mb */
                s->mb_intra = 0;
                for (i = 0; i < 6; i++)
                    s->block_last_index[i] = -1;
                s->mv_dir = MV_DIR_FORWARD;
                s->mv_type = MV_TYPE_16X16;
                if (s->pict_type == AV_PICTURE_TYPE_S &&
                    ctx->vol_sprite_usage == GMC_SPRITE) {
                    s->current_picture.mb_type[xy] = MB_TYPE_SKIP |
                                                     MB_TYPE_GMC |
                                                     MB_TYPE_16x16 |
                                                     MB_TYPE_L0;
                    s->mcsel = 1;
                    s->mv[0][0][0] = get_amv(ctx, 0);
                    s->mv[0][0][1] = get_amv(ctx, 1);
                    s->mb_skipped = 0;
                } else {
                    s->current_picture.mb_type[xy] = MB_TYPE_SKIP |
                                                     MB_TYPE_16x16 |
                                                     MB_TYPE_L0;
                    s->mcsel = 0;
                    s->mv[0][0][0] = 0;
                    s->mv[0][0][1] = 0;
                    s->mb_skipped = 1;
                }
                goto end;
            }
            cbpc = get_vlc2(&s->gb, ff_h263_inter_MCBPC_vlc.table, INTER_MCBPC_VLC_BITS, 2);
            if (cbpc < 0) {
                av_log(s->avctx, AV_LOG_ERROR,
                       "mcbpc damaged at %d %d\n", s->mb_x, s->mb_y);
                return AVERROR_INVALIDDATA;
            }
        } while (cbpc == 20); /* NOTE(review): 20 is presumably the stuffing code */

        s->bdsp.clear_blocks(s->block[0]);
        dquant = cbpc & 8;
        s->mb_intra = ((cbpc & 4) != 0);
        if (s->mb_intra)
            goto intra;

        /* mcsel is only read for S pictures with GMC when bit 4 of cbpc
         * (the 8x8 flag tested below) is clear */
        if (s->pict_type == AV_PICTURE_TYPE_S &&
            ctx->vol_sprite_usage == GMC_SPRITE && (cbpc & 16) == 0)
            s->mcsel = get_bits1(&s->gb);
        else
            s->mcsel = 0;
        cbpy = get_vlc2(&s->gb, ff_h263_cbpy_vlc.table, CBPY_VLC_BITS, 1) ^ 0x0F;
        if (cbpy < 0) {
            av_log(s->avctx, AV_LOG_ERROR,
                   "P cbpy damaged at %d %d\n", s->mb_x, s->mb_y);
            return AVERROR_INVALIDDATA;
        }

        cbp = (cbpc & 3) | (cbpy << 2);
        if (dquant)
            ff_set_qscale(s, s->qscale + quant_tab[get_bits(&s->gb, 2)]);
        if ((!s->progressive_sequence) &&
            (cbp || (s->workaround_bugs & FF_BUG_XVID_ILACE)))
            s->interlaced_dct = get_bits1(&s->gb);

        s->mv_dir = MV_DIR_FORWARD;
        if ((cbpc & 16) == 0) {
            if (s->mcsel) {
                s->current_picture.mb_type[xy] = MB_TYPE_GMC |
                                                 MB_TYPE_16x16 |
                                                 MB_TYPE_L0;
                /* 16x16 global motion prediction */
                s->mv_type = MV_TYPE_16X16;
                mx = get_amv(ctx, 0);
                my = get_amv(ctx, 1);
                s->mv[0][0][0] = mx;
                s->mv[0][0][1] = my;
            } else if ((!s->progressive_sequence) && get_bits1(&s->gb)) {
                s->current_picture.mb_type[xy] = MB_TYPE_16x8 |
                                                 MB_TYPE_L0 |
                                                 MB_TYPE_INTERLACED;
                /* 16x8 field motion prediction */
                s->mv_type = MV_TYPE_FIELD;

                s->field_select[0][0] = get_bits1(&s->gb);
                s->field_select[0][1] = get_bits1(&s->gb);

                ff_h263_pred_motion(s, 0, 0, &pred_x, &pred_y);

                for (i = 0; i < 2; i++) {
                    /* a result >= 0xffff is treated as a decoding error */
                    mx = ff_h263_decode_motion(s, pred_x, s->f_code);
                    if (mx >= 0xffff)
                        return AVERROR_INVALIDDATA;

                    my = ff_h263_decode_motion(s, pred_y / 2, s->f_code);
                    if (my >= 0xffff)
                        return AVERROR_INVALIDDATA;

                    s->mv[0][i][0] = mx;
                    s->mv[0][i][1] = my;
                }
            } else {
                s->current_picture.mb_type[xy] = MB_TYPE_16x16 | MB_TYPE_L0;
                /* 16x16 motion prediction */
                s->mv_type = MV_TYPE_16X16;
                ff_h263_pred_motion(s, 0, 0, &pred_x, &pred_y);
                mx = ff_h263_decode_motion(s, pred_x, s->f_code);

                if (mx >= 0xffff)
                    return AVERROR_INVALIDDATA;

                my = ff_h263_decode_motion(s, pred_y, s->f_code);

                if (my >= 0xffff)
                    return AVERROR_INVALIDDATA;
                s->mv[0][0][0] = mx;
                s->mv[0][0][1] = my;
            }
        } else {
            /* four motion vectors, one per 8x8 luma block */
            s->current_picture.mb_type[xy] = MB_TYPE_8x8 | MB_TYPE_L0;
            s->mv_type = MV_TYPE_8X8;
            for (i = 0; i < 4; i++) {
                mot_val = ff_h263_pred_motion(s, i, 0, &pred_x, &pred_y);
                mx = ff_h263_decode_motion(s, pred_x, s->f_code);
                if (mx >= 0xffff)
                    return AVERROR_INVALIDDATA;

                my = ff_h263_decode_motion(s, pred_y, s->f_code);
                if (my >= 0xffff)
                    return AVERROR_INVALIDDATA;
                s->mv[0][i][0] = mx;
                s->mv[0][i][1] = my;
                /* store the vector through the pointer returned by the
                 * predictor */
                mot_val[0] = mx;
                mot_val[1] = my;
            }
        }
    } else if (s->pict_type == AV_PICTURE_TYPE_B) {
        int modb1;   // first bit of modb
        int modb2;   // second bit of modb
        int mb_type;

        s->mb_intra = 0;  // B-frames never contain intra blocks
        s->mcsel = 0;  // ... true gmc blocks

        if (s->mb_x == 0) {
            /* reset the motion vector predictors at the start of each row */
            for (i = 0; i < 2; i++) {
                s->last_mv[i][0][0] =
                s->last_mv[i][0][1] =
                s->last_mv[i][1][0] =
                s->last_mv[i][1][1] = 0;
            }

            ff_thread_await_progress(&s->next_picture_ptr->tf, s->mb_y, 0);
        }

        /* if we skipped it in the future P-frame then skip it now too */
        s->mb_skipped = s->next_picture.mbskip_table[s->mb_y * s->mb_stride + s->mb_x];  // Note, skiptab=0 if last was GMC

        if (s->mb_skipped) {
            /* skip mb */
            for (i = 0; i < 6; i++)
                s->block_last_index[i] = -1;

            s->mv_dir = MV_DIR_FORWARD;
            s->mv_type = MV_TYPE_16X16;
            s->mv[0][0][0] =
            s->mv[0][0][1] =
            s->mv[1][0][0] =
            s->mv[1][0][1] = 0;
            s->current_picture.mb_type[xy] = MB_TYPE_SKIP |
                                             MB_TYPE_16x16 |
                                             MB_TYPE_L0;
            goto end;
        }

        modb1 = get_bits1(&s->gb);
        if (modb1) {
            // like MB_TYPE_B_DIRECT but no vectors coded
            mb_type = MB_TYPE_DIRECT2 | MB_TYPE_SKIP | MB_TYPE_L0L1;
            cbp = 0;
        } else {
            modb2 = get_bits1(&s->gb);
            mb_type = get_vlc2(&s->gb, mb_type_b_vlc.table, MB_TYPE_B_VLC_BITS, 1);
            if (mb_type < 0) {
                av_log(s->avctx, AV_LOG_ERROR, "illegal MB_type\n");
                return AVERROR_INVALIDDATA;
            }
            mb_type = mb_type_b_map[mb_type];
            /* modb2 set means no cbp is coded */
            if (modb2) {
                cbp = 0;
            } else {
                s->bdsp.clear_blocks(s->block[0]);
                cbp = get_bits(&s->gb, 6);
            }

            /* optional dquant: a flag bit followed by one bit selecting
             * -2 or +2 */
            if ((!IS_DIRECT(mb_type)) && cbp) {
                if (get_bits1(&s->gb))
                    ff_set_qscale(s, s->qscale + get_bits1(&s->gb) * 4 - 2);
            }

            if (!s->progressive_sequence) {
                if (cbp)
                    s->interlaced_dct = get_bits1(&s->gb);

                if (!IS_DIRECT(mb_type) && get_bits1(&s->gb)) {
                    mb_type |= MB_TYPE_16x8 | MB_TYPE_INTERLACED;
                    mb_type &= ~MB_TYPE_16x16;

                    if (USES_LIST(mb_type, 0)) {
                        s->field_select[0][0] = get_bits1(&s->gb);
                        s->field_select[0][1] = get_bits1(&s->gb);
                    }
                    if (USES_LIST(mb_type, 1)) {
                        s->field_select[1][0] = get_bits1(&s->gb);
                        s->field_select[1][1] = get_bits1(&s->gb);
                    }
                }
            }

            s->mv_dir = 0;
            if ((mb_type & (MB_TYPE_DIRECT2 | MB_TYPE_INTERLACED)) == 0) {
                /* frame prediction: one vector per used list, predicted
                 * from s->last_mv */
                s->mv_type = MV_TYPE_16X16;

                if (USES_LIST(mb_type, 0)) {
                    s->mv_dir = MV_DIR_FORWARD;

                    mx = ff_h263_decode_motion(s, s->last_mv[0][0][0], s->f_code);
                    my = ff_h263_decode_motion(s, s->last_mv[0][0][1], s->f_code);
                    s->last_mv[0][1][0] =
                    s->last_mv[0][0][0] =
                    s->mv[0][0][0] = mx;
                    s->last_mv[0][1][1] =
                    s->last_mv[0][0][1] =
                    s->mv[0][0][1] = my;
                }

                if (USES_LIST(mb_type, 1)) {
                    s->mv_dir |= MV_DIR_BACKWARD;

                    mx = ff_h263_decode_motion(s, s->last_mv[1][0][0], s->b_code);
                    my = ff_h263_decode_motion(s, s->last_mv[1][0][1], s->b_code);
                    s->last_mv[1][1][0] =
                    s->last_mv[1][0][0] =
                    s->mv[1][0][0] = mx;
                    s->last_mv[1][1][1] =
                    s->last_mv[1][0][1] =
                    s->mv[1][0][1] = my;
                }
            } else if (!IS_DIRECT(mb_type)) {
                /* field prediction: two vectors per used list; the vertical
                 * predictor is halved on input and the stored one doubled */
                s->mv_type = MV_TYPE_FIELD;

                if (USES_LIST(mb_type, 0)) {
                    s->mv_dir = MV_DIR_FORWARD;

                    for (i = 0; i < 2; i++) {
                        mx = ff_h263_decode_motion(s, s->last_mv[0][i][0], s->f_code);
                        my = ff_h263_decode_motion(s, s->last_mv[0][i][1] / 2, s->f_code);
                        s->last_mv[0][i][0] =
                        s->mv[0][i][0] = mx;
                        s->last_mv[0][i][1] = (s->mv[0][i][1] = my) * 2;
                    }
                }

                if (USES_LIST(mb_type, 1)) {
                    s->mv_dir |= MV_DIR_BACKWARD;

                    for (i = 0; i < 2; i++) {
                        mx = ff_h263_decode_motion(s, s->last_mv[1][i][0], s->b_code);
                        my = ff_h263_decode_motion(s, s->last_mv[1][i][1] / 2, s->b_code);
                        s->last_mv[1][i][0] =
                        s->mv[1][i][0] = mx;
                        s->last_mv[1][i][1] = (s->mv[1][i][1] = my) * 2;
                    }
                }
            }
        }

        if (IS_DIRECT(mb_type)) {
            /* direct mode: a delta vector (zero for skipped MBs) is passed
             * to ff_mpeg4_set_direct_mv(), whose result is merged into
             * mb_type */
            if (IS_SKIP(mb_type)) {
                mx =
                my = 0;
            } else {
                mx = ff_h263_decode_motion(s, 0, 1);
                my = ff_h263_decode_motion(s, 0, 1);
            }

            s->mv_dir = MV_DIR_FORWARD | MV_DIR_BACKWARD | MV_DIRECT;
            mb_type |= ff_mpeg4_set_direct_mv(s, mx, my);
        }
        s->current_picture.mb_type[xy] = mb_type;
    } else { /* I-Frame */
        do {
            cbpc = get_vlc2(&s->gb, ff_h263_intra_MCBPC_vlc.table, INTRA_MCBPC_VLC_BITS, 2);
            if (cbpc < 0) {
                av_log(s->avctx, AV_LOG_ERROR,
                       "I cbpc damaged at %d %d\n", s->mb_x, s->mb_y);
                return AVERROR_INVALIDDATA;
            }
        } while (cbpc == 8); /* NOTE(review): 8 is presumably the stuffing code */

        dquant = cbpc & 4;
        s->mb_intra = 1;

        /* also entered from the P/S branch above for intra macroblocks */
intra:
        s->ac_pred = get_bits1(&s->gb);
        if (s->ac_pred)
            s->current_picture.mb_type[xy] = MB_TYPE_INTRA | MB_TYPE_ACPRED;
        else
            s->current_picture.mb_type[xy] = MB_TYPE_INTRA;

        cbpy = get_vlc2(&s->gb, ff_h263_cbpy_vlc.table, CBPY_VLC_BITS, 1);
        if (cbpy < 0) {
            av_log(s->avctx, AV_LOG_ERROR,
                   "I cbpy damaged at %d %d\n", s->mb_x, s->mb_y);
            return AVERROR_INVALIDDATA;
        }
        cbp = (cbpc & 3) | (cbpy << 2);

        /* evaluated with the qscale in effect before dquant is applied */
        ctx->use_intra_dc_vlc = s->qscale < ctx->intra_dc_threshold;

        if (dquant)
            ff_set_qscale(s, s->qscale + quant_tab[get_bits(&s->gb, 2)]);

        if (!s->progressive_sequence)
            s->interlaced_dct = get_bits1(&s->gb);

        s->bdsp.clear_blocks(s->block[0]);
        /* decode each block */
        for (i = 0; i < 6; i++) {
            if (mpeg4_decode_block(ctx, block[i], i, cbp & 32, 1, 0) < 0)
                return AVERROR_INVALIDDATA;
            /* move the next block's coded flag into bit 5 */
            cbp += cbp;
        }
        goto end;
    }

    /* decode each block */
    for (i = 0; i < 6; i++) {
        if (mpeg4_decode_block(ctx, block[i], i, cbp & 32, 0, 0) < 0)
            return AVERROR_INVALIDDATA;
        /* move the next block's coded flag into bit 5 */
        cbp += cbp;
    }

end:
    /* per-MB end of slice check */
    if (s->codec_id == AV_CODEC_ID_MPEG4) {
        /* non-zero if a resync marker follows; the value is compared with
         * the number of the next macroblock below */
        int next = mpeg4_is_resync(ctx);
        if (next) {
            if (s->mb_x + s->mb_y*s->mb_width + 1 > next && (s->avctx->err_recognition & AV_EF_AGGRESSIVE)) {
                return AVERROR_INVALIDDATA;
            } else if (s->mb_x + s->mb_y*s->mb_width + 1 >= next)
                return SLICE_END;

            if (s->pict_type == AV_PICTURE_TYPE_B) {
                const int delta= s->mb_x + 1 == s->mb_width ? 2 : 1;
                /* wait for the row of the next picture that holds the entry
                 * inspected below */
                ff_thread_await_progress(&s->next_picture_ptr->tf,
                                         (s->mb_x + delta >= s->mb_width)
                                         ? FFMIN(s->mb_y + 1, s->mb_height - 1)
                                         : s->mb_y, 0);
                /* the following macroblock is skipped in the next picture:
                 * do not end the slice here */
                if (s->next_picture.mbskip_table[xy + delta])
                    return SLICE_OK;
            }

            return SLICE_END;
        }
    }

    return SLICE_OK;
}
  1566. /* As per spec, studio start code search isn't the same as the old type of start code */
  1567. static void next_start_code_studio(GetBitContext *gb)
  1568. {
  1569. align_get_bits(gb);
  1570. while (get_bits_left(gb) >= 24 && show_bits(gb, 24) != 0x1) {
  1571. get_bits(gb, 8);
  1572. }
  1573. }
  1574. /* additional_code, vlc index */
  1575. static const uint8_t ac_state_tab[22][2] =
  1576. {
  1577. {0, 0},
  1578. {0, 1},
  1579. {1, 1},
  1580. {2, 1},
  1581. {3, 1},
  1582. {4, 1},
  1583. {5, 1},
  1584. {1, 2},
  1585. {2, 2},
  1586. {3, 2},
  1587. {4, 2},
  1588. {5, 2},
  1589. {6, 2},
  1590. {1, 3},
  1591. {2, 4},
  1592. {3, 5},
  1593. {4, 6},
  1594. {5, 7},
  1595. {6, 8},
  1596. {7, 9},
  1597. {8, 10},
  1598. {0, 11}
  1599. };
/**
 * Decode one intra block of a studio profile macroblock.
 *
 * Reads the DC difference, adds it to the running predictor s->last_dc[],
 * then reads group-coded AC coefficients until the end-of-block group.
 * Every coefficient is scaled, clipped to [min, max] and folded into a
 * parity value that finally toggles the least significant bit of block[63].
 *
 * @param s     decoder context
 * @param block receives the 64 coefficients; cleared on entry
 * @param n     block number; n < 4 uses the luma DC table and intra matrix,
 *              other values the chroma intra matrix
 * @return 0 on success, <0 if an error occurred
 */
static int mpeg4_decode_studio_block(MpegEncContext *s, int32_t block[64], int n)
{
    Mpeg4DecContext *ctx = s->avctx->priv_data;

    int cc, dct_dc_size, dct_diff, code, j, idx = 1, group = 0, run = 0,
        additional_code_len, sign, mismatch;
    const VLC *cur_vlc = &studio_intra_tab[0];
    uint8_t *const scantable = s->intra_scantable.permutated;
    const uint16_t *quant_matrix;
    uint32_t flc;
    /* clipping range of the coefficients: [-2^(bits + 6), 2^(bits + 6) - 1] */
    const int min = -1 * (1 << (s->avctx->bits_per_raw_sample + 6));
    const int max = ((1 << (s->avctx->bits_per_raw_sample + 6)) - 1);
    int shift = 3 - s->dct_precision;

    mismatch = 1;

    memset(block, 0, 64 * sizeof(int32_t));

    /* cc selects the DC predictor: 0 for n < 4, otherwise 1 or 2 depending
     * on the parity of n */
    if (n < 4) {
        cc = 0;
        dct_dc_size = get_vlc2(&s->gb, studio_luma_dc.table, STUDIO_INTRA_BITS, 2);
        quant_matrix = s->intra_matrix;
    } else {
        cc = (n & 1) + 1;
        /* with ctx->rgb set, the luma DC table is used for all blocks */
        if (ctx->rgb)
            dct_dc_size = get_vlc2(&s->gb, studio_luma_dc.table, STUDIO_INTRA_BITS, 2);
        else
            dct_dc_size = get_vlc2(&s->gb, studio_chroma_dc.table, STUDIO_INTRA_BITS, 2);
        quant_matrix = s->chroma_intra_matrix;
    }

    if (dct_dc_size == 0) {
        dct_diff = 0;
    } else {
        dct_diff = get_xbits(&s->gb, dct_dc_size);

        /* differences longer than 8 bits are followed by a marker bit */
        if (dct_dc_size > 8) {
            if(!check_marker(s->avctx, &s->gb, "dct_dc_size > 8"))
                return AVERROR_INVALIDDATA;
        }

    }

    s->last_dc[cc] += dct_diff;

    if (s->mpeg_quant)
        block[0] = s->last_dc[cc] * (8 >> s->intra_dc_precision);
    else
        block[0] = s->last_dc[cc] * (8 >> s->intra_dc_precision) * (8 >> s->dct_precision);
    /* TODO: support mpeg_quant for AC coefficients */

    block[0] = av_clip(block[0], min, max);
    mismatch ^= block[0];

    /* AC Coefficients */
    while (1) {
        group = get_vlc2(&s->gb, cur_vlc->table, STUDIO_INTRA_BITS, 2);

        if (group < 0) {
            av_log(s->avctx, AV_LOG_ERROR, "illegal ac coefficient group vlc\n");
            return AVERROR_INVALIDDATA;
        }

        /* the group fixes both the length of its additional code and the
         * VLC table used to read the next group */
        additional_code_len = ac_state_tab[group][0];
        cur_vlc = &studio_intra_tab[ac_state_tab[group][1]];

        if (group == 0) {
            /* End of Block */
            break;
        } else if (group >= 1 && group <= 6) {
            /* Zero run length (Table B.47) */
            run = 1 << additional_code_len;
            if (additional_code_len)
                run += get_bits(&s->gb, additional_code_len);
            idx += run;
            /* no coefficient was produced: skip the scaling below */
            continue;
        } else if (group >= 7 && group <= 12) {
            /* Zero run length and +/-1 level (Table B.48) */
            code = get_bits(&s->gb, additional_code_len);
            /* lowest bit is the sign, the remaining bits extend the run */
            sign = code & 1;
            code >>= 1;
            run = (1 << (additional_code_len - 1)) + code;
            idx += run;
            if (idx > 63)
                return AVERROR_INVALIDDATA;
            j = scantable[idx++];
            block[j] = sign ? 1 : -1;
        } else if (group >= 13 && group <= 20) {
            /* Level value (Table B.49) */
            if (idx > 63)
                return AVERROR_INVALIDDATA;
            j = scantable[idx++];
            block[j] = get_xbits(&s->gb, additional_code_len);
        } else if (group == 21) {
            /* Escape */
            if (idx > 63)
                return AVERROR_INVALIDDATA;
            j = scantable[idx++];
            additional_code_len = s->avctx->bits_per_raw_sample + s->dct_precision + 4;
            flc = get_bits(&s->gb, additional_code_len);
            /* fixed length code in two's complement: if the top bit is set,
             * invert, add one and negate */
            if (flc >> (additional_code_len-1))
                block[j] = -1 * (( flc ^ ((1 << additional_code_len) -1)) + 1);
            else
                block[j] = flc;
        }
        /* scale by the quantiser matrix entry, qscale and 2^shift / 16 */
        block[j] = ((block[j] * quant_matrix[j] * s->qscale) * (1 << shift)) / 16;
        block[j] = av_clip(block[j], min, max);
        mismatch ^= block[j];
    }

    /* toggle the LSB of the last coefficient according to the parity
     * accumulated over all coefficients */
    block[63] ^= mismatch & 1;

    return 0;
}
  1698. static int mpeg4_decode_dpcm_macroblock(MpegEncContext *s, int16_t macroblock[256], int n)
  1699. {
  1700. int i, j, w, h, idx = 0;
  1701. int block_mean, rice_parameter, rice_prefix_code, rice_suffix_code,
  1702. dpcm_residual, left, top, topleft, min_left_top, max_left_top, p, p2, output;
  1703. h = 16 >> (n ? s->chroma_y_shift : 0);
  1704. w = 16 >> (n ? s->chroma_x_shift : 0);
  1705. block_mean = get_bits(&s->gb, s->avctx->bits_per_raw_sample);
  1706. if (block_mean == 0){
  1707. av_log(s->avctx, AV_LOG_ERROR, "Forbidden block_mean\n");
  1708. return AVERROR_INVALIDDATA;
  1709. }
  1710. s->last_dc[n] = block_mean * (1 << (s->dct_precision + s->intra_dc_precision));
  1711. rice_parameter = get_bits(&s->gb, 4);
  1712. if (rice_parameter == 0) {
  1713. av_log(s->avctx, AV_LOG_ERROR, "Forbidden rice_parameter\n");
  1714. return AVERROR_INVALIDDATA;
  1715. }
  1716. if (rice_parameter == 15)
  1717. rice_parameter = 0;
  1718. if (rice_parameter > 11) {
  1719. av_log(s->avctx, AV_LOG_ERROR, "Forbidden rice_parameter\n");
  1720. return AVERROR_INVALIDDATA;
  1721. }
  1722. for (i = 0; i < h; i++) {
  1723. output = 1 << (s->avctx->bits_per_raw_sample - 1);
  1724. top = 1 << (s->avctx->bits_per_raw_sample - 1);
  1725. for (j = 0; j < w; j++) {
  1726. left = output;
  1727. topleft = top;
  1728. rice_prefix_code = get_unary(&s->gb, 1, 12);
  1729. /* Escape */
  1730. if (rice_prefix_code == 11)
  1731. dpcm_residual = get_bits(&s->gb, s->avctx->bits_per_raw_sample);
  1732. else {
  1733. if (rice_prefix_code == 12) {
  1734. av_log(s->avctx, AV_LOG_ERROR, "Forbidden rice_prefix_code\n");
  1735. return AVERROR_INVALIDDATA;
  1736. }
  1737. rice_suffix_code = get_bitsz(&s->gb, rice_parameter);
  1738. dpcm_residual = (rice_prefix_code << rice_parameter) + rice_suffix_code;
  1739. }
  1740. /* Map to a signed residual */
  1741. if (dpcm_residual & 1)
  1742. dpcm_residual = (-1 * dpcm_residual) >> 1;
  1743. else
  1744. dpcm_residual = (dpcm_residual >> 1);
  1745. if (i != 0)
  1746. top = macroblock[idx-w];
  1747. p = left + top - topleft;
  1748. min_left_top = FFMIN(left, top);
  1749. if (p < min_left_top)
  1750. p = min_left_top;
  1751. max_left_top = FFMAX(left, top);
  1752. if (p > max_left_top)
  1753. p = max_left_top;
  1754. p2 = (FFMIN(min_left_top, topleft) + FFMAX(max_left_top, topleft)) >> 1;
  1755. if (p2 == p)
  1756. p2 = block_mean;
  1757. if (p2 > p)
  1758. dpcm_residual *= -1;
  1759. macroblock[idx++] = output = (dpcm_residual + p) & ((1 << s->avctx->bits_per_raw_sample) - 1);
  1760. }
  1761. }
  1762. return 0;
  1763. }
  1764. static int mpeg4_decode_studio_mb(MpegEncContext *s, int16_t block_[12][64])
  1765. {
  1766. int i;
  1767. s->dpcm_direction = 0;
  1768. /* StudioMacroblock */
  1769. /* Assumes I-VOP */
  1770. s->mb_intra = 1;
  1771. if (get_bits1(&s->gb)) { /* compression_mode */
  1772. /* DCT */
  1773. /* macroblock_type, 1 or 2-bit VLC */
  1774. if (!get_bits1(&s->gb)) {
  1775. skip_bits1(&s->gb);
  1776. s->qscale = mpeg_get_qscale(s);
  1777. }
  1778. for (i = 0; i < mpeg4_block_count[s->chroma_format]; i++) {
  1779. if (mpeg4_decode_studio_block(s, (*s->block32)[i], i) < 0)
  1780. return AVERROR_INVALIDDATA;
  1781. }
  1782. } else {
  1783. /* DPCM */
  1784. check_marker(s->avctx, &s->gb, "DPCM block start");
  1785. s->dpcm_direction = get_bits1(&s->gb) ? -1 : 1;
  1786. for (i = 0; i < 3; i++) {
  1787. if (mpeg4_decode_dpcm_macroblock(s, (*s->dpcm_macroblock)[i], i) < 0)
  1788. return AVERROR_INVALIDDATA;
  1789. }
  1790. }
  1791. if (get_bits_left(&s->gb) >= 24 && show_bits(&s->gb, 23) == 0) {
  1792. next_start_code_studio(&s->gb);
  1793. return SLICE_END;
  1794. }
  1795. //vcon-stp9L1.bits (first frame)
  1796. if (get_bits_left(&s->gb) == 0)
  1797. return SLICE_END;
  1798. //vcon-stp2L1.bits, vcon-stp3L1.bits, vcon-stp6L1.bits, vcon-stp7L1.bits, vcon-stp8L1.bits, vcon-stp10L1.bits (first frame)
  1799. if (get_bits_left(&s->gb) < 8U && show_bits(&s->gb, get_bits_left(&s->gb)) == 0)
  1800. return SLICE_END;
  1801. return SLICE_OK;
  1802. }
  1803. static int mpeg4_decode_gop_header(MpegEncContext *s, GetBitContext *gb)
  1804. {
  1805. int hours, minutes, seconds;
  1806. if (!show_bits(gb, 23)) {
  1807. av_log(s->avctx, AV_LOG_WARNING, "GOP header invalid\n");
  1808. return AVERROR_INVALIDDATA;
  1809. }
  1810. hours = get_bits(gb, 5);
  1811. minutes = get_bits(gb, 6);
  1812. check_marker(s->avctx, gb, "in gop_header");
  1813. seconds = get_bits(gb, 6);
  1814. s->time_base = seconds + 60*(minutes + 60*hours);
  1815. skip_bits1(gb);
  1816. skip_bits1(gb);
  1817. return 0;
  1818. }
  1819. static int mpeg4_decode_profile_level(MpegEncContext *s, GetBitContext *gb, int *profile, int *level)
  1820. {
  1821. *profile = get_bits(gb, 4);
  1822. *level = get_bits(gb, 4);
  1823. // for Simple profile, level 0
  1824. if (*profile == 0 && *level == 8) {
  1825. *level = 0;
  1826. }
  1827. return 0;
  1828. }
  1829. static int mpeg4_decode_visual_object(MpegEncContext *s, GetBitContext *gb)
  1830. {
  1831. int visual_object_type;
  1832. int is_visual_object_identifier = get_bits1(gb);
  1833. if (is_visual_object_identifier) {
  1834. skip_bits(gb, 4+3);
  1835. }
  1836. visual_object_type = get_bits(gb, 4);
  1837. if (visual_object_type == VOT_VIDEO_ID ||
  1838. visual_object_type == VOT_STILL_TEXTURE_ID) {
  1839. int video_signal_type = get_bits1(gb);
  1840. if (video_signal_type) {
  1841. int video_range, color_description;
  1842. skip_bits(gb, 3); // video_format
  1843. video_range = get_bits1(gb);
  1844. color_description = get_bits1(gb);
  1845. s->avctx->color_range = video_range ? AVCOL_RANGE_JPEG : AVCOL_RANGE_MPEG;
  1846. if (color_description) {
  1847. s->avctx->color_primaries = get_bits(gb, 8);
  1848. s->avctx->color_trc = get_bits(gb, 8);
  1849. s->avctx->colorspace = get_bits(gb, 8);
  1850. }
  1851. }
  1852. }
  1853. return 0;
  1854. }
  1855. static void mpeg4_load_default_matrices(MpegEncContext *s)
  1856. {
  1857. int i, v;
  1858. /* load default matrices */
  1859. for (i = 0; i < 64; i++) {
  1860. int j = s->idsp.idct_permutation[i];
  1861. v = ff_mpeg4_default_intra_matrix[i];
  1862. s->intra_matrix[j] = v;
  1863. s->chroma_intra_matrix[j] = v;
  1864. v = ff_mpeg4_default_non_intra_matrix[i];
  1865. s->inter_matrix[j] = v;
  1866. s->chroma_inter_matrix[j] = v;
  1867. }
  1868. }
  1869. static int read_quant_matrix_ext(MpegEncContext *s, GetBitContext *gb)
  1870. {
  1871. int i, j, v;
  1872. if (get_bits1(gb)) {
  1873. if (get_bits_left(gb) < 64*8)
  1874. return AVERROR_INVALIDDATA;
  1875. /* intra_quantiser_matrix */
  1876. for (i = 0; i < 64; i++) {
  1877. v = get_bits(gb, 8);
  1878. j = s->idsp.idct_permutation[ff_zigzag_direct[i]];
  1879. s->intra_matrix[j] = v;
  1880. s->chroma_intra_matrix[j] = v;
  1881. }
  1882. }
  1883. if (get_bits1(gb)) {
  1884. if (get_bits_left(gb) < 64*8)
  1885. return AVERROR_INVALIDDATA;
  1886. /* non_intra_quantiser_matrix */
  1887. for (i = 0; i < 64; i++) {
  1888. get_bits(gb, 8);
  1889. }
  1890. }
  1891. if (get_bits1(gb)) {
  1892. if (get_bits_left(gb) < 64*8)
  1893. return AVERROR_INVALIDDATA;
  1894. /* chroma_intra_quantiser_matrix */
  1895. for (i = 0; i < 64; i++) {
  1896. v = get_bits(gb, 8);
  1897. j = s->idsp.idct_permutation[ff_zigzag_direct[i]];
  1898. s->chroma_intra_matrix[j] = v;
  1899. }
  1900. }
  1901. if (get_bits1(gb)) {
  1902. if (get_bits_left(gb) < 64*8)
  1903. return AVERROR_INVALIDDATA;
  1904. /* chroma_non_intra_quantiser_matrix */
  1905. for (i = 0; i < 64; i++) {
  1906. get_bits(gb, 8);
  1907. }
  1908. }
  1909. next_start_code_studio(gb);
  1910. return 0;
  1911. }
  1912. static void extension_and_user_data(MpegEncContext *s, GetBitContext *gb, int id)
  1913. {
  1914. uint32_t startcode;
  1915. uint8_t extension_type;
  1916. startcode = show_bits_long(gb, 32);
  1917. if (startcode == USER_DATA_STARTCODE || startcode == EXT_STARTCODE) {
  1918. if ((id == 2 || id == 4) && startcode == EXT_STARTCODE) {
  1919. skip_bits_long(gb, 32);
  1920. extension_type = get_bits(gb, 4);
  1921. if (extension_type == QUANT_MATRIX_EXT_ID)
  1922. read_quant_matrix_ext(s, gb);
  1923. }
  1924. }
  1925. }
  1926. static int decode_studio_vol_header(Mpeg4DecContext *ctx, GetBitContext *gb)
  1927. {
  1928. MpegEncContext *s = &ctx->m;
  1929. int width, height;
  1930. int bits_per_raw_sample;
  1931. int rgb, chroma_format;
  1932. // random_accessible_vol and video_object_type_indication have already
  1933. // been read by the caller decode_vol_header()
  1934. skip_bits(gb, 4); /* video_object_layer_verid */
  1935. ctx->shape = get_bits(gb, 2); /* video_object_layer_shape */
  1936. skip_bits(gb, 4); /* video_object_layer_shape_extension */
  1937. skip_bits1(gb); /* progressive_sequence */
  1938. if (ctx->shape != RECT_SHAPE) {
  1939. avpriv_request_sample(s->avctx, "MPEG-4 Studio profile non rectangular shape");
  1940. return AVERROR_PATCHWELCOME;
  1941. }
  1942. if (ctx->shape != BIN_ONLY_SHAPE) {
  1943. rgb = get_bits1(gb); /* rgb_components */
  1944. chroma_format = get_bits(gb, 2); /* chroma_format */
  1945. if (!chroma_format || chroma_format == CHROMA_420 || (rgb && chroma_format == CHROMA_422)) {
  1946. av_log(s->avctx, AV_LOG_ERROR, "illegal chroma format\n");
  1947. return AVERROR_INVALIDDATA;
  1948. }
  1949. bits_per_raw_sample = get_bits(gb, 4); /* bit_depth */
  1950. if (bits_per_raw_sample == 10) {
  1951. if (rgb) {
  1952. s->avctx->pix_fmt = AV_PIX_FMT_GBRP10;
  1953. } else {
  1954. s->avctx->pix_fmt = chroma_format == CHROMA_422 ? AV_PIX_FMT_YUV422P10 : AV_PIX_FMT_YUV444P10;
  1955. }
  1956. } else {
  1957. avpriv_request_sample(s->avctx, "MPEG-4 Studio profile bit-depth %u", bits_per_raw_sample);
  1958. return AVERROR_PATCHWELCOME;
  1959. }
  1960. if (rgb != ctx->rgb || s->chroma_format != chroma_format)
  1961. s->context_reinit = 1;
  1962. s->avctx->bits_per_raw_sample = bits_per_raw_sample;
  1963. ctx->rgb = rgb;
  1964. s->chroma_format = chroma_format;
  1965. }
  1966. if (ctx->shape == RECT_SHAPE) {
  1967. check_marker(s->avctx, gb, "before video_object_layer_width");
  1968. width = get_bits(gb, 14); /* video_object_layer_width */
  1969. check_marker(s->avctx, gb, "before video_object_layer_height");
  1970. height = get_bits(gb, 14); /* video_object_layer_height */
  1971. check_marker(s->avctx, gb, "after video_object_layer_height");
  1972. /* Do the same check as non-studio profile */
  1973. if (width && height) {
  1974. if (s->width && s->height &&
  1975. (s->width != width || s->height != height))
  1976. s->context_reinit = 1;
  1977. s->width = width;
  1978. s->height = height;
  1979. }
  1980. }
  1981. s->aspect_ratio_info = get_bits(gb, 4);
  1982. if (s->aspect_ratio_info == FF_ASPECT_EXTENDED) {
  1983. s->avctx->sample_aspect_ratio.num = get_bits(gb, 8); // par_width
  1984. s->avctx->sample_aspect_ratio.den = get_bits(gb, 8); // par_height
  1985. } else {
  1986. s->avctx->sample_aspect_ratio = ff_h263_pixel_aspect[s->aspect_ratio_info];
  1987. }
  1988. skip_bits(gb, 4); /* frame_rate_code */
  1989. skip_bits(gb, 15); /* first_half_bit_rate */
  1990. check_marker(s->avctx, gb, "after first_half_bit_rate");
  1991. skip_bits(gb, 15); /* latter_half_bit_rate */
  1992. check_marker(s->avctx, gb, "after latter_half_bit_rate");
  1993. skip_bits(gb, 15); /* first_half_vbv_buffer_size */
  1994. check_marker(s->avctx, gb, "after first_half_vbv_buffer_size");
  1995. skip_bits(gb, 3); /* latter_half_vbv_buffer_size */
  1996. skip_bits(gb, 11); /* first_half_vbv_buffer_size */
  1997. check_marker(s->avctx, gb, "after first_half_vbv_buffer_size");
  1998. skip_bits(gb, 15); /* latter_half_vbv_occupancy */
  1999. check_marker(s->avctx, gb, "after latter_half_vbv_occupancy");
  2000. s->low_delay = get_bits1(gb);
  2001. s->mpeg_quant = get_bits1(gb); /* mpeg2_stream */
  2002. next_start_code_studio(gb);
  2003. extension_and_user_data(s, gb, 2);
  2004. return 0;
  2005. }
/**
 * Parse a Video Object Layer header.
 *
 * Studio-profile object types are handed over to decode_studio_vol_header();
 * everything else is parsed here. Unsupported features are logged and the
 * corresponding fields are read past so that parsing can continue.
 *
 * @param ctx MPEG-4 decoder context, updated with the parsed parameters
 * @param gb  bit reader positioned at the start of the VOL header payload
 * @return 0 on success, AVERROR_INVALIDDATA on inconsistent or truncated
 *         data, AVERROR_PATCHWELCOME for a non-studio VOL while the studio
 *         profile is active, or the result of decode_studio_vol_header()
 */
static int decode_vol_header(Mpeg4DecContext *ctx, GetBitContext *gb)
{
    MpegEncContext *s = &ctx->m;
    int width, height, vo_ver_id;

    /* vol header */
    skip_bits(gb, 1);                   /* random access */
    s->vo_type = get_bits(gb, 8);

    /* If we are in studio profile (per vo_type), check that everything is
     * consistent and if so pass control to decode_studio_vol_header().
     * Else, if something is inconsistent, error out;
     * else continue with (non studio) vol header decoding.
     */
    if (s->vo_type == CORE_STUDIO_VO_TYPE ||
        s->vo_type == SIMPLE_STUDIO_VO_TYPE) {
        if (s->avctx->profile != FF_PROFILE_UNKNOWN && s->avctx->profile != FF_PROFILE_MPEG4_SIMPLE_STUDIO)
            return AVERROR_INVALIDDATA;
        s->studio_profile = 1;
        s->avctx->profile = FF_PROFILE_MPEG4_SIMPLE_STUDIO;
        return decode_studio_vol_header(ctx, gb);
    } else if (s->studio_profile) {
        return AVERROR_PATCHWELCOME;
    }

    if (get_bits1(gb) != 0) {           /* is_ol_id */
        vo_ver_id = get_bits(gb, 4);    /* vo_ver_id */
        skip_bits(gb, 3);               /* vo_priority */
    } else {
        vo_ver_id = 1;
    }
    s->aspect_ratio_info = get_bits(gb, 4);
    if (s->aspect_ratio_info == FF_ASPECT_EXTENDED) {
        s->avctx->sample_aspect_ratio.num = get_bits(gb, 8);  // par_width
        s->avctx->sample_aspect_ratio.den = get_bits(gb, 8);  // par_height
    } else {
        s->avctx->sample_aspect_ratio = ff_h263_pixel_aspect[s->aspect_ratio_info];
    }

    if ((ctx->vol_control_parameters = get_bits1(gb))) { /* vol control parameter */
        int chroma_format = get_bits(gb, 2);
        /* Only logged: parsing continues even for an unexpected value. */
        if (chroma_format != CHROMA_420)
            av_log(s->avctx, AV_LOG_ERROR, "illegal chroma format\n");

        s->low_delay = get_bits1(gb);
        if (get_bits1(gb)) {    /* vbv parameters */
            get_bits(gb, 15);   /* first_half_bitrate */
            check_marker(s->avctx, gb, "after first_half_bitrate");
            get_bits(gb, 15);   /* latter_half_bitrate */
            check_marker(s->avctx, gb, "after latter_half_bitrate");
            get_bits(gb, 15);   /* first_half_vbv_buffer_size */
            check_marker(s->avctx, gb, "after first_half_vbv_buffer_size");
            get_bits(gb, 3);    /* latter_half_vbv_buffer_size */
            get_bits(gb, 11);   /* first_half_vbv_occupancy */
            check_marker(s->avctx, gb, "after first_half_vbv_occupancy");
            get_bits(gb, 15);   /* latter_half_vbv_occupancy */
            check_marker(s->avctx, gb, "after latter_half_vbv_occupancy");
        }
    } else {
        /* is setting low delay flag only once the smartest thing to do?
         * low delay detection will not be overridden. */
        if (s->picture_number == 0) {
            switch(s->vo_type) {
            case SIMPLE_VO_TYPE:
            case ADV_SIMPLE_VO_TYPE:
                s->low_delay = 1;
                break;
            default:
                s->low_delay = 0;
            }
        }
    }

    ctx->shape = get_bits(gb, 2); /* vol shape */
    if (ctx->shape != RECT_SHAPE)
        av_log(s->avctx, AV_LOG_ERROR, "only rectangular vol supported\n");
    if (ctx->shape == GRAY_SHAPE && vo_ver_id != 1) {
        av_log(s->avctx, AV_LOG_ERROR, "Gray shape not supported\n");
        skip_bits(gb, 4);  /* video_object_layer_shape_extension */
    }

    check_marker(s->avctx, gb, "before time_increment_resolution");

    s->avctx->framerate.num = get_bits(gb, 16);
    if (!s->avctx->framerate.num) {
        av_log(s->avctx, AV_LOG_ERROR, "framerate==0\n");
        return AVERROR_INVALIDDATA;
    }

    /* Width of the time increment field, derived from the largest value
     * below framerate.num and forced to be at least 1. */
    ctx->time_increment_bits = av_log2(s->avctx->framerate.num - 1) + 1;
    if (ctx->time_increment_bits < 1)
        ctx->time_increment_bits = 1;

    check_marker(s->avctx, gb, "before fixed_vop_rate");

    if (get_bits1(gb) != 0)     /* fixed_vop_rate  */
        s->avctx->framerate.den = get_bits(gb, ctx->time_increment_bits);
    else
        s->avctx->framerate.den = 1;

    s->avctx->time_base = av_inv_q(av_mul_q(s->avctx->framerate, (AVRational){s->avctx->ticks_per_frame, 1}));

    ctx->t_frame = 0;

    if (ctx->shape != BIN_ONLY_SHAPE) {
        if (ctx->shape == RECT_SHAPE) {
            check_marker(s->avctx, gb, "before width");
            width = get_bits(gb, 13);
            check_marker(s->avctx, gb, "before height");
            height = get_bits(gb, 13);
            check_marker(s->avctx, gb, "after height");
            /* Dimensions already known are kept for the "MP4S" codec tag. */
            if (width && height &&  /* they should be non zero but who knows */
                !(s->width && s->codec_tag == AV_RL32("MP4S"))) {
                if (s->width && s->height &&
                    (s->width != width || s->height != height))
                    s->context_reinit = 1;
                s->width  = width;
                s->height = height;
            }
        }

        /* The bit read here is inverted to obtain the progressive flags. */
        s->progressive_sequence  =
        s->progressive_frame     = get_bits1(gb) ^ 1;
        s->interlaced_dct        = 0;
        if (!get_bits1(gb) && (s->avctx->debug & FF_DEBUG_PICT_INFO))
            av_log(s->avctx, AV_LOG_INFO,           /* OBMC Disable */
                   "MPEG-4 OBMC not supported (very likely buggy encoder)\n");
        /* vol_sprite_usage is 1 bit for version 1 and 2 bits otherwise. */
        if (vo_ver_id == 1)
            ctx->vol_sprite_usage = get_bits1(gb);    /* vol_sprite_usage */
        else
            ctx->vol_sprite_usage = get_bits(gb, 2);  /* vol_sprite_usage */

        if (ctx->vol_sprite_usage == STATIC_SPRITE)
            av_log(s->avctx, AV_LOG_ERROR, "Static Sprites not supported\n");
        if (ctx->vol_sprite_usage == STATIC_SPRITE ||
            ctx->vol_sprite_usage == GMC_SPRITE) {
            if (ctx->vol_sprite_usage == STATIC_SPRITE) {
                skip_bits(gb, 13); // sprite_width
                check_marker(s->avctx, gb, "after sprite_width");
                skip_bits(gb, 13); // sprite_height
                check_marker(s->avctx, gb, "after sprite_height");
                skip_bits(gb, 13); // sprite_left
                check_marker(s->avctx, gb, "after sprite_left");
                skip_bits(gb, 13); // sprite_top
                check_marker(s->avctx, gb, "after sprite_top");
            }
            ctx->num_sprite_warping_points = get_bits(gb, 6);
            if (ctx->num_sprite_warping_points > 3) {
                av_log(s->avctx, AV_LOG_ERROR,
                       "%d sprite_warping_points\n",
                       ctx->num_sprite_warping_points);
                ctx->num_sprite_warping_points = 0;
                return AVERROR_INVALIDDATA;
            }
            s->sprite_warping_accuracy  = get_bits(gb, 2);
            ctx->sprite_brightness_change = get_bits1(gb);
            if (ctx->vol_sprite_usage == STATIC_SPRITE)
                skip_bits1(gb); // low_latency_sprite
        }
        // FIXME sadct disable bit if verid!=1 && shape not rect

        if (get_bits1(gb) == 1) {                   /* not_8_bit */
            s->quant_precision = get_bits(gb, 4);   /* quant_precision */
            if (get_bits(gb, 4) != 8)               /* bits_per_pixel */
                av_log(s->avctx, AV_LOG_ERROR, "N-bit not supported\n");
            if (s->quant_precision != 5)
                av_log(s->avctx, AV_LOG_ERROR,
                       "quant precision %d\n", s->quant_precision);
            /* Values outside 3..9 fall back to the default of 5. */
            if (s->quant_precision<3 || s->quant_precision>9) {
                s->quant_precision = 5;
            }
        } else {
            s->quant_precision = 5;
        }

        // FIXME a bunch of grayscale shape things

        if ((s->mpeg_quant = get_bits1(gb))) { /* vol_quant_type */
            int i, v;

            mpeg4_load_default_matrices(s);

            /* load custom intra matrix */
            if (get_bits1(gb)) {
                int last = 0;
                for (i = 0; i < 64; i++) {
                    int j;
                    if (get_bits_left(gb) < 8) {
                        av_log(s->avctx, AV_LOG_ERROR, "insufficient data for custom matrix\n");
                        return AVERROR_INVALIDDATA;
                    }
                    v = get_bits(gb, 8);
                    /* A zero byte terminates the explicitly coded values. */
                    if (v == 0)
                        break;

                    last = v;
                    j = s->idsp.idct_permutation[ff_zigzag_direct[i]];
                    s->intra_matrix[j]        = last;
                    s->chroma_intra_matrix[j] = last;
                }

                /* replicate last value */
                for (; i < 64; i++) {
                    int j = s->idsp.idct_permutation[ff_zigzag_direct[i]];
                    s->intra_matrix[j]        = last;
                    s->chroma_intra_matrix[j] = last;
                }
            }

            /* load custom non intra matrix */
            if (get_bits1(gb)) {
                int last = 0;
                for (i = 0; i < 64; i++) {
                    int j;
                    if (get_bits_left(gb) < 8) {
                        av_log(s->avctx, AV_LOG_ERROR, "insufficient data for custom matrix\n");
                        return AVERROR_INVALIDDATA;
                    }
                    v = get_bits(gb, 8);
                    /* A zero byte terminates the explicitly coded values. */
                    if (v == 0)
                        break;

                    last = v;
                    j = s->idsp.idct_permutation[ff_zigzag_direct[i]];
                    s->inter_matrix[j]        = v;
                    s->chroma_inter_matrix[j] = v;
                }

                /* replicate last value */
                for (; i < 64; i++) {
                    int j = s->idsp.idct_permutation[ff_zigzag_direct[i]];
                    s->inter_matrix[j]        = last;
                    s->chroma_inter_matrix[j] = last;
                }
            }

            // FIXME a bunch of grayscale shape things
        }

        if (vo_ver_id != 1)
            s->quarter_sample = get_bits1(gb);
        else
            s->quarter_sample = 0;

        if (get_bits_left(gb) < 4) {
            av_log(s->avctx, AV_LOG_ERROR, "VOL Header truncated\n");
            return AVERROR_INVALIDDATA;
        }

        /* Complexity estimation header: each flag that is set adds the
         * size of the matching per-VOP field to the trash counters. */
        if (!get_bits1(gb)) {
            /* Remember the position so a failed marker can rewind to it. */
            int pos               = get_bits_count(gb);
            int estimation_method = get_bits(gb, 2);
            if (estimation_method < 2) {
                if (!get_bits1(gb)) {
                    ctx->cplx_estimation_trash_i += 8 * get_bits1(gb);  /* opaque */
                    ctx->cplx_estimation_trash_i += 8 * get_bits1(gb);  /* transparent */
                    ctx->cplx_estimation_trash_i += 8 * get_bits1(gb);  /* intra_cae */
                    ctx->cplx_estimation_trash_i += 8 * get_bits1(gb);  /* inter_cae */
                    ctx->cplx_estimation_trash_i += 8 * get_bits1(gb);  /* no_update */
                    ctx->cplx_estimation_trash_i += 8 * get_bits1(gb);  /* upsampling */
                }
                if (!get_bits1(gb)) {
                    ctx->cplx_estimation_trash_i += 8 * get_bits1(gb);  /* intra_blocks */
                    ctx->cplx_estimation_trash_p += 8 * get_bits1(gb);  /* inter_blocks */
                    ctx->cplx_estimation_trash_p += 8 * get_bits1(gb);  /* inter4v_blocks */
                    ctx->cplx_estimation_trash_i += 8 * get_bits1(gb);  /* not coded blocks */
                }
                if (!check_marker(s->avctx, gb, "in complexity estimation part 1")) {
                    /* Negative skip: rewind to the start of this section. */
                    skip_bits_long(gb, pos - get_bits_count(gb));
                    goto no_cplx_est;
                }
                if (!get_bits1(gb)) {
                    ctx->cplx_estimation_trash_i += 8 * get_bits1(gb);  /* dct_coeffs */
                    ctx->cplx_estimation_trash_i += 8 * get_bits1(gb);  /* dct_lines */
                    ctx->cplx_estimation_trash_i += 8 * get_bits1(gb);  /* vlc_syms */
                    ctx->cplx_estimation_trash_i += 4 * get_bits1(gb);  /* vlc_bits */
                }
                if (!get_bits1(gb)) {
                    ctx->cplx_estimation_trash_p += 8 * get_bits1(gb);  /* apm */
                    ctx->cplx_estimation_trash_p += 8 * get_bits1(gb);  /* npm */
                    ctx->cplx_estimation_trash_b += 8 * get_bits1(gb);  /* interpolate_mc_q */
                    ctx->cplx_estimation_trash_p += 8 * get_bits1(gb);  /* forwback_mc_q */
                    ctx->cplx_estimation_trash_p += 8 * get_bits1(gb);  /* halfpel2 */
                    ctx->cplx_estimation_trash_p += 8 * get_bits1(gb);  /* halfpel4 */
                }
                if (!check_marker(s->avctx, gb, "in complexity estimation part 2")) {
                    /* Negative skip: rewind to the start of this section. */
                    skip_bits_long(gb, pos - get_bits_count(gb));
                    goto no_cplx_est;
                }
                if (estimation_method == 1) {
                    ctx->cplx_estimation_trash_i += 8 * get_bits1(gb);  /* sadct */
                    ctx->cplx_estimation_trash_p += 8 * get_bits1(gb);  /* qpel */
                }
            } else
                av_log(s->avctx, AV_LOG_ERROR,
                       "Invalid Complexity estimation method %d\n",
                       estimation_method);
        } else {

no_cplx_est:
            /* Also reached by goto when a marker bit above is missing. */
            ctx->cplx_estimation_trash_i =
            ctx->cplx_estimation_trash_p =
            ctx->cplx_estimation_trash_b = 0;
        }

        ctx->resync_marker = !get_bits1(gb); /* resync_marker_disabled */

        s->data_partitioning = get_bits1(gb);
        if (s->data_partitioning)
            ctx->rvlc = get_bits1(gb);

        if (vo_ver_id != 1) {
            ctx->new_pred = get_bits1(gb);
            if (ctx->new_pred) {
                av_log(s->avctx, AV_LOG_ERROR, "new pred not supported\n");
                skip_bits(gb, 2); /* requested upstream message type */
                skip_bits1(gb);   /* newpred segment type */
            }
            if (get_bits1(gb)) // reduced_res_vop
                av_log(s->avctx, AV_LOG_ERROR,
                       "reduced resolution VOP not supported\n");
        } else {
            ctx->new_pred = 0;
        }

        ctx->scalability = get_bits1(gb);

        if (ctx->scalability) {
            /* Snapshot of the reader, restored if the header looks bogus. */
            GetBitContext bak = *gb;
            int h_sampling_factor_n;
            int h_sampling_factor_m;
            int v_sampling_factor_n;
            int v_sampling_factor_m;

            skip_bits1(gb);    // hierarchy_type
            skip_bits(gb, 4);  /* ref_layer_id */
            skip_bits1(gb);    /* ref_layer_sampling_dir */
            h_sampling_factor_n = get_bits(gb, 5);
            h_sampling_factor_m = get_bits(gb, 5);
            v_sampling_factor_n = get_bits(gb, 5);
            v_sampling_factor_m = get_bits(gb, 5);
            ctx->enhancement_type = get_bits1(gb);

            if (h_sampling_factor_n == 0 || h_sampling_factor_m == 0 ||
                v_sampling_factor_n == 0 || v_sampling_factor_m == 0) {
                /* illegal scalability header (VERY broken encoder),
                 * trying to workaround */
                ctx->scalability = 0;
                *gb            = bak;
            } else
                av_log(s->avctx, AV_LOG_ERROR, "scalability not supported\n");

            // bin shape stuff FIXME
        }
    }

    if (s->avctx->debug&FF_DEBUG_PICT_INFO) {
        av_log(s->avctx, AV_LOG_DEBUG, "tb %d/%d, tincrbits:%d, qp_prec:%d, ps:%d, low_delay:%d  %s%s%s%s\n",
               s->avctx->framerate.den, s->avctx->framerate.num,
               ctx->time_increment_bits,
               s->quant_precision,
               s->progressive_sequence,
               s->low_delay,
               ctx->scalability ? "scalability " :"" , s->quarter_sample ? "qpel " : "",
               s->data_partitioning ? "partition " : "", ctx->rvlc ? "rvlc " : ""
        );
    }

    return 0;
}
  2335. /**
  2336. * Decode the user data stuff in the header.
  2337. * Also initializes divx/xvid/lavc_version/build.
  2338. */
  2339. static int decode_user_data(Mpeg4DecContext *ctx, GetBitContext *gb)
  2340. {
  2341. MpegEncContext *s = &ctx->m;
  2342. char buf[256];
  2343. int i;
  2344. int e;
  2345. int ver = 0, build = 0, ver2 = 0, ver3 = 0;
  2346. char last;
  2347. for (i = 0; i < 255 && get_bits_count(gb) < gb->size_in_bits; i++) {
  2348. if (show_bits(gb, 23) == 0)
  2349. break;
  2350. buf[i] = get_bits(gb, 8);
  2351. }
  2352. buf[i] = 0;
  2353. /* divx detection */
  2354. e = sscanf(buf, "DivX%dBuild%d%c", &ver, &build, &last);
  2355. if (e < 2)
  2356. e = sscanf(buf, "DivX%db%d%c", &ver, &build, &last);
  2357. if (e >= 2) {
  2358. ctx->divx_version = ver;
  2359. ctx->divx_build = build;
  2360. s->divx_packed = e == 3 && last == 'p';
  2361. }
  2362. /* libavcodec detection */
  2363. e = sscanf(buf, "FFmpe%*[^b]b%d", &build) + 3;
  2364. if (e != 4)
  2365. e = sscanf(buf, "FFmpeg v%d.%d.%d / libavcodec build: %d", &ver, &ver2, &ver3, &build);
  2366. if (e != 4) {
  2367. e = sscanf(buf, "Lavc%d.%d.%d", &ver, &ver2, &ver3) + 1;
  2368. if (e > 1) {
  2369. if (ver > 0xFFU || ver2 > 0xFFU || ver3 > 0xFFU) {
  2370. av_log(s->avctx, AV_LOG_WARNING,
  2371. "Unknown Lavc version string encountered, %d.%d.%d; "
  2372. "clamping sub-version values to 8-bits.\n",
  2373. ver, ver2, ver3);
  2374. }
  2375. build = ((ver & 0xFF) << 16) + ((ver2 & 0xFF) << 8) + (ver3 & 0xFF);
  2376. }
  2377. }
  2378. if (e != 4) {
  2379. if (strcmp(buf, "ffmpeg") == 0)
  2380. ctx->lavc_build = 4600;
  2381. }
  2382. if (e == 4)
  2383. ctx->lavc_build = build;
  2384. /* Xvid detection */
  2385. e = sscanf(buf, "XviD%d", &build);
  2386. if (e == 1)
  2387. ctx->xvid_build = build;
  2388. return 0;
  2389. }
/**
 * Select encoder-specific bug workarounds.
 *
 * The encoder is guessed from the detected xvid/divx/lavc build numbers
 * and, when none is known, from the codec tag. With FF_BUG_AUTODETECT set,
 * workaround flags and the padding bug score are derived from those
 * versions. Old qpel functions are installed when FF_BUG_STD_QPEL is
 * active.
 *
 * @param avctx codec context whose priv_data is the Mpeg4DecContext
 * @return 1 if the IDCT was switched to FF_IDCT_XVID and re-initialised,
 *         0 otherwise
 */
int ff_mpeg4_workaround_bugs(AVCodecContext *avctx)
{
    Mpeg4DecContext *ctx = avctx->priv_data;
    MpegEncContext *s = &ctx->m;

    /* No encoder identified so far (-1 everywhere): guess Xvid from the
     * codec tag. */
    if (ctx->xvid_build == -1 && ctx->divx_version == -1 && ctx->lavc_build == -1) {
        if (s->codec_tag        == AV_RL32("XVID") ||
            s->codec_tag        == AV_RL32("XVIX") ||
            s->codec_tag        == AV_RL32("RMP4") ||
            s->codec_tag        == AV_RL32("ZMP4") ||
            s->codec_tag        == AV_RL32("SIPP"))
            ctx->xvid_build = 0;
    }

    if (ctx->xvid_build == -1 && ctx->divx_version == -1 && ctx->lavc_build == -1)
        if (s->codec_tag == AV_RL32("DIVX") && s->vo_type == 0 &&
            ctx->vol_control_parameters == 0)
            ctx->divx_version = 400;  // divx 4

    /* When both are detected, Xvid wins and the DivX values are cleared. */
    if (ctx->xvid_build >= 0 && ctx->divx_version >= 0) {
        ctx->divx_version =
        ctx->divx_build   = -1;
    }

    if (s->workaround_bugs & FF_BUG_AUTODETECT) {
        if (s->codec_tag == AV_RL32("XVIX"))
            s->workaround_bugs |= FF_BUG_XVID_ILACE;

        if (s->codec_tag == AV_RL32("UMP4"))
            s->workaround_bugs |= FF_BUG_UMP4;

        if (ctx->divx_version >= 500 && ctx->divx_build < 1814)
            s->workaround_bugs |= FF_BUG_QPEL_CHROMA;

        if (ctx->divx_version > 502 && ctx->divx_build < 1814)
            s->workaround_bugs |= FF_BUG_QPEL_CHROMA2;

        /* NOTE(review): the comparisons against unsigned constants below
         * presumably rely on the build fields being signed ints, so that
         * the "unknown" value -1 converts to a huge unsigned number and
         * fails the test -- confirm against the field declarations. */
        if (ctx->xvid_build <= 3U)
            s->padding_bug_score = 256 * 256 * 256 * 64;

        if (ctx->xvid_build <= 1U)
            s->workaround_bugs |= FF_BUG_QPEL_CHROMA;

        if (ctx->xvid_build <= 12U)
            s->workaround_bugs |= FF_BUG_EDGE;

        if (ctx->xvid_build <= 32U)
            s->workaround_bugs |= FF_BUG_DC_CLIP;

/* Installs the put, put_no_rnd and avg variants of one qpel function. */
#define SET_QPEL_FUNC(postfix1, postfix2)                           \
    s->qdsp.put_        ## postfix1 = ff_put_        ## postfix2;   \
    s->qdsp.put_no_rnd_ ## postfix1 = ff_put_no_rnd_ ## postfix2;   \
    s->qdsp.avg_        ## postfix1 = ff_avg_        ## postfix2;

        if (ctx->lavc_build < 4653U)
            s->workaround_bugs |= FF_BUG_STD_QPEL;

        if (ctx->lavc_build < 4655U)
            s->workaround_bugs |= FF_BUG_DIRECT_BLOCKSIZE;

        if (ctx->lavc_build < 4670U)
            s->workaround_bugs |= FF_BUG_EDGE;

        if (ctx->lavc_build <= 4712U)
            s->workaround_bugs |= FF_BUG_DC_CLIP;

        /* Only builds whose low byte is at least 100 are considered for
         * the IEDGE workaround. */
        if ((ctx->lavc_build&0xFF) >= 100) {
            if (ctx->lavc_build > 3621476 && ctx->lavc_build < 3752552 &&
               (ctx->lavc_build < 3752037 || ctx->lavc_build > 3752191) // 3.2.1+
            )
                s->workaround_bugs |= FF_BUG_IEDGE;
        }

        if (ctx->divx_version >= 0)
            s->workaround_bugs |= FF_BUG_DIRECT_BLOCKSIZE;
        if (ctx->divx_version == 501 && ctx->divx_build == 20020416)
            s->padding_bug_score = 256 * 256 * 256 * 64;

        if (ctx->divx_version < 500U)
            s->workaround_bugs |= FF_BUG_EDGE;

        if (ctx->divx_version >= 0)
            s->workaround_bugs |= FF_BUG_HPEL_CHROMA;
    }

    /* Replace selected qpel functions with their "old" C versions. */
    if (s->workaround_bugs & FF_BUG_STD_QPEL) {
        SET_QPEL_FUNC(qpel_pixels_tab[0][5], qpel16_mc11_old_c)
        SET_QPEL_FUNC(qpel_pixels_tab[0][7], qpel16_mc31_old_c)
        SET_QPEL_FUNC(qpel_pixels_tab[0][9], qpel16_mc12_old_c)
        SET_QPEL_FUNC(qpel_pixels_tab[0][11], qpel16_mc32_old_c)
        SET_QPEL_FUNC(qpel_pixels_tab[0][13], qpel16_mc13_old_c)
        SET_QPEL_FUNC(qpel_pixels_tab[0][15], qpel16_mc33_old_c)

        SET_QPEL_FUNC(qpel_pixels_tab[1][5], qpel8_mc11_old_c)
        SET_QPEL_FUNC(qpel_pixels_tab[1][7], qpel8_mc31_old_c)
        SET_QPEL_FUNC(qpel_pixels_tab[1][9], qpel8_mc12_old_c)
        SET_QPEL_FUNC(qpel_pixels_tab[1][11], qpel8_mc32_old_c)
        SET_QPEL_FUNC(qpel_pixels_tab[1][13], qpel8_mc13_old_c)
        SET_QPEL_FUNC(qpel_pixels_tab[1][15], qpel8_mc33_old_c)
    }

    if (avctx->debug & FF_DEBUG_BUGS)
        av_log(s->avctx, AV_LOG_DEBUG,
               "bugs: %X lavc_build:%d xvid_build:%d divx_version:%d divx_build:%d %s\n",
               s->workaround_bugs, ctx->lavc_build, ctx->xvid_build,
               ctx->divx_version, ctx->divx_build, s->divx_packed ? "p" : "");

    /* Xvid streams with automatic IDCT selection get the Xvid IDCT. */
    if (CONFIG_MPEG4_DECODER && ctx->xvid_build >= 0 &&
        s->codec_id == AV_CODEC_ID_MPEG4 &&
        avctx->idct_algo == FF_IDCT_AUTO) {
        avctx->idct_algo = FF_IDCT_XVID;
        ff_mpv_idct_init(s);
        return 1;
    }

    return 0;
}
/**
 * Decode a regular (non-studio) VOP header and update the decoder state.
 *
 * @param ctx decoder context; its embedded MpegEncContext is updated
 * @param gb  bit reader the header is parsed from
 * @return 0 on success,
 *         FRAME_SKIPPED if the VOP is not coded or a B-VOP has unusable timing,
 *         AVERROR_INVALIDDATA if the header is truncated or damaged
 */
static int decode_vop_header(Mpeg4DecContext *ctx, GetBitContext *gb)
{
    MpegEncContext *s = &ctx->m;
    int time_incr, time_increment;
    int64_t pts;

    s->mcsel       = 0;
    s->pict_type = get_bits(gb, 2) + AV_PICTURE_TYPE_I;        /* pict type: I = 0 , P = 1 */
    /* low_delay is cleared when a B-VOP shows up, unless the VOL carried
     * control parameters or AV_CODEC_FLAG_LOW_DELAY was requested */
    if (s->pict_type == AV_PICTURE_TYPE_B && s->low_delay &&
        ctx->vol_control_parameters == 0 && !(s->avctx->flags & AV_CODEC_FLAG_LOW_DELAY)) {
        av_log(s->avctx, AV_LOG_ERROR, "low_delay flag set incorrectly, clearing it\n");
        s->low_delay = 0;
    }

    /* B-VOPs are never treated as partitioned frames */
    s->partitioned_frame = s->data_partitioning && s->pict_type != AV_PICTURE_TYPE_B;
    if (s->partitioned_frame)
        s->decode_mb = mpeg4_decode_partitioned_mb;
    else
        s->decode_mb = mpeg4_decode_mb;

    /* time_incr is unary coded: count the 1 bits up to the terminating 0 */
    time_incr = 0;
    while (get_bits1(gb) != 0)
        time_incr++;

    check_marker(s->avctx, gb, "before time_increment");

    /* The bit following the time_increment field is expected to be set. If it
     * is not (or no field width is known), probe widths 1..15 and keep the
     * first one whose trailing bits match the pattern tested below. */
    if (ctx->time_increment_bits == 0 ||
        !(show_bits(gb, ctx->time_increment_bits + 1) & 1)) {
        av_log(s->avctx, AV_LOG_WARNING,
               "time_increment_bits %d is invalid in relation to the current bitstream, this is likely caused by a missing VOL header\n", ctx->time_increment_bits);

        for (ctx->time_increment_bits = 1;
             ctx->time_increment_bits < 16;
             ctx->time_increment_bits++) {
            if (s->pict_type == AV_PICTURE_TYPE_P ||
                (s->pict_type == AV_PICTURE_TYPE_S &&
                 ctx->vol_sprite_usage == GMC_SPRITE)) {
                if ((show_bits(gb, ctx->time_increment_bits + 6) & 0x37) == 0x30)
                    break;
            } else if ((show_bits(gb, ctx->time_increment_bits + 5) & 0x1F) == 0x18)
                break;
        }

        av_log(s->avctx, AV_LOG_WARNING,
               "time_increment_bits set to %d bits, based on bitstream analysis\n", ctx->time_increment_bits);
        /* raise the frame rate numerator (and recompute time_base) when it is
         * too small for the guessed field width */
        if (s->avctx->framerate.num && 4*s->avctx->framerate.num < 1<<ctx->time_increment_bits) {
            s->avctx->framerate.num = 1<<ctx->time_increment_bits;
            s->avctx->time_base = av_inv_q(av_mul_q(s->avctx->framerate, (AVRational){s->avctx->ticks_per_frame, 1}));
        }
    }

    if (IS_3IV1)
        time_increment = get_bits1(gb);        // FIXME investigate further
    else
        time_increment = get_bits(gb, ctx->time_increment_bits);

    if (s->pict_type != AV_PICTURE_TYPE_B) {
        /* non-B VOP: advance the time base and remember the distance to the
         * previous non-B VOP in pp_time */
        s->last_time_base = s->time_base;
        s->time_base     += time_incr;
        s->time = s->time_base * (int64_t)s->avctx->framerate.num + time_increment;
        if (s->workaround_bugs & FF_BUG_UMP4) {
            if (s->time < s->last_non_b_time) {
                /* header is not mpeg-4-compatible, broken encoder,
                 * trying to workaround */
                s->time_base++;
                s->time += s->avctx->framerate.num;
            }
        }
        s->pp_time         = s->time - s->last_non_b_time;
        s->last_non_b_time = s->time;
    } else {
        /* B-VOP: its time is relative to last_time_base; pb_time is derived
         * from pp_time and the distance to the last non-B VOP */
        s->time    = (s->last_time_base + time_incr) * (int64_t)s->avctx->framerate.num + time_increment;
        s->pb_time = s->pp_time - (s->last_non_b_time - s->time);
        if (s->pp_time <= s->pb_time ||
            s->pp_time <= s->pp_time - s->pb_time ||
            s->pp_time <= 0) {
            /* messed up order, maybe after seeking? skipping current B-frame */
            return FRAME_SKIPPED;
        }
        ff_mpeg4_init_direct_mv(s);

        if (ctx->t_frame == 0)
            ctx->t_frame = s->pb_time;
        if (ctx->t_frame == 0)
            ctx->t_frame = 1;  // 1/0 protection
        s->pp_field_time = (ROUNDED_DIV(s->last_non_b_time, ctx->t_frame) -
                            ROUNDED_DIV(s->last_non_b_time - s->pp_time, ctx->t_frame)) * 2;
        s->pb_field_time = (ROUNDED_DIV(s->time, ctx->t_frame) -
                            ROUNDED_DIV(s->last_non_b_time - s->pp_time, ctx->t_frame)) * 2;
        /* fall back to fixed field distances when the computed ones are
         * unusable; non-progressive sequences skip the frame instead */
        if (s->pp_field_time <= s->pb_field_time || s->pb_field_time <= 1) {
            s->pb_field_time = 2;
            s->pp_field_time = 4;
            if (!s->progressive_sequence)
                return FRAME_SKIPPED;
        }
    }

    /* pts is only used for the debug log below */
    if (s->avctx->framerate.den)
        pts = ROUNDED_DIV(s->time, s->avctx->framerate.den);
    else
        pts = AV_NOPTS_VALUE;
    ff_dlog(s->avctx, "MPEG4 PTS: %"PRId64"\n", pts);

    check_marker(s->avctx, gb, "before vop_coded");

    /* vop coded */
    if (get_bits1(gb) != 1) {
        if (s->avctx->debug & FF_DEBUG_PICT_INFO)
            av_log(s->avctx, AV_LOG_ERROR, "vop not coded\n");
        return FRAME_SKIPPED;
    }
    if (ctx->new_pred)
        decode_new_pred(ctx, gb);

    /* the rounding bit is only read for P-VOPs and GMC S-VOPs */
    if (ctx->shape != BIN_ONLY_SHAPE &&
                    (s->pict_type == AV_PICTURE_TYPE_P ||
                     (s->pict_type == AV_PICTURE_TYPE_S &&
                      ctx->vol_sprite_usage == GMC_SPRITE))) {
        /* rounding type for motion estimation */
        s->no_rounding = get_bits1(gb);
    } else {
        s->no_rounding = 0;
    }
    // FIXME reduced res stuff

    /* non-rectangular shapes: the geometry fields are skipped, not used */
    if (ctx->shape != RECT_SHAPE) {
        if (ctx->vol_sprite_usage != 1 || s->pict_type != AV_PICTURE_TYPE_I) {
            skip_bits(gb, 13);  /* width */
            check_marker(s->avctx, gb, "after width");
            skip_bits(gb, 13);  /* height */
            check_marker(s->avctx, gb, "after height");
            skip_bits(gb, 13);  /* hor_spat_ref */
            check_marker(s->avctx, gb, "after hor_spat_ref");
            skip_bits(gb, 13);  /* ver_spat_ref */
        }
        skip_bits1(gb);         /* change_CR_disable */

        if (get_bits1(gb) != 0)
            skip_bits(gb, 8);   /* constant_alpha_value */
    }

    // FIXME complexity estimation stuff

    if (ctx->shape != BIN_ONLY_SHAPE) {
        /* skip the complexity estimation bits whose counts are stored in
         * the context */
        skip_bits_long(gb, ctx->cplx_estimation_trash_i);
        if (s->pict_type != AV_PICTURE_TYPE_I)
            skip_bits_long(gb, ctx->cplx_estimation_trash_p);
        if (s->pict_type == AV_PICTURE_TYPE_B)
            skip_bits_long(gb, ctx->cplx_estimation_trash_b);

        if (get_bits_left(gb) < 3) {
            av_log(s->avctx, AV_LOG_ERROR, "Header truncated\n");
            return AVERROR_INVALIDDATA;
        }
        ctx->intra_dc_threshold = ff_mpeg4_dc_threshold[get_bits(gb, 3)];
        if (!s->progressive_sequence) {
            s->top_field_first = get_bits1(gb);
            s->alternate_scan  = get_bits1(gb);
        } else
            s->alternate_scan = 0;
    }

    /* (re)build the scan tables for the selected scan order */
    if (s->alternate_scan) {
        ff_init_scantable(s->idsp.idct_permutation, &s->inter_scantable,   ff_alternate_vertical_scan);
        ff_init_scantable(s->idsp.idct_permutation, &s->intra_scantable,   ff_alternate_vertical_scan);
        ff_init_scantable(s->idsp.idct_permutation, &s->intra_h_scantable, ff_alternate_vertical_scan);
        ff_init_scantable(s->idsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
    } else {
        ff_init_scantable(s->idsp.idct_permutation, &s->inter_scantable,   ff_zigzag_direct);
        ff_init_scantable(s->idsp.idct_permutation, &s->intra_scantable,   ff_zigzag_direct);
        ff_init_scantable(s->idsp.idct_permutation, &s->intra_h_scantable, ff_alternate_horizontal_scan);
        ff_init_scantable(s->idsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
    }

    if (s->pict_type == AV_PICTURE_TYPE_S) {
        if((ctx->vol_sprite_usage == STATIC_SPRITE ||
            ctx->vol_sprite_usage == GMC_SPRITE)) {
            if (mpeg4_decode_sprite_trajectory(ctx, gb) < 0)
                return AVERROR_INVALIDDATA;
            /* unsupported features are only reported; parsing continues */
            if (ctx->sprite_brightness_change)
                av_log(s->avctx, AV_LOG_ERROR,
                    "sprite_brightness_change not supported\n");
            if (ctx->vol_sprite_usage == STATIC_SPRITE)
                av_log(s->avctx, AV_LOG_ERROR, "static sprite not supported\n");
        } else {
            memset(s->sprite_offset, 0, sizeof(s->sprite_offset));
            memset(s->sprite_delta, 0, sizeof(s->sprite_delta));
        }
    }

    if (ctx->shape != BIN_ONLY_SHAPE) {
        s->chroma_qscale = s->qscale = get_bits(gb, s->quant_precision);
        if (s->qscale == 0) {
            av_log(s->avctx, AV_LOG_ERROR,
                   "Error, header damaged or not MPEG-4 header (qscale=0)\n");
            return AVERROR_INVALIDDATA;  // makes no sense to continue, as there is nothing left from the image then
        }

        if (s->pict_type != AV_PICTURE_TYPE_I) {
            s->f_code = get_bits(gb, 3);        /* fcode_for */
            if (s->f_code == 0) {
                av_log(s->avctx, AV_LOG_ERROR,
                       "Error, header damaged or not MPEG-4 header (f_code=0)\n");
                /* leave a non-zero f_code behind even though we fail */
                s->f_code = 1;
                return AVERROR_INVALIDDATA;  // makes no sense to continue, as there is nothing left from the image then
            }
        } else
            s->f_code = 1;

        if (s->pict_type == AV_PICTURE_TYPE_B) {
            s->b_code = get_bits(gb, 3);
            if (s->b_code == 0) {
                av_log(s->avctx, AV_LOG_ERROR,
                       "Error, header damaged or not MPEG4 header (b_code=0)\n");
                /* leave a non-zero b_code behind even though we fail */
                s->b_code=1;
                return AVERROR_INVALIDDATA; // makes no sense to continue, as the MV decoding will break very quickly
            }
        } else
            s->b_code = 1;

        if (s->avctx->debug & FF_DEBUG_PICT_INFO) {
            av_log(s->avctx, AV_LOG_DEBUG,
                   "qp:%d fc:%d,%d %s size:%d pro:%d alt:%d top:%d %spel part:%d resync:%d w:%d a:%d rnd:%d vot:%d%s dc:%d ce:%d/%d/%d time:%"PRId64" tincr:%d\n",
                   s->qscale, s->f_code, s->b_code,
                   s->pict_type == AV_PICTURE_TYPE_I ? "I" : (s->pict_type == AV_PICTURE_TYPE_P ? "P" : (s->pict_type == AV_PICTURE_TYPE_B ? "B" : "S")),
                   gb->size_in_bits,s->progressive_sequence, s->alternate_scan,
                   s->top_field_first, s->quarter_sample ? "q" : "h",
                   s->data_partitioning, ctx->resync_marker,
                   ctx->num_sprite_warping_points, s->sprite_warping_accuracy,
                   1 - s->no_rounding, s->vo_type,
                   ctx->vol_control_parameters ? " VOLC" : " ", ctx->intra_dc_threshold,
                   ctx->cplx_estimation_trash_i, ctx->cplx_estimation_trash_p,
                   ctx->cplx_estimation_trash_b,
                   s->time,
                   time_increment
                  );
        }

        if (!ctx->scalability) {
            if (ctx->shape != RECT_SHAPE && s->pict_type != AV_PICTURE_TYPE_I)
                skip_bits1(gb);  // vop shape coding type
        } else {
            if (ctx->enhancement_type) {
                int load_backward_shape = get_bits1(gb);
                if (load_backward_shape)
                    av_log(s->avctx, AV_LOG_ERROR,
                           "load backward shape isn't supported\n");
            }
            skip_bits(gb, 2);  // ref_select_code
        }
    }
    /* detect buggy encoders which don't set the low_delay flag
     * (divx4/xvid/opendivx). Note we cannot detect divx5 without B-frames
     * easily (although it's buggy too) */
    if (s->vo_type == 0 && ctx->vol_control_parameters == 0 &&
        ctx->divx_version == -1 && s->picture_number == 0) {
        av_log(s->avctx, AV_LOG_WARNING,
               "looks like this file was encoded with (divx4/(old)xvid/opendivx) -> forcing low_delay flag\n");
        s->low_delay = 1;
    }

    s->picture_number++;  // better than pic number==0 always ;)

    // FIXME add short header support
    s->y_dc_scale_table = ff_mpeg4_y_dc_scale_table;
    s->c_dc_scale_table = ff_mpeg4_c_dc_scale_table;

    if (s->workaround_bugs & FF_BUG_EDGE) {
        s->h_edge_pos = s->width;
        s->v_edge_pos = s->height;
    }
    return 0;
}
  2726. static void decode_smpte_tc(Mpeg4DecContext *ctx, GetBitContext *gb)
  2727. {
  2728. MpegEncContext *s = &ctx->m;
  2729. skip_bits(gb, 16); /* Time_code[63..48] */
  2730. check_marker(s->avctx, gb, "after Time_code[63..48]");
  2731. skip_bits(gb, 16); /* Time_code[47..32] */
  2732. check_marker(s->avctx, gb, "after Time_code[47..32]");
  2733. skip_bits(gb, 16); /* Time_code[31..16] */
  2734. check_marker(s->avctx, gb, "after Time_code[31..16]");
  2735. skip_bits(gb, 16); /* Time_code[15..0] */
  2736. check_marker(s->avctx, gb, "after Time_code[15..0]");
  2737. skip_bits(gb, 4); /* reserved_bits */
  2738. }
  2739. /**
  2740. * Decode the next studio vop header.
  2741. * @return <0 if something went wrong
  2742. */
  2743. static int decode_studio_vop_header(Mpeg4DecContext *ctx, GetBitContext *gb)
  2744. {
  2745. MpegEncContext *s = &ctx->m;
  2746. if (get_bits_left(gb) <= 32)
  2747. return 0;
  2748. s->partitioned_frame = 0;
  2749. s->interlaced_dct = 0;
  2750. s->decode_mb = mpeg4_decode_studio_mb;
  2751. decode_smpte_tc(ctx, gb);
  2752. skip_bits(gb, 10); /* temporal_reference */
  2753. skip_bits(gb, 2); /* vop_structure */
  2754. s->pict_type = get_bits(gb, 2) + AV_PICTURE_TYPE_I; /* vop_coding_type */
  2755. if (get_bits1(gb)) { /* vop_coded */
  2756. skip_bits1(gb); /* top_field_first */
  2757. skip_bits1(gb); /* repeat_first_field */
  2758. s->progressive_frame = get_bits1(gb) ^ 1; /* progressive_frame */
  2759. }
  2760. if (s->pict_type == AV_PICTURE_TYPE_I) {
  2761. if (get_bits1(gb))
  2762. reset_studio_dc_predictors(s);
  2763. }
  2764. if (ctx->shape != BIN_ONLY_SHAPE) {
  2765. s->alternate_scan = get_bits1(gb);
  2766. s->frame_pred_frame_dct = get_bits1(gb);
  2767. s->dct_precision = get_bits(gb, 2);
  2768. s->intra_dc_precision = get_bits(gb, 2);
  2769. s->q_scale_type = get_bits1(gb);
  2770. }
  2771. if (s->alternate_scan) {
  2772. ff_init_scantable(s->idsp.idct_permutation, &s->inter_scantable, ff_alternate_vertical_scan);
  2773. ff_init_scantable(s->idsp.idct_permutation, &s->intra_scantable, ff_alternate_vertical_scan);
  2774. ff_init_scantable(s->idsp.idct_permutation, &s->intra_h_scantable, ff_alternate_vertical_scan);
  2775. ff_init_scantable(s->idsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
  2776. } else {
  2777. ff_init_scantable(s->idsp.idct_permutation, &s->inter_scantable, ff_zigzag_direct);
  2778. ff_init_scantable(s->idsp.idct_permutation, &s->intra_scantable, ff_zigzag_direct);
  2779. ff_init_scantable(s->idsp.idct_permutation, &s->intra_h_scantable, ff_alternate_horizontal_scan);
  2780. ff_init_scantable(s->idsp.idct_permutation, &s->intra_v_scantable, ff_alternate_vertical_scan);
  2781. }
  2782. mpeg4_load_default_matrices(s);
  2783. next_start_code_studio(gb);
  2784. extension_and_user_data(s, gb, 4);
  2785. return 0;
  2786. }
  2787. static int decode_studiovisualobject(Mpeg4DecContext *ctx, GetBitContext *gb)
  2788. {
  2789. MpegEncContext *s = &ctx->m;
  2790. int visual_object_type;
  2791. skip_bits(gb, 4); /* visual_object_verid */
  2792. visual_object_type = get_bits(gb, 4);
  2793. if (visual_object_type != VOT_VIDEO_ID) {
  2794. avpriv_request_sample(s->avctx, "VO type %u", visual_object_type);
  2795. return AVERROR_PATCHWELCOME;
  2796. }
  2797. next_start_code_studio(gb);
  2798. extension_and_user_data(s, gb, 1);
  2799. return 0;
  2800. }
/**
 * Decode MPEG-4 headers.
 *
 * Scans gb for start codes and dispatches VOL, user data, GOP, VOS and
 * visual object headers to their parsers until a VOP start code is found,
 * then parses the (studio or regular) VOP header.
 *
 * @param header If set the absence of a VOP is not treated as error; otherwise, it is treated as such.
 * @return <0 if an error occurred
 *         FRAME_SKIPPED if a not coded VOP is found
 *         0 else
 */
int ff_mpeg4_decode_picture_header(Mpeg4DecContext *ctx, GetBitContext *gb, int header)
{
    MpegEncContext *s = &ctx->m;
    unsigned startcode, v;
    int ret;
    int vol = 0; /* number of VOL headers decoded during this call */

    /* search next start code */
    align_get_bits(gb);

    // If we have not switched to studio profile then we also did not switch bps;
    // that means something else (like a previous instance) outside set bps, which
    // would be inconsistent with the current state, thus reset it
    if (!s->studio_profile && s->avctx->bits_per_raw_sample != 8)
        s->avctx->bits_per_raw_sample = 0;

    /* WV1F streams: a 0x575630 prefix followed by 0xF0 goes straight to the
     * VOP header parsing at the end of this function */
    if (s->codec_tag == AV_RL32("WV1F") && show_bits(gb, 24) == 0x575630) {
        skip_bits(gb, 24);
        if (get_bits(gb, 8) == 0xF0)
            goto end;
    }

    startcode = 0xff;
    for (;;) {
        /* ran out of data without finding a VOP start code */
        if (get_bits_count(gb) >= gb->size_in_bits) {
            if (gb->size_in_bits == 8 &&
                (ctx->divx_version >= 0 || ctx->xvid_build >= 0) || s->codec_tag == AV_RL32("QMP4")) {
                av_log(s->avctx, AV_LOG_VERBOSE, "frame skip %d\n", gb->size_in_bits);
                return FRAME_SKIPPED;  // divx bug
            } else if (header && get_bits_count(gb) == gb->size_in_bits) {
                return 0; // ordinary return value for parsing of extradata
            } else
                return AVERROR_INVALIDDATA;  // end of stream
        }

        /* use the bits after the test */
        v = get_bits(gb, 8);
        /* shift the new byte into the 32-bit start code window */
        startcode = ((startcode << 8) | v) & 0xffffffff;

        if ((startcode & 0xFFFFFF00) != 0x100)
            continue;  // no startcode

        /* debug only: print a name for the start code that was found */
        if (s->avctx->debug & FF_DEBUG_STARTCODE) {
            av_log(s->avctx, AV_LOG_DEBUG, "startcode: %3X ", startcode);
            if (startcode <= 0x11F)
                av_log(s->avctx, AV_LOG_DEBUG, "Video Object Start");
            else if (startcode <= 0x12F)
                av_log(s->avctx, AV_LOG_DEBUG, "Video Object Layer Start");
            else if (startcode <= 0x13F)
                av_log(s->avctx, AV_LOG_DEBUG, "Reserved");
            else if (startcode <= 0x15F)
                av_log(s->avctx, AV_LOG_DEBUG, "FGS bp start");
            else if (startcode <= 0x1AF)
                av_log(s->avctx, AV_LOG_DEBUG, "Reserved");
            else if (startcode == 0x1B0)
                av_log(s->avctx, AV_LOG_DEBUG, "Visual Object Seq Start");
            else if (startcode == 0x1B1)
                av_log(s->avctx, AV_LOG_DEBUG, "Visual Object Seq End");
            else if (startcode == 0x1B2)
                av_log(s->avctx, AV_LOG_DEBUG, "User Data");
            else if (startcode == 0x1B3)
                av_log(s->avctx, AV_LOG_DEBUG, "Group of VOP start");
            else if (startcode == 0x1B4)
                av_log(s->avctx, AV_LOG_DEBUG, "Video Session Error");
            else if (startcode == 0x1B5)
                av_log(s->avctx, AV_LOG_DEBUG, "Visual Object Start");
            else if (startcode == 0x1B6)
                av_log(s->avctx, AV_LOG_DEBUG, "Video Object Plane start");
            else if (startcode == 0x1B7)
                av_log(s->avctx, AV_LOG_DEBUG, "slice start");
            else if (startcode == 0x1B8)
                av_log(s->avctx, AV_LOG_DEBUG, "extension start");
            else if (startcode == 0x1B9)
                av_log(s->avctx, AV_LOG_DEBUG, "fgs start");
            else if (startcode == 0x1BA)
                av_log(s->avctx, AV_LOG_DEBUG, "FBA Object start");
            else if (startcode == 0x1BB)
                av_log(s->avctx, AV_LOG_DEBUG, "FBA Object Plane start");
            else if (startcode == 0x1BC)
                av_log(s->avctx, AV_LOG_DEBUG, "Mesh Object start");
            else if (startcode == 0x1BD)
                av_log(s->avctx, AV_LOG_DEBUG, "Mesh Object Plane start");
            else if (startcode == 0x1BE)
                av_log(s->avctx, AV_LOG_DEBUG, "Still Texture Object start");
            else if (startcode == 0x1BF)
                av_log(s->avctx, AV_LOG_DEBUG, "Texture Spatial Layer start");
            else if (startcode == 0x1C0)
                av_log(s->avctx, AV_LOG_DEBUG, "Texture SNR Layer start");
            else if (startcode == 0x1C1)
                av_log(s->avctx, AV_LOG_DEBUG, "Texture Tile start");
            else if (startcode == 0x1C2)
                av_log(s->avctx, AV_LOG_DEBUG, "Texture Shape Layer start");
            else if (startcode == 0x1C3)
                av_log(s->avctx, AV_LOG_DEBUG, "stuffing start");
            else if (startcode <= 0x1C5)
                av_log(s->avctx, AV_LOG_DEBUG, "reserved");
            else if (startcode <= 0x1FF)
                av_log(s->avctx, AV_LOG_DEBUG, "System start");
            av_log(s->avctx, AV_LOG_DEBUG, " at %d\n", get_bits_count(gb));
        }

        if (startcode >= 0x120 && startcode <= 0x12F) {
            /* only the first VOL header seen in this call is decoded */
            if (vol) {
                av_log(s->avctx, AV_LOG_WARNING, "Ignoring multiple VOL headers\n");
                continue;
            }
            vol++;
            if ((ret = decode_vol_header(ctx, gb)) < 0)
                return ret;
        } else if (startcode == USER_DATA_STARTCODE) {
            decode_user_data(ctx, gb);
        } else if (startcode == GOP_STARTCODE) {
            mpeg4_decode_gop_header(s, gb);
        } else if (startcode == VOS_STARTCODE) {
            int profile, level;
            mpeg4_decode_profile_level(s, gb, &profile, &level);
            /* simple studio profile at levels 1..8 switches to studio mode;
             * leaving studio mode again is not supported */
            if (profile == FF_PROFILE_MPEG4_SIMPLE_STUDIO &&
                (level > 0 && level < 9)) {
                s->studio_profile = 1;
                next_start_code_studio(gb);
                extension_and_user_data(s, gb, 0);
            } else if (s->studio_profile) {
                avpriv_request_sample(s->avctx, "Mix of studio and non studio profile");
                return AVERROR_PATCHWELCOME;
            }
            s->avctx->profile = profile;
            s->avctx->level   = level;
        } else if (startcode == VISUAL_OBJ_STARTCODE) {
            if (s->studio_profile) {
                if ((ret = decode_studiovisualobject(ctx, gb)) < 0)
                    return ret;
            } else
                mpeg4_decode_visual_object(s, gb);
        } else if (startcode == VOP_STARTCODE) {
            break;
        }

        /* restart the search on a byte boundary after the handled header */
        align_get_bits(gb);
        startcode = 0xff;
    }

end:
    /* a user-requested low delay overrides whatever the headers said */
    if (s->avctx->flags & AV_CODEC_FLAG_LOW_DELAY)
        s->low_delay = 1;
    s->avctx->has_b_frames = !s->low_delay;

    if (s->studio_profile) {
        /* bits_per_raw_sample still being 0 here is treated as a missing VOL header */
        if (!s->avctx->bits_per_raw_sample) {
            av_log(s->avctx, AV_LOG_ERROR, "Missing VOL header\n");
            return AVERROR_INVALIDDATA;
        }
        return decode_studio_vop_header(ctx, gb);
    } else
        return decode_vop_header(ctx, gb);
}
  2953. av_cold void ff_mpeg4videodec_static_init(void) {
  2954. static int done = 0;
  2955. if (!done) {
  2956. ff_rl_init(&ff_mpeg4_rl_intra, ff_mpeg4_static_rl_table_store[0]);
  2957. ff_rl_init(&ff_rvlc_rl_inter, ff_mpeg4_static_rl_table_store[1]);
  2958. ff_rl_init(&ff_rvlc_rl_intra, ff_mpeg4_static_rl_table_store[2]);
  2959. INIT_FIRST_VLC_RL(ff_mpeg4_rl_intra, 554);
  2960. INIT_VLC_RL(ff_rvlc_rl_inter, 1072);
  2961. INIT_FIRST_VLC_RL(ff_rvlc_rl_intra, 1072);
  2962. INIT_VLC_STATIC(&dc_lum, DC_VLC_BITS, 10 /* 13 */,
  2963. &ff_mpeg4_DCtab_lum[0][1], 2, 1,
  2964. &ff_mpeg4_DCtab_lum[0][0], 2, 1, 512);
  2965. INIT_VLC_STATIC(&dc_chrom, DC_VLC_BITS, 10 /* 13 */,
  2966. &ff_mpeg4_DCtab_chrom[0][1], 2, 1,
  2967. &ff_mpeg4_DCtab_chrom[0][0], 2, 1, 512);
  2968. INIT_VLC_STATIC_FROM_LENGTHS(&sprite_trajectory, SPRITE_TRAJ_VLC_BITS, 15,
  2969. ff_sprite_trajectory_lens, 1,
  2970. NULL, 0, 0, 0, 0, 128);
  2971. INIT_VLC_STATIC(&mb_type_b_vlc, MB_TYPE_B_VLC_BITS, 4,
  2972. &ff_mb_type_b_tab[0][1], 2, 1,
  2973. &ff_mb_type_b_tab[0][0], 2, 1, 16);
  2974. done = 1;
  2975. }
  2976. }
  2977. int ff_mpeg4_frame_end(AVCodecContext *avctx, const uint8_t *buf, int buf_size)
  2978. {
  2979. Mpeg4DecContext *ctx = avctx->priv_data;
  2980. MpegEncContext *s = &ctx->m;
  2981. /* divx 5.01+ bitstream reorder stuff */
  2982. /* Since this clobbers the input buffer and hwaccel codecs still need the
  2983. * data during hwaccel->end_frame we should not do this any earlier */
  2984. if (s->divx_packed) {
  2985. int current_pos = s->gb.buffer == s->bitstream_buffer ? 0 : (get_bits_count(&s->gb) >> 3);
  2986. int startcode_found = 0;
  2987. if (buf_size - current_pos > 7) {
  2988. int i;
  2989. for (i = current_pos; i < buf_size - 4; i++)
  2990. if (buf[i] == 0 &&
  2991. buf[i + 1] == 0 &&
  2992. buf[i + 2] == 1 &&
  2993. buf[i + 3] == 0xB6) {
  2994. startcode_found = !(buf[i + 4] & 0x40);
  2995. break;
  2996. }
  2997. }
  2998. if (startcode_found) {
  2999. if (!ctx->showed_packed_warning) {
  3000. av_log(s->avctx, AV_LOG_INFO, "Video uses a non-standard and "
  3001. "wasteful way to store B-frames ('packed B-frames'). "
  3002. "Consider using the mpeg4_unpack_bframes bitstream filter without encoding but stream copy to fix it.\n");
  3003. ctx->showed_packed_warning = 1;
  3004. }
  3005. av_fast_padded_malloc(&s->bitstream_buffer,
  3006. &s->allocated_bitstream_buffer_size,
  3007. buf_size - current_pos);
  3008. if (!s->bitstream_buffer) {
  3009. s->bitstream_buffer_size = 0;
  3010. return AVERROR(ENOMEM);
  3011. }
  3012. memcpy(s->bitstream_buffer, buf + current_pos,
  3013. buf_size - current_pos);
  3014. s->bitstream_buffer_size = buf_size - current_pos;
  3015. }
  3016. }
  3017. return 0;
  3018. }
  3019. #if HAVE_THREADS
  3020. static int mpeg4_update_thread_context(AVCodecContext *dst,
  3021. const AVCodecContext *src)
  3022. {
  3023. Mpeg4DecContext *s = dst->priv_data;
  3024. const Mpeg4DecContext *s1 = src->priv_data;
  3025. int init = s->m.context_initialized;
  3026. int ret = ff_mpeg_update_thread_context(dst, src);
  3027. if (ret < 0)
  3028. return ret;
  3029. // copy all the necessary fields explicitly
  3030. s->time_increment_bits = s1->time_increment_bits;
  3031. s->shape = s1->shape;
  3032. s->vol_sprite_usage = s1->vol_sprite_usage;
  3033. s->sprite_brightness_change = s1->sprite_brightness_change;
  3034. s->num_sprite_warping_points = s1->num_sprite_warping_points;
  3035. s->rvlc = s1->rvlc;
  3036. s->resync_marker = s1->resync_marker;
  3037. s->t_frame = s1->t_frame;
  3038. s->new_pred = s1->new_pred;
  3039. s->enhancement_type = s1->enhancement_type;
  3040. s->scalability = s1->scalability;
  3041. s->use_intra_dc_vlc = s1->use_intra_dc_vlc;
  3042. s->intra_dc_threshold = s1->intra_dc_threshold;
  3043. s->divx_version = s1->divx_version;
  3044. s->divx_build = s1->divx_build;
  3045. s->xvid_build = s1->xvid_build;
  3046. s->lavc_build = s1->lavc_build;
  3047. s->showed_packed_warning = s1->showed_packed_warning;
  3048. s->vol_control_parameters = s1->vol_control_parameters;
  3049. s->cplx_estimation_trash_i = s1->cplx_estimation_trash_i;
  3050. s->cplx_estimation_trash_p = s1->cplx_estimation_trash_p;
  3051. s->cplx_estimation_trash_b = s1->cplx_estimation_trash_b;
  3052. s->rgb = s1->rgb;
  3053. memcpy(s->sprite_shift, s1->sprite_shift, sizeof(s1->sprite_shift));
  3054. memcpy(s->sprite_traj, s1->sprite_traj, sizeof(s1->sprite_traj));
  3055. if (CONFIG_MPEG4_DECODER && !init && s1->xvid_build >= 0)
  3056. ff_xvid_idct_init(&s->m.idsp, dst);
  3057. return 0;
  3058. }
  3059. #endif
  3060. static av_cold void mpeg4_init_static(void)
  3061. {
  3062. INIT_VLC_STATIC_FROM_LENGTHS(&studio_luma_dc, STUDIO_INTRA_BITS, 19,
  3063. &ff_mpeg4_studio_dc_luma[0][1], 2,
  3064. &ff_mpeg4_studio_dc_luma[0][0], 2, 1,
  3065. 0, 0, 528);
  3066. INIT_VLC_STATIC_FROM_LENGTHS(&studio_chroma_dc, STUDIO_INTRA_BITS, 19,
  3067. &ff_mpeg4_studio_dc_chroma[0][1], 2,
  3068. &ff_mpeg4_studio_dc_chroma[0][0], 2, 1,
  3069. 0, 0, 528);
  3070. for (unsigned i = 0, offset = 0; i < 12; i++) {
  3071. static VLC_TYPE vlc_buf[6498][2];
  3072. studio_intra_tab[i].table = &vlc_buf[offset];
  3073. studio_intra_tab[i].table_allocated = FF_ARRAY_ELEMS(vlc_buf) - offset;
  3074. ff_init_vlc_from_lengths(&studio_intra_tab[i],
  3075. STUDIO_INTRA_BITS, 24,
  3076. &ff_mpeg4_studio_intra[i][0][1], 2,
  3077. &ff_mpeg4_studio_intra[i][0][0], 2, 1,
  3078. 0, INIT_VLC_STATIC_OVERLONG, NULL);
  3079. offset += studio_intra_tab[i].table_size;
  3080. }
  3081. ff_mpeg4videodec_static_init();
  3082. }
  3083. static av_cold int decode_init(AVCodecContext *avctx)
  3084. {
  3085. static AVOnce init_static_once = AV_ONCE_INIT;
  3086. Mpeg4DecContext *ctx = avctx->priv_data;
  3087. MpegEncContext *s = &ctx->m;
  3088. int ret;
  3089. ctx->divx_version =
  3090. ctx->divx_build =
  3091. ctx->xvid_build =
  3092. ctx->lavc_build = -1;
  3093. if ((ret = ff_h263_decode_init(avctx)) < 0)
  3094. return ret;
  3095. s->h263_pred = 1;
  3096. s->low_delay = 0; /* default, might be overridden in the vol header during header parsing */
  3097. s->decode_mb = mpeg4_decode_mb;
  3098. ctx->time_increment_bits = 4; /* default value for broken headers */
  3099. avctx->chroma_sample_location = AVCHROMA_LOC_LEFT;
  3100. ff_thread_once(&init_static_once, mpeg4_init_static);
  3101. return 0;
  3102. }
  3103. #define OFFSET(x) offsetof(MpegEncContext, x)
  3104. #define FLAGS AV_OPT_FLAG_EXPORT | AV_OPT_FLAG_READONLY
  3105. static const AVOption mpeg4_options[] = {
  3106. {"quarter_sample", "1/4 subpel MC", OFFSET(quarter_sample), AV_OPT_TYPE_BOOL, {.i64 = 0}, 0, 1, FLAGS},
  3107. {"divx_packed", "divx style packed b frames", OFFSET(divx_packed), AV_OPT_TYPE_BOOL, {.i64 = 0}, 0, 1, FLAGS},
  3108. {NULL}
  3109. };
  3110. static const AVClass mpeg4_class = {
  3111. .class_name = "MPEG4 Video Decoder",
  3112. .item_name = av_default_item_name,
  3113. .option = mpeg4_options,
  3114. .version = LIBAVUTIL_VERSION_INT,
  3115. };
  3116. AVCodec ff_mpeg4_decoder = {
  3117. .name = "mpeg4",
  3118. .long_name = NULL_IF_CONFIG_SMALL("MPEG-4 part 2"),
  3119. .type = AVMEDIA_TYPE_VIDEO,
  3120. .id = AV_CODEC_ID_MPEG4,
  3121. .priv_data_size = sizeof(Mpeg4DecContext),
  3122. .init = decode_init,
  3123. .close = ff_h263_decode_end,
  3124. .decode = ff_h263_decode_frame,
  3125. .capabilities = AV_CODEC_CAP_DRAW_HORIZ_BAND | AV_CODEC_CAP_DR1 |
  3126. AV_CODEC_CAP_TRUNCATED | AV_CODEC_CAP_DELAY |
  3127. AV_CODEC_CAP_FRAME_THREADS,
  3128. .caps_internal = FF_CODEC_CAP_SKIP_FRAME_FILL_PARAM |
  3129. FF_CODEC_CAP_ALLOCATE_PROGRESS,
  3130. .flush = ff_mpeg_flush,
  3131. .max_lowres = 3,
  3132. .pix_fmts = ff_h263_hwaccel_pixfmt_list_420,
  3133. .profiles = NULL_IF_CONFIG_SMALL(ff_mpeg4_video_profiles),
  3134. .update_thread_context = ONLY_IF_THREADS_ENABLED(mpeg4_update_thread_context),
  3135. .priv_class = &mpeg4_class,
  3136. .hw_configs = (const AVCodecHWConfigInternal *const []) {
  3137. #if CONFIG_MPEG4_NVDEC_HWACCEL
  3138. HWACCEL_NVDEC(mpeg4),
  3139. #endif
  3140. #if CONFIG_MPEG4_VAAPI_HWACCEL
  3141. HWACCEL_VAAPI(mpeg4),
  3142. #endif
  3143. #if CONFIG_MPEG4_VDPAU_HWACCEL
  3144. HWACCEL_VDPAU(mpeg4),
  3145. #endif
  3146. #if CONFIG_MPEG4_VIDEOTOOLBOX_HWACCEL
  3147. HWACCEL_VIDEOTOOLBOX(mpeg4),
  3148. #endif
  3149. NULL
  3150. },
  3151. };