You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

6233 lines
243KB

  1. /*
  2. * VC-1 and WMV3 decoder
  3. * Copyright (c) 2011 Mashiat Sarker Shakkhar
  4. * Copyright (c) 2006-2007 Konstantin Shishkov
  5. * Partly based on vc9.c (c) 2005 Anonymous, Alex Beregszaszi, Michael Niedermayer
  6. *
  7. * This file is part of Libav.
  8. *
  9. * Libav is free software; you can redistribute it and/or
  10. * modify it under the terms of the GNU Lesser General Public
  11. * License as published by the Free Software Foundation; either
  12. * version 2.1 of the License, or (at your option) any later version.
  13. *
  14. * Libav is distributed in the hope that it will be useful,
  15. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  16. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  17. * Lesser General Public License for more details.
  18. *
  19. * You should have received a copy of the GNU Lesser General Public
  20. * License along with Libav; if not, write to the Free Software
  21. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  22. */
  23. /**
  24. * @file
  25. * VC-1 and WMV3 decoder
  26. */
  27. #include "internal.h"
  28. #include "avcodec.h"
  29. #include "error_resilience.h"
  30. #include "mpeg_er.h"
  31. #include "mpegutils.h"
  32. #include "mpegvideo.h"
  33. #include "h263.h"
  34. #include "h264chroma.h"
  35. #include "qpeldsp.h"
  36. #include "vc1.h"
  37. #include "vc1data.h"
  38. #include "vc1acdata.h"
  39. #include "msmpeg4data.h"
  40. #include "unary.h"
  41. #include "mathops.h"
  42. #undef NDEBUG
  43. #include <assert.h>
  44. #define MB_INTRA_VLC_BITS 9
  45. #define DC_VLC_BITS 9
  46. // offset tables for interlaced picture MVDATA decoding
  47. static const int offset_table1[9] = { 0, 1, 2, 4, 8, 16, 32, 64, 128 };
  48. static const int offset_table2[9] = { 0, 1, 3, 7, 15, 31, 63, 127, 255 };
  49. /***********************************************************************/
  50. /**
  51. * @name VC-1 Bitplane decoding
  52. * @see 8.7, p56
  53. * @{
  54. */
  55. /**
  56. * Imode types
  57. * @{
  58. */
  59. enum Imode {
  60. IMODE_RAW,
  61. IMODE_NORM2,
  62. IMODE_DIFF2,
  63. IMODE_NORM6,
  64. IMODE_DIFF6,
  65. IMODE_ROWSKIP,
  66. IMODE_COLSKIP
  67. };
  68. /** @} */ //imode defines
  69. static void init_block_index(VC1Context *v)
  70. {
  71. MpegEncContext *s = &v->s;
  72. ff_init_block_index(s);
  73. if (v->field_mode && !(v->second_field ^ v->tff)) {
  74. s->dest[0] += s->current_picture_ptr->f->linesize[0];
  75. s->dest[1] += s->current_picture_ptr->f->linesize[1];
  76. s->dest[2] += s->current_picture_ptr->f->linesize[2];
  77. }
  78. }
  79. /** @} */ //Bitplane group
  80. static void vc1_put_signed_blocks_clamped(VC1Context *v)
  81. {
  82. MpegEncContext *s = &v->s;
  83. int topleft_mb_pos, top_mb_pos;
  84. int stride_y, fieldtx = 0;
  85. int v_dist;
  86. /* The put pixels loop is always one MB row behind the decoding loop,
  87. * because we can only put pixels when overlap filtering is done, and
  88. * for filtering of the bottom edge of a MB, we need the next MB row
  89. * present as well.
  90. * Within the row, the put pixels loop is also one MB col behind the
  91. * decoding loop. The reason for this is again, because for filtering
  92. * of the right MB edge, we need the next MB present. */
  93. if (!s->first_slice_line) {
  94. if (s->mb_x) {
  95. topleft_mb_pos = (s->mb_y - 1) * s->mb_stride + s->mb_x - 1;
  96. if (v->fcm == ILACE_FRAME)
  97. fieldtx = v->fieldtx_plane[topleft_mb_pos];
  98. stride_y = s->linesize << fieldtx;
  99. v_dist = (16 - fieldtx) >> (fieldtx == 0);
  100. s->idsp.put_signed_pixels_clamped(v->block[v->topleft_blk_idx][0],
  101. s->dest[0] - 16 * s->linesize - 16,
  102. stride_y);
  103. s->idsp.put_signed_pixels_clamped(v->block[v->topleft_blk_idx][1],
  104. s->dest[0] - 16 * s->linesize - 8,
  105. stride_y);
  106. s->idsp.put_signed_pixels_clamped(v->block[v->topleft_blk_idx][2],
  107. s->dest[0] - v_dist * s->linesize - 16,
  108. stride_y);
  109. s->idsp.put_signed_pixels_clamped(v->block[v->topleft_blk_idx][3],
  110. s->dest[0] - v_dist * s->linesize - 8,
  111. stride_y);
  112. s->idsp.put_signed_pixels_clamped(v->block[v->topleft_blk_idx][4],
  113. s->dest[1] - 8 * s->uvlinesize - 8,
  114. s->uvlinesize);
  115. s->idsp.put_signed_pixels_clamped(v->block[v->topleft_blk_idx][5],
  116. s->dest[2] - 8 * s->uvlinesize - 8,
  117. s->uvlinesize);
  118. }
  119. if (s->mb_x == s->mb_width - 1) {
  120. top_mb_pos = (s->mb_y - 1) * s->mb_stride + s->mb_x;
  121. if (v->fcm == ILACE_FRAME)
  122. fieldtx = v->fieldtx_plane[top_mb_pos];
  123. stride_y = s->linesize << fieldtx;
  124. v_dist = fieldtx ? 15 : 8;
  125. s->idsp.put_signed_pixels_clamped(v->block[v->top_blk_idx][0],
  126. s->dest[0] - 16 * s->linesize,
  127. stride_y);
  128. s->idsp.put_signed_pixels_clamped(v->block[v->top_blk_idx][1],
  129. s->dest[0] - 16 * s->linesize + 8,
  130. stride_y);
  131. s->idsp.put_signed_pixels_clamped(v->block[v->top_blk_idx][2],
  132. s->dest[0] - v_dist * s->linesize,
  133. stride_y);
  134. s->idsp.put_signed_pixels_clamped(v->block[v->top_blk_idx][3],
  135. s->dest[0] - v_dist * s->linesize + 8,
  136. stride_y);
  137. s->idsp.put_signed_pixels_clamped(v->block[v->top_blk_idx][4],
  138. s->dest[1] - 8 * s->uvlinesize,
  139. s->uvlinesize);
  140. s->idsp.put_signed_pixels_clamped(v->block[v->top_blk_idx][5],
  141. s->dest[2] - 8 * s->uvlinesize,
  142. s->uvlinesize);
  143. }
  144. }
  145. #define inc_blk_idx(idx) do { \
  146. idx++; \
  147. if (idx >= v->n_allocated_blks) \
  148. idx = 0; \
  149. } while (0)
  150. inc_blk_idx(v->topleft_blk_idx);
  151. inc_blk_idx(v->top_blk_idx);
  152. inc_blk_idx(v->left_blk_idx);
  153. inc_blk_idx(v->cur_blk_idx);
  154. }
  155. static void vc1_loop_filter_iblk(VC1Context *v, int pq)
  156. {
  157. MpegEncContext *s = &v->s;
  158. int j;
  159. if (!s->first_slice_line) {
  160. v->vc1dsp.vc1_v_loop_filter16(s->dest[0], s->linesize, pq);
  161. if (s->mb_x)
  162. v->vc1dsp.vc1_h_loop_filter16(s->dest[0] - 16 * s->linesize, s->linesize, pq);
  163. v->vc1dsp.vc1_h_loop_filter16(s->dest[0] - 16 * s->linesize + 8, s->linesize, pq);
  164. for (j = 0; j < 2; j++) {
  165. v->vc1dsp.vc1_v_loop_filter8(s->dest[j + 1], s->uvlinesize, pq);
  166. if (s->mb_x)
  167. v->vc1dsp.vc1_h_loop_filter8(s->dest[j + 1] - 8 * s->uvlinesize, s->uvlinesize, pq);
  168. }
  169. }
  170. v->vc1dsp.vc1_v_loop_filter16(s->dest[0] + 8 * s->linesize, s->linesize, pq);
  171. if (s->mb_y == s->end_mb_y - 1) {
  172. if (s->mb_x) {
  173. v->vc1dsp.vc1_h_loop_filter16(s->dest[0], s->linesize, pq);
  174. v->vc1dsp.vc1_h_loop_filter8(s->dest[1], s->uvlinesize, pq);
  175. v->vc1dsp.vc1_h_loop_filter8(s->dest[2], s->uvlinesize, pq);
  176. }
  177. v->vc1dsp.vc1_h_loop_filter16(s->dest[0] + 8, s->linesize, pq);
  178. }
  179. }
  180. static void vc1_loop_filter_iblk_delayed(VC1Context *v, int pq)
  181. {
  182. MpegEncContext *s = &v->s;
  183. int j;
  184. /* The loopfilter runs 1 row and 1 column behind the overlap filter, which
  185. * means it runs two rows/cols behind the decoding loop. */
  186. if (!s->first_slice_line) {
  187. if (s->mb_x) {
  188. if (s->mb_y >= s->start_mb_y + 2) {
  189. v->vc1dsp.vc1_v_loop_filter16(s->dest[0] - 16 * s->linesize - 16, s->linesize, pq);
  190. if (s->mb_x >= 2)
  191. v->vc1dsp.vc1_h_loop_filter16(s->dest[0] - 32 * s->linesize - 16, s->linesize, pq);
  192. v->vc1dsp.vc1_h_loop_filter16(s->dest[0] - 32 * s->linesize - 8, s->linesize, pq);
  193. for (j = 0; j < 2; j++) {
  194. v->vc1dsp.vc1_v_loop_filter8(s->dest[j + 1] - 8 * s->uvlinesize - 8, s->uvlinesize, pq);
  195. if (s->mb_x >= 2) {
  196. v->vc1dsp.vc1_h_loop_filter8(s->dest[j + 1] - 16 * s->uvlinesize - 8, s->uvlinesize, pq);
  197. }
  198. }
  199. }
  200. v->vc1dsp.vc1_v_loop_filter16(s->dest[0] - 8 * s->linesize - 16, s->linesize, pq);
  201. }
  202. if (s->mb_x == s->mb_width - 1) {
  203. if (s->mb_y >= s->start_mb_y + 2) {
  204. v->vc1dsp.vc1_v_loop_filter16(s->dest[0] - 16 * s->linesize, s->linesize, pq);
  205. if (s->mb_x)
  206. v->vc1dsp.vc1_h_loop_filter16(s->dest[0] - 32 * s->linesize, s->linesize, pq);
  207. v->vc1dsp.vc1_h_loop_filter16(s->dest[0] - 32 * s->linesize + 8, s->linesize, pq);
  208. for (j = 0; j < 2; j++) {
  209. v->vc1dsp.vc1_v_loop_filter8(s->dest[j + 1] - 8 * s->uvlinesize, s->uvlinesize, pq);
  210. if (s->mb_x >= 2) {
  211. v->vc1dsp.vc1_h_loop_filter8(s->dest[j + 1] - 16 * s->uvlinesize, s->uvlinesize, pq);
  212. }
  213. }
  214. }
  215. v->vc1dsp.vc1_v_loop_filter16(s->dest[0] - 8 * s->linesize, s->linesize, pq);
  216. }
  217. if (s->mb_y == s->end_mb_y) {
  218. if (s->mb_x) {
  219. if (s->mb_x >= 2)
  220. v->vc1dsp.vc1_h_loop_filter16(s->dest[0] - 16 * s->linesize - 16, s->linesize, pq);
  221. v->vc1dsp.vc1_h_loop_filter16(s->dest[0] - 16 * s->linesize - 8, s->linesize, pq);
  222. if (s->mb_x >= 2) {
  223. for (j = 0; j < 2; j++) {
  224. v->vc1dsp.vc1_h_loop_filter8(s->dest[j + 1] - 8 * s->uvlinesize - 8, s->uvlinesize, pq);
  225. }
  226. }
  227. }
  228. if (s->mb_x == s->mb_width - 1) {
  229. if (s->mb_x)
  230. v->vc1dsp.vc1_h_loop_filter16(s->dest[0] - 16 * s->linesize, s->linesize, pq);
  231. v->vc1dsp.vc1_h_loop_filter16(s->dest[0] - 16 * s->linesize + 8, s->linesize, pq);
  232. if (s->mb_x) {
  233. for (j = 0; j < 2; j++) {
  234. v->vc1dsp.vc1_h_loop_filter8(s->dest[j + 1] - 8 * s->uvlinesize, s->uvlinesize, pq);
  235. }
  236. }
  237. }
  238. }
  239. }
  240. }
  241. static void vc1_smooth_overlap_filter_iblk(VC1Context *v)
  242. {
  243. MpegEncContext *s = &v->s;
  244. int mb_pos;
  245. if (v->condover == CONDOVER_NONE)
  246. return;
  247. mb_pos = s->mb_x + s->mb_y * s->mb_stride;
  248. /* Within a MB, the horizontal overlap always runs before the vertical.
  249. * To accomplish that, we run the H on left and internal borders of the
  250. * currently decoded MB. Then, we wait for the next overlap iteration
  251. * to do H overlap on the right edge of this MB, before moving over and
  252. * running the V overlap. Therefore, the V overlap makes us trail by one
  253. * MB col and the H overlap filter makes us trail by one MB row. This
  254. * is reflected in the time at which we run the put_pixels loop. */
  255. if (v->condover == CONDOVER_ALL || v->pq >= 9 || v->over_flags_plane[mb_pos]) {
  256. if (s->mb_x && (v->condover == CONDOVER_ALL || v->pq >= 9 ||
  257. v->over_flags_plane[mb_pos - 1])) {
  258. v->vc1dsp.vc1_h_s_overlap(v->block[v->left_blk_idx][1],
  259. v->block[v->cur_blk_idx][0]);
  260. v->vc1dsp.vc1_h_s_overlap(v->block[v->left_blk_idx][3],
  261. v->block[v->cur_blk_idx][2]);
  262. if (!(s->flags & CODEC_FLAG_GRAY)) {
  263. v->vc1dsp.vc1_h_s_overlap(v->block[v->left_blk_idx][4],
  264. v->block[v->cur_blk_idx][4]);
  265. v->vc1dsp.vc1_h_s_overlap(v->block[v->left_blk_idx][5],
  266. v->block[v->cur_blk_idx][5]);
  267. }
  268. }
  269. v->vc1dsp.vc1_h_s_overlap(v->block[v->cur_blk_idx][0],
  270. v->block[v->cur_blk_idx][1]);
  271. v->vc1dsp.vc1_h_s_overlap(v->block[v->cur_blk_idx][2],
  272. v->block[v->cur_blk_idx][3]);
  273. if (s->mb_x == s->mb_width - 1) {
  274. if (!s->first_slice_line && (v->condover == CONDOVER_ALL || v->pq >= 9 ||
  275. v->over_flags_plane[mb_pos - s->mb_stride])) {
  276. v->vc1dsp.vc1_v_s_overlap(v->block[v->top_blk_idx][2],
  277. v->block[v->cur_blk_idx][0]);
  278. v->vc1dsp.vc1_v_s_overlap(v->block[v->top_blk_idx][3],
  279. v->block[v->cur_blk_idx][1]);
  280. if (!(s->flags & CODEC_FLAG_GRAY)) {
  281. v->vc1dsp.vc1_v_s_overlap(v->block[v->top_blk_idx][4],
  282. v->block[v->cur_blk_idx][4]);
  283. v->vc1dsp.vc1_v_s_overlap(v->block[v->top_blk_idx][5],
  284. v->block[v->cur_blk_idx][5]);
  285. }
  286. }
  287. v->vc1dsp.vc1_v_s_overlap(v->block[v->cur_blk_idx][0],
  288. v->block[v->cur_blk_idx][2]);
  289. v->vc1dsp.vc1_v_s_overlap(v->block[v->cur_blk_idx][1],
  290. v->block[v->cur_blk_idx][3]);
  291. }
  292. }
  293. if (s->mb_x && (v->condover == CONDOVER_ALL || v->over_flags_plane[mb_pos - 1])) {
  294. if (!s->first_slice_line && (v->condover == CONDOVER_ALL || v->pq >= 9 ||
  295. v->over_flags_plane[mb_pos - s->mb_stride - 1])) {
  296. v->vc1dsp.vc1_v_s_overlap(v->block[v->topleft_blk_idx][2],
  297. v->block[v->left_blk_idx][0]);
  298. v->vc1dsp.vc1_v_s_overlap(v->block[v->topleft_blk_idx][3],
  299. v->block[v->left_blk_idx][1]);
  300. if (!(s->flags & CODEC_FLAG_GRAY)) {
  301. v->vc1dsp.vc1_v_s_overlap(v->block[v->topleft_blk_idx][4],
  302. v->block[v->left_blk_idx][4]);
  303. v->vc1dsp.vc1_v_s_overlap(v->block[v->topleft_blk_idx][5],
  304. v->block[v->left_blk_idx][5]);
  305. }
  306. }
  307. v->vc1dsp.vc1_v_s_overlap(v->block[v->left_blk_idx][0],
  308. v->block[v->left_blk_idx][2]);
  309. v->vc1dsp.vc1_v_s_overlap(v->block[v->left_blk_idx][1],
  310. v->block[v->left_blk_idx][3]);
  311. }
  312. }
  313. /** Do motion compensation over 1 macroblock
  314. * Mostly adapted hpel_motion and qpel_motion from mpegvideo.c
  315. */
  316. static void vc1_mc_1mv(VC1Context *v, int dir)
  317. {
  318. MpegEncContext *s = &v->s;
  319. H264ChromaContext *h264chroma = &v->h264chroma;
  320. uint8_t *srcY, *srcU, *srcV;
  321. int dxy, mx, my, uvmx, uvmy, src_x, src_y, uvsrc_x, uvsrc_y;
  322. int v_edge_pos = s->v_edge_pos >> v->field_mode;
  323. int i;
  324. uint8_t (*luty)[256], (*lutuv)[256];
  325. int use_ic;
  326. if ((!v->field_mode ||
  327. (v->ref_field_type[dir] == 1 && v->cur_field_type == 1)) &&
  328. !v->s.last_picture.f->data[0])
  329. return;
  330. mx = s->mv[dir][0][0];
  331. my = s->mv[dir][0][1];
  332. // store motion vectors for further use in B frames
  333. if (s->pict_type == AV_PICTURE_TYPE_P) {
  334. for (i = 0; i < 4; i++) {
  335. s->current_picture.motion_val[1][s->block_index[i] + v->blocks_off][0] = mx;
  336. s->current_picture.motion_val[1][s->block_index[i] + v->blocks_off][1] = my;
  337. }
  338. }
  339. uvmx = (mx + ((mx & 3) == 3)) >> 1;
  340. uvmy = (my + ((my & 3) == 3)) >> 1;
  341. v->luma_mv[s->mb_x][0] = uvmx;
  342. v->luma_mv[s->mb_x][1] = uvmy;
  343. if (v->field_mode &&
  344. v->cur_field_type != v->ref_field_type[dir]) {
  345. my = my - 2 + 4 * v->cur_field_type;
  346. uvmy = uvmy - 2 + 4 * v->cur_field_type;
  347. }
  348. // fastuvmc shall be ignored for interlaced frame picture
  349. if (v->fastuvmc && (v->fcm != ILACE_FRAME)) {
  350. uvmx = uvmx + ((uvmx < 0) ? (uvmx & 1) : -(uvmx & 1));
  351. uvmy = uvmy + ((uvmy < 0) ? (uvmy & 1) : -(uvmy & 1));
  352. }
  353. if (!dir) {
  354. if (v->field_mode && (v->cur_field_type != v->ref_field_type[dir]) && v->second_field) {
  355. srcY = s->current_picture.f->data[0];
  356. srcU = s->current_picture.f->data[1];
  357. srcV = s->current_picture.f->data[2];
  358. luty = v->curr_luty;
  359. lutuv = v->curr_lutuv;
  360. use_ic = v->curr_use_ic;
  361. } else {
  362. srcY = s->last_picture.f->data[0];
  363. srcU = s->last_picture.f->data[1];
  364. srcV = s->last_picture.f->data[2];
  365. luty = v->last_luty;
  366. lutuv = v->last_lutuv;
  367. use_ic = v->last_use_ic;
  368. }
  369. } else {
  370. srcY = s->next_picture.f->data[0];
  371. srcU = s->next_picture.f->data[1];
  372. srcV = s->next_picture.f->data[2];
  373. luty = v->next_luty;
  374. lutuv = v->next_lutuv;
  375. use_ic = v->next_use_ic;
  376. }
  377. if (!srcY || !srcU) {
  378. av_log(v->s.avctx, AV_LOG_ERROR, "Referenced frame missing.\n");
  379. return;
  380. }
  381. src_x = s->mb_x * 16 + (mx >> 2);
  382. src_y = s->mb_y * 16 + (my >> 2);
  383. uvsrc_x = s->mb_x * 8 + (uvmx >> 2);
  384. uvsrc_y = s->mb_y * 8 + (uvmy >> 2);
  385. if (v->profile != PROFILE_ADVANCED) {
  386. src_x = av_clip( src_x, -16, s->mb_width * 16);
  387. src_y = av_clip( src_y, -16, s->mb_height * 16);
  388. uvsrc_x = av_clip(uvsrc_x, -8, s->mb_width * 8);
  389. uvsrc_y = av_clip(uvsrc_y, -8, s->mb_height * 8);
  390. } else {
  391. src_x = av_clip( src_x, -17, s->avctx->coded_width);
  392. src_y = av_clip( src_y, -18, s->avctx->coded_height + 1);
  393. uvsrc_x = av_clip(uvsrc_x, -8, s->avctx->coded_width >> 1);
  394. uvsrc_y = av_clip(uvsrc_y, -8, s->avctx->coded_height >> 1);
  395. }
  396. srcY += src_y * s->linesize + src_x;
  397. srcU += uvsrc_y * s->uvlinesize + uvsrc_x;
  398. srcV += uvsrc_y * s->uvlinesize + uvsrc_x;
  399. if (v->field_mode && v->ref_field_type[dir]) {
  400. srcY += s->current_picture_ptr->f->linesize[0];
  401. srcU += s->current_picture_ptr->f->linesize[1];
  402. srcV += s->current_picture_ptr->f->linesize[2];
  403. }
  404. /* for grayscale we should not try to read from unknown area */
  405. if (s->flags & CODEC_FLAG_GRAY) {
  406. srcU = s->edge_emu_buffer + 18 * s->linesize;
  407. srcV = s->edge_emu_buffer + 18 * s->linesize;
  408. }
  409. if (v->rangeredfrm || use_ic
  410. || s->h_edge_pos < 22 || v_edge_pos < 22
  411. || (unsigned)(src_x - s->mspel) > s->h_edge_pos - (mx&3) - 16 - s->mspel * 3
  412. || (unsigned)(src_y - 1) > v_edge_pos - (my&3) - 16 - 3) {
  413. uint8_t *uvbuf = s->edge_emu_buffer + 19 * s->linesize;
  414. srcY -= s->mspel * (1 + s->linesize);
  415. s->vdsp.emulated_edge_mc(s->edge_emu_buffer, srcY,
  416. s->linesize, s->linesize,
  417. 17 + s->mspel * 2, 17 + s->mspel * 2,
  418. src_x - s->mspel, src_y - s->mspel,
  419. s->h_edge_pos, v_edge_pos);
  420. srcY = s->edge_emu_buffer;
  421. s->vdsp.emulated_edge_mc(uvbuf, srcU,
  422. s->uvlinesize, s->uvlinesize,
  423. 8 + 1, 8 + 1,
  424. uvsrc_x, uvsrc_y, s->h_edge_pos >> 1, v_edge_pos >> 1);
  425. s->vdsp.emulated_edge_mc(uvbuf + 16, srcV,
  426. s->uvlinesize, s->uvlinesize,
  427. 8 + 1, 8 + 1,
  428. uvsrc_x, uvsrc_y, s->h_edge_pos >> 1, v_edge_pos >> 1);
  429. srcU = uvbuf;
  430. srcV = uvbuf + 16;
  431. /* if we deal with range reduction we need to scale source blocks */
  432. if (v->rangeredfrm) {
  433. int i, j;
  434. uint8_t *src, *src2;
  435. src = srcY;
  436. for (j = 0; j < 17 + s->mspel * 2; j++) {
  437. for (i = 0; i < 17 + s->mspel * 2; i++)
  438. src[i] = ((src[i] - 128) >> 1) + 128;
  439. src += s->linesize;
  440. }
  441. src = srcU;
  442. src2 = srcV;
  443. for (j = 0; j < 9; j++) {
  444. for (i = 0; i < 9; i++) {
  445. src[i] = ((src[i] - 128) >> 1) + 128;
  446. src2[i] = ((src2[i] - 128) >> 1) + 128;
  447. }
  448. src += s->uvlinesize;
  449. src2 += s->uvlinesize;
  450. }
  451. }
  452. /* if we deal with intensity compensation we need to scale source blocks */
  453. if (use_ic) {
  454. int i, j;
  455. uint8_t *src, *src2;
  456. src = srcY;
  457. for (j = 0; j < 17 + s->mspel * 2; j++) {
  458. int f = v->field_mode ? v->ref_field_type[dir] : ((j + src_y - s->mspel) & 1) ;
  459. for (i = 0; i < 17 + s->mspel * 2; i++)
  460. src[i] = luty[f][src[i]];
  461. src += s->linesize;
  462. }
  463. src = srcU;
  464. src2 = srcV;
  465. for (j = 0; j < 9; j++) {
  466. int f = v->field_mode ? v->ref_field_type[dir] : ((j + uvsrc_y) & 1);
  467. for (i = 0; i < 9; i++) {
  468. src[i] = lutuv[f][src[i]];
  469. src2[i] = lutuv[f][src2[i]];
  470. }
  471. src += s->uvlinesize;
  472. src2 += s->uvlinesize;
  473. }
  474. }
  475. srcY += s->mspel * (1 + s->linesize);
  476. }
  477. if (s->mspel) {
  478. dxy = ((my & 3) << 2) | (mx & 3);
  479. v->vc1dsp.put_vc1_mspel_pixels_tab[dxy](s->dest[0] , srcY , s->linesize, v->rnd);
  480. v->vc1dsp.put_vc1_mspel_pixels_tab[dxy](s->dest[0] + 8, srcY + 8, s->linesize, v->rnd);
  481. srcY += s->linesize * 8;
  482. v->vc1dsp.put_vc1_mspel_pixels_tab[dxy](s->dest[0] + 8 * s->linesize , srcY , s->linesize, v->rnd);
  483. v->vc1dsp.put_vc1_mspel_pixels_tab[dxy](s->dest[0] + 8 * s->linesize + 8, srcY + 8, s->linesize, v->rnd);
  484. } else { // hpel mc - always used for luma
  485. dxy = (my & 2) | ((mx & 2) >> 1);
  486. if (!v->rnd)
  487. s->hdsp.put_pixels_tab[0][dxy](s->dest[0], srcY, s->linesize, 16);
  488. else
  489. s->hdsp.put_no_rnd_pixels_tab[0][dxy](s->dest[0], srcY, s->linesize, 16);
  490. }
  491. if (s->flags & CODEC_FLAG_GRAY) return;
  492. /* Chroma MC always uses qpel bilinear */
  493. uvmx = (uvmx & 3) << 1;
  494. uvmy = (uvmy & 3) << 1;
  495. if (!v->rnd) {
  496. h264chroma->put_h264_chroma_pixels_tab[0](s->dest[1], srcU, s->uvlinesize, 8, uvmx, uvmy);
  497. h264chroma->put_h264_chroma_pixels_tab[0](s->dest[2], srcV, s->uvlinesize, 8, uvmx, uvmy);
  498. } else {
  499. v->vc1dsp.put_no_rnd_vc1_chroma_pixels_tab[0](s->dest[1], srcU, s->uvlinesize, 8, uvmx, uvmy);
  500. v->vc1dsp.put_no_rnd_vc1_chroma_pixels_tab[0](s->dest[2], srcV, s->uvlinesize, 8, uvmx, uvmy);
  501. }
  502. }
  503. static inline int median4(int a, int b, int c, int d)
  504. {
  505. if (a < b) {
  506. if (c < d) return (FFMIN(b, d) + FFMAX(a, c)) / 2;
  507. else return (FFMIN(b, c) + FFMAX(a, d)) / 2;
  508. } else {
  509. if (c < d) return (FFMIN(a, d) + FFMAX(b, c)) / 2;
  510. else return (FFMIN(a, c) + FFMAX(b, d)) / 2;
  511. }
  512. }
  513. /** Do motion compensation for 4-MV macroblock - luminance block
  514. */
  515. static void vc1_mc_4mv_luma(VC1Context *v, int n, int dir, int avg)
  516. {
  517. MpegEncContext *s = &v->s;
  518. uint8_t *srcY;
  519. int dxy, mx, my, src_x, src_y;
  520. int off;
  521. int fieldmv = (v->fcm == ILACE_FRAME) ? v->blk_mv_type[s->block_index[n]] : 0;
  522. int v_edge_pos = s->v_edge_pos >> v->field_mode;
  523. uint8_t (*luty)[256];
  524. int use_ic;
  525. if ((!v->field_mode ||
  526. (v->ref_field_type[dir] == 1 && v->cur_field_type == 1)) &&
  527. !v->s.last_picture.f->data[0])
  528. return;
  529. mx = s->mv[dir][n][0];
  530. my = s->mv[dir][n][1];
  531. if (!dir) {
  532. if (v->field_mode && (v->cur_field_type != v->ref_field_type[dir]) && v->second_field) {
  533. srcY = s->current_picture.f->data[0];
  534. luty = v->curr_luty;
  535. use_ic = v->curr_use_ic;
  536. } else {
  537. srcY = s->last_picture.f->data[0];
  538. luty = v->last_luty;
  539. use_ic = v->last_use_ic;
  540. }
  541. } else {
  542. srcY = s->next_picture.f->data[0];
  543. luty = v->next_luty;
  544. use_ic = v->next_use_ic;
  545. }
  546. if (!srcY) {
  547. av_log(v->s.avctx, AV_LOG_ERROR, "Referenced frame missing.\n");
  548. return;
  549. }
  550. if (v->field_mode) {
  551. if (v->cur_field_type != v->ref_field_type[dir])
  552. my = my - 2 + 4 * v->cur_field_type;
  553. }
  554. if (s->pict_type == AV_PICTURE_TYPE_P && n == 3 && v->field_mode) {
  555. int same_count = 0, opp_count = 0, k;
  556. int chosen_mv[2][4][2], f;
  557. int tx, ty;
  558. for (k = 0; k < 4; k++) {
  559. f = v->mv_f[0][s->block_index[k] + v->blocks_off];
  560. chosen_mv[f][f ? opp_count : same_count][0] = s->mv[0][k][0];
  561. chosen_mv[f][f ? opp_count : same_count][1] = s->mv[0][k][1];
  562. opp_count += f;
  563. same_count += 1 - f;
  564. }
  565. f = opp_count > same_count;
  566. switch (f ? opp_count : same_count) {
  567. case 4:
  568. tx = median4(chosen_mv[f][0][0], chosen_mv[f][1][0],
  569. chosen_mv[f][2][0], chosen_mv[f][3][0]);
  570. ty = median4(chosen_mv[f][0][1], chosen_mv[f][1][1],
  571. chosen_mv[f][2][1], chosen_mv[f][3][1]);
  572. break;
  573. case 3:
  574. tx = mid_pred(chosen_mv[f][0][0], chosen_mv[f][1][0], chosen_mv[f][2][0]);
  575. ty = mid_pred(chosen_mv[f][0][1], chosen_mv[f][1][1], chosen_mv[f][2][1]);
  576. break;
  577. case 2:
  578. tx = (chosen_mv[f][0][0] + chosen_mv[f][1][0]) / 2;
  579. ty = (chosen_mv[f][0][1] + chosen_mv[f][1][1]) / 2;
  580. break;
  581. }
  582. s->current_picture.motion_val[1][s->block_index[0] + v->blocks_off][0] = tx;
  583. s->current_picture.motion_val[1][s->block_index[0] + v->blocks_off][1] = ty;
  584. for (k = 0; k < 4; k++)
  585. v->mv_f[1][s->block_index[k] + v->blocks_off] = f;
  586. }
  587. if (v->fcm == ILACE_FRAME) { // not sure if needed for other types of picture
  588. int qx, qy;
  589. int width = s->avctx->coded_width;
  590. int height = s->avctx->coded_height >> 1;
  591. if (s->pict_type == AV_PICTURE_TYPE_P) {
  592. s->current_picture.motion_val[1][s->block_index[n] + v->blocks_off][0] = mx;
  593. s->current_picture.motion_val[1][s->block_index[n] + v->blocks_off][1] = my;
  594. }
  595. qx = (s->mb_x * 16) + (mx >> 2);
  596. qy = (s->mb_y * 8) + (my >> 3);
  597. if (qx < -17)
  598. mx -= 4 * (qx + 17);
  599. else if (qx > width)
  600. mx -= 4 * (qx - width);
  601. if (qy < -18)
  602. my -= 8 * (qy + 18);
  603. else if (qy > height + 1)
  604. my -= 8 * (qy - height - 1);
  605. }
  606. if ((v->fcm == ILACE_FRAME) && fieldmv)
  607. off = ((n > 1) ? s->linesize : 0) + (n & 1) * 8;
  608. else
  609. off = s->linesize * 4 * (n & 2) + (n & 1) * 8;
  610. src_x = s->mb_x * 16 + (n & 1) * 8 + (mx >> 2);
  611. if (!fieldmv)
  612. src_y = s->mb_y * 16 + (n & 2) * 4 + (my >> 2);
  613. else
  614. src_y = s->mb_y * 16 + ((n > 1) ? 1 : 0) + (my >> 2);
  615. if (v->profile != PROFILE_ADVANCED) {
  616. src_x = av_clip(src_x, -16, s->mb_width * 16);
  617. src_y = av_clip(src_y, -16, s->mb_height * 16);
  618. } else {
  619. src_x = av_clip(src_x, -17, s->avctx->coded_width);
  620. if (v->fcm == ILACE_FRAME) {
  621. if (src_y & 1)
  622. src_y = av_clip(src_y, -17, s->avctx->coded_height + 1);
  623. else
  624. src_y = av_clip(src_y, -18, s->avctx->coded_height);
  625. } else {
  626. src_y = av_clip(src_y, -18, s->avctx->coded_height + 1);
  627. }
  628. }
  629. srcY += src_y * s->linesize + src_x;
  630. if (v->field_mode && v->ref_field_type[dir])
  631. srcY += s->current_picture_ptr->f->linesize[0];
  632. if (fieldmv && !(src_y & 1))
  633. v_edge_pos--;
  634. if (fieldmv && (src_y & 1) && src_y < 4)
  635. src_y--;
  636. if (v->rangeredfrm || use_ic
  637. || s->h_edge_pos < 13 || v_edge_pos < 23
  638. || (unsigned)(src_x - s->mspel) > s->h_edge_pos - (mx & 3) - 8 - s->mspel * 2
  639. || (unsigned)(src_y - (s->mspel << fieldmv)) > v_edge_pos - (my & 3) - ((8 + s->mspel * 2) << fieldmv)) {
  640. srcY -= s->mspel * (1 + (s->linesize << fieldmv));
  641. /* check emulate edge stride and offset */
  642. s->vdsp.emulated_edge_mc(s->edge_emu_buffer, srcY,
  643. s->linesize, s->linesize,
  644. 9 + s->mspel * 2, (9 + s->mspel * 2) << fieldmv,
  645. src_x - s->mspel, src_y - (s->mspel << fieldmv),
  646. s->h_edge_pos, v_edge_pos);
  647. srcY = s->edge_emu_buffer;
  648. /* if we deal with range reduction we need to scale source blocks */
  649. if (v->rangeredfrm) {
  650. int i, j;
  651. uint8_t *src;
  652. src = srcY;
  653. for (j = 0; j < 9 + s->mspel * 2; j++) {
  654. for (i = 0; i < 9 + s->mspel * 2; i++)
  655. src[i] = ((src[i] - 128) >> 1) + 128;
  656. src += s->linesize << fieldmv;
  657. }
  658. }
  659. /* if we deal with intensity compensation we need to scale source blocks */
  660. if (use_ic) {
  661. int i, j;
  662. uint8_t *src;
  663. src = srcY;
  664. for (j = 0; j < 9 + s->mspel * 2; j++) {
  665. int f = v->field_mode ? v->ref_field_type[dir] : (((j<<fieldmv)+src_y - (s->mspel << fieldmv)) & 1);
  666. for (i = 0; i < 9 + s->mspel * 2; i++)
  667. src[i] = luty[f][src[i]];
  668. src += s->linesize << fieldmv;
  669. }
  670. }
  671. srcY += s->mspel * (1 + (s->linesize << fieldmv));
  672. }
  673. if (s->mspel) {
  674. dxy = ((my & 3) << 2) | (mx & 3);
  675. if (avg)
  676. v->vc1dsp.avg_vc1_mspel_pixels_tab[dxy](s->dest[0] + off, srcY, s->linesize << fieldmv, v->rnd);
  677. else
  678. v->vc1dsp.put_vc1_mspel_pixels_tab[dxy](s->dest[0] + off, srcY, s->linesize << fieldmv, v->rnd);
  679. } else { // hpel mc - always used for luma
  680. dxy = (my & 2) | ((mx & 2) >> 1);
  681. if (!v->rnd)
  682. s->hdsp.put_pixels_tab[1][dxy](s->dest[0] + off, srcY, s->linesize, 8);
  683. else
  684. s->hdsp.put_no_rnd_pixels_tab[1][dxy](s->dest[0] + off, srcY, s->linesize, 8);
  685. }
  686. }
  687. static av_always_inline int get_chroma_mv(int *mvx, int *mvy, int *a, int flag, int *tx, int *ty)
  688. {
  689. int idx, i;
  690. static const int count[16] = { 0, 1, 1, 2, 1, 2, 2, 3, 1, 2, 2, 3, 2, 3, 3, 4};
  691. idx = ((a[3] != flag) << 3)
  692. | ((a[2] != flag) << 2)
  693. | ((a[1] != flag) << 1)
  694. | (a[0] != flag);
  695. if (!idx) {
  696. *tx = median4(mvx[0], mvx[1], mvx[2], mvx[3]);
  697. *ty = median4(mvy[0], mvy[1], mvy[2], mvy[3]);
  698. return 4;
  699. } else if (count[idx] == 1) {
  700. switch (idx) {
  701. case 0x1:
  702. *tx = mid_pred(mvx[1], mvx[2], mvx[3]);
  703. *ty = mid_pred(mvy[1], mvy[2], mvy[3]);
  704. return 3;
  705. case 0x2:
  706. *tx = mid_pred(mvx[0], mvx[2], mvx[3]);
  707. *ty = mid_pred(mvy[0], mvy[2], mvy[3]);
  708. return 3;
  709. case 0x4:
  710. *tx = mid_pred(mvx[0], mvx[1], mvx[3]);
  711. *ty = mid_pred(mvy[0], mvy[1], mvy[3]);
  712. return 3;
  713. case 0x8:
  714. *tx = mid_pred(mvx[0], mvx[1], mvx[2]);
  715. *ty = mid_pred(mvy[0], mvy[1], mvy[2]);
  716. return 3;
  717. }
  718. } else if (count[idx] == 2) {
  719. int t1 = 0, t2 = 0;
  720. for (i = 0; i < 3; i++)
  721. if (!a[i]) {
  722. t1 = i;
  723. break;
  724. }
  725. for (i = t1 + 1; i < 4; i++)
  726. if (!a[i]) {
  727. t2 = i;
  728. break;
  729. }
  730. *tx = (mvx[t1] + mvx[t2]) / 2;
  731. *ty = (mvy[t1] + mvy[t2]) / 2;
  732. return 2;
  733. } else {
  734. return 0;
  735. }
  736. return -1;
  737. }
  738. /** Do motion compensation for 4-MV macroblock - both chroma blocks
  739. */
  740. static void vc1_mc_4mv_chroma(VC1Context *v, int dir)
  741. {
  742. MpegEncContext *s = &v->s;
  743. H264ChromaContext *h264chroma = &v->h264chroma;
  744. uint8_t *srcU, *srcV;
  745. int uvmx, uvmy, uvsrc_x, uvsrc_y;
  746. int k, tx = 0, ty = 0;
  747. int mvx[4], mvy[4], intra[4], mv_f[4];
  748. int valid_count;
  749. int chroma_ref_type = v->cur_field_type;
  750. int v_edge_pos = s->v_edge_pos >> v->field_mode;
  751. uint8_t (*lutuv)[256];
  752. int use_ic;
  753. if (!v->field_mode && !v->s.last_picture.f->data[0])
  754. return;
  755. if (s->flags & CODEC_FLAG_GRAY)
  756. return;
  757. for (k = 0; k < 4; k++) {
  758. mvx[k] = s->mv[dir][k][0];
  759. mvy[k] = s->mv[dir][k][1];
  760. intra[k] = v->mb_type[0][s->block_index[k]];
  761. if (v->field_mode)
  762. mv_f[k] = v->mv_f[dir][s->block_index[k] + v->blocks_off];
  763. }
  764. /* calculate chroma MV vector from four luma MVs */
  765. if (!v->field_mode || (v->field_mode && !v->numref)) {
  766. valid_count = get_chroma_mv(mvx, mvy, intra, 0, &tx, &ty);
  767. chroma_ref_type = v->reffield;
  768. if (!valid_count) {
  769. s->current_picture.motion_val[1][s->block_index[0] + v->blocks_off][0] = 0;
  770. s->current_picture.motion_val[1][s->block_index[0] + v->blocks_off][1] = 0;
  771. v->luma_mv[s->mb_x][0] = v->luma_mv[s->mb_x][1] = 0;
  772. return; //no need to do MC for intra blocks
  773. }
  774. } else {
  775. int dominant = 0;
  776. if (mv_f[0] + mv_f[1] + mv_f[2] + mv_f[3] > 2)
  777. dominant = 1;
  778. valid_count = get_chroma_mv(mvx, mvy, mv_f, dominant, &tx, &ty);
  779. if (dominant)
  780. chroma_ref_type = !v->cur_field_type;
  781. }
  782. if (v->field_mode && chroma_ref_type == 1 && v->cur_field_type == 1 && !v->s.last_picture.f->data[0])
  783. return;
  784. s->current_picture.motion_val[1][s->block_index[0] + v->blocks_off][0] = tx;
  785. s->current_picture.motion_val[1][s->block_index[0] + v->blocks_off][1] = ty;
  786. uvmx = (tx + ((tx & 3) == 3)) >> 1;
  787. uvmy = (ty + ((ty & 3) == 3)) >> 1;
  788. v->luma_mv[s->mb_x][0] = uvmx;
  789. v->luma_mv[s->mb_x][1] = uvmy;
  790. if (v->fastuvmc) {
  791. uvmx = uvmx + ((uvmx < 0) ? (uvmx & 1) : -(uvmx & 1));
  792. uvmy = uvmy + ((uvmy < 0) ? (uvmy & 1) : -(uvmy & 1));
  793. }
  794. // Field conversion bias
  795. if (v->cur_field_type != chroma_ref_type)
  796. uvmy += 2 - 4 * chroma_ref_type;
  797. uvsrc_x = s->mb_x * 8 + (uvmx >> 2);
  798. uvsrc_y = s->mb_y * 8 + (uvmy >> 2);
  799. if (v->profile != PROFILE_ADVANCED) {
  800. uvsrc_x = av_clip(uvsrc_x, -8, s->mb_width * 8);
  801. uvsrc_y = av_clip(uvsrc_y, -8, s->mb_height * 8);
  802. } else {
  803. uvsrc_x = av_clip(uvsrc_x, -8, s->avctx->coded_width >> 1);
  804. uvsrc_y = av_clip(uvsrc_y, -8, s->avctx->coded_height >> 1);
  805. }
  806. if (!dir) {
  807. if (v->field_mode && (v->cur_field_type != chroma_ref_type) && v->second_field) {
  808. srcU = s->current_picture.f->data[1];
  809. srcV = s->current_picture.f->data[2];
  810. lutuv = v->curr_lutuv;
  811. use_ic = v->curr_use_ic;
  812. } else {
  813. srcU = s->last_picture.f->data[1];
  814. srcV = s->last_picture.f->data[2];
  815. lutuv = v->last_lutuv;
  816. use_ic = v->last_use_ic;
  817. }
  818. } else {
  819. srcU = s->next_picture.f->data[1];
  820. srcV = s->next_picture.f->data[2];
  821. lutuv = v->next_lutuv;
  822. use_ic = v->next_use_ic;
  823. }
  824. if (!srcU) {
  825. av_log(v->s.avctx, AV_LOG_ERROR, "Referenced frame missing.\n");
  826. return;
  827. }
  828. srcU += uvsrc_y * s->uvlinesize + uvsrc_x;
  829. srcV += uvsrc_y * s->uvlinesize + uvsrc_x;
  830. if (v->field_mode) {
  831. if (chroma_ref_type) {
  832. srcU += s->current_picture_ptr->f->linesize[1];
  833. srcV += s->current_picture_ptr->f->linesize[2];
  834. }
  835. }
  836. if (v->rangeredfrm || use_ic
  837. || s->h_edge_pos < 18 || v_edge_pos < 18
  838. || (unsigned)uvsrc_x > (s->h_edge_pos >> 1) - 9
  839. || (unsigned)uvsrc_y > (v_edge_pos >> 1) - 9) {
  840. s->vdsp.emulated_edge_mc(s->edge_emu_buffer, srcU,
  841. s->uvlinesize, s->uvlinesize,
  842. 8 + 1, 8 + 1, uvsrc_x, uvsrc_y,
  843. s->h_edge_pos >> 1, v_edge_pos >> 1);
  844. s->vdsp.emulated_edge_mc(s->edge_emu_buffer + 16, srcV,
  845. s->uvlinesize, s->uvlinesize,
  846. 8 + 1, 8 + 1, uvsrc_x, uvsrc_y,
  847. s->h_edge_pos >> 1, v_edge_pos >> 1);
  848. srcU = s->edge_emu_buffer;
  849. srcV = s->edge_emu_buffer + 16;
  850. /* if we deal with range reduction we need to scale source blocks */
  851. if (v->rangeredfrm) {
  852. int i, j;
  853. uint8_t *src, *src2;
  854. src = srcU;
  855. src2 = srcV;
  856. for (j = 0; j < 9; j++) {
  857. for (i = 0; i < 9; i++) {
  858. src[i] = ((src[i] - 128) >> 1) + 128;
  859. src2[i] = ((src2[i] - 128) >> 1) + 128;
  860. }
  861. src += s->uvlinesize;
  862. src2 += s->uvlinesize;
  863. }
  864. }
  865. /* if we deal with intensity compensation we need to scale source blocks */
  866. if (use_ic) {
  867. int i, j;
  868. uint8_t *src, *src2;
  869. src = srcU;
  870. src2 = srcV;
  871. for (j = 0; j < 9; j++) {
  872. int f = v->field_mode ? chroma_ref_type : ((j + uvsrc_y) & 1);
  873. for (i = 0; i < 9; i++) {
  874. src[i] = lutuv[f][src[i]];
  875. src2[i] = lutuv[f][src2[i]];
  876. }
  877. src += s->uvlinesize;
  878. src2 += s->uvlinesize;
  879. }
  880. }
  881. }
  882. /* Chroma MC always uses qpel bilinear */
  883. uvmx = (uvmx & 3) << 1;
  884. uvmy = (uvmy & 3) << 1;
  885. if (!v->rnd) {
  886. h264chroma->put_h264_chroma_pixels_tab[0](s->dest[1], srcU, s->uvlinesize, 8, uvmx, uvmy);
  887. h264chroma->put_h264_chroma_pixels_tab[0](s->dest[2], srcV, s->uvlinesize, 8, uvmx, uvmy);
  888. } else {
  889. v->vc1dsp.put_no_rnd_vc1_chroma_pixels_tab[0](s->dest[1], srcU, s->uvlinesize, 8, uvmx, uvmy);
  890. v->vc1dsp.put_no_rnd_vc1_chroma_pixels_tab[0](s->dest[2], srcV, s->uvlinesize, 8, uvmx, uvmy);
  891. }
  892. }
  893. /** Do motion compensation for 4-MV interlaced frame chroma macroblock (both U and V)
  894. */
  895. static void vc1_mc_4mv_chroma4(VC1Context *v, int dir, int dir2, int avg)
  896. {
  897. MpegEncContext *s = &v->s;
  898. H264ChromaContext *h264chroma = &v->h264chroma;
  899. uint8_t *srcU, *srcV;
  900. int uvsrc_x, uvsrc_y;
  901. int uvmx_field[4], uvmy_field[4];
  902. int i, off, tx, ty;
  903. int fieldmv = v->blk_mv_type[s->block_index[0]];
  904. static const int s_rndtblfield[16] = { 0, 0, 1, 2, 4, 4, 5, 6, 2, 2, 3, 8, 6, 6, 7, 12 };
  905. int v_dist = fieldmv ? 1 : 4; // vertical offset for lower sub-blocks
  906. int v_edge_pos = s->v_edge_pos >> 1;
  907. int use_ic;
  908. uint8_t (*lutuv)[256];
  909. if (s->flags & CODEC_FLAG_GRAY)
  910. return;
  911. for (i = 0; i < 4; i++) {
  912. int d = i < 2 ? dir: dir2;
  913. tx = s->mv[d][i][0];
  914. uvmx_field[i] = (tx + ((tx & 3) == 3)) >> 1;
  915. ty = s->mv[d][i][1];
  916. if (fieldmv)
  917. uvmy_field[i] = (ty >> 4) * 8 + s_rndtblfield[ty & 0xF];
  918. else
  919. uvmy_field[i] = (ty + ((ty & 3) == 3)) >> 1;
  920. }
  921. for (i = 0; i < 4; i++) {
  922. off = (i & 1) * 4 + ((i & 2) ? v_dist * s->uvlinesize : 0);
  923. uvsrc_x = s->mb_x * 8 + (i & 1) * 4 + (uvmx_field[i] >> 2);
  924. uvsrc_y = s->mb_y * 8 + ((i & 2) ? v_dist : 0) + (uvmy_field[i] >> 2);
  925. // FIXME: implement proper pull-back (see vc1cropmv.c, vc1CROPMV_ChromaPullBack())
  926. uvsrc_x = av_clip(uvsrc_x, -8, s->avctx->coded_width >> 1);
  927. uvsrc_y = av_clip(uvsrc_y, -8, s->avctx->coded_height >> 1);
  928. if (i < 2 ? dir : dir2) {
  929. srcU = s->next_picture.f->data[1] + uvsrc_y * s->uvlinesize + uvsrc_x;
  930. srcV = s->next_picture.f->data[2] + uvsrc_y * s->uvlinesize + uvsrc_x;
  931. lutuv = v->next_lutuv;
  932. use_ic = v->next_use_ic;
  933. } else {
  934. srcU = s->last_picture.f->data[1] + uvsrc_y * s->uvlinesize + uvsrc_x;
  935. srcV = s->last_picture.f->data[2] + uvsrc_y * s->uvlinesize + uvsrc_x;
  936. lutuv = v->last_lutuv;
  937. use_ic = v->last_use_ic;
  938. }
  939. uvmx_field[i] = (uvmx_field[i] & 3) << 1;
  940. uvmy_field[i] = (uvmy_field[i] & 3) << 1;
  941. if (fieldmv && !(uvsrc_y & 1))
  942. v_edge_pos--;
  943. if (fieldmv && (uvsrc_y & 1) && uvsrc_y < 2)
  944. uvsrc_y--;
  945. if (use_ic
  946. || s->h_edge_pos < 10 || v_edge_pos < (5 << fieldmv)
  947. || (unsigned)uvsrc_x > (s->h_edge_pos >> 1) - 5
  948. || (unsigned)uvsrc_y > v_edge_pos - (5 << fieldmv)) {
  949. s->vdsp.emulated_edge_mc(s->edge_emu_buffer, srcU,
  950. s->uvlinesize, s->uvlinesize,
  951. 5, (5 << fieldmv), uvsrc_x, uvsrc_y,
  952. s->h_edge_pos >> 1, v_edge_pos);
  953. s->vdsp.emulated_edge_mc(s->edge_emu_buffer + 16, srcV,
  954. s->uvlinesize, s->uvlinesize,
  955. 5, (5 << fieldmv), uvsrc_x, uvsrc_y,
  956. s->h_edge_pos >> 1, v_edge_pos);
  957. srcU = s->edge_emu_buffer;
  958. srcV = s->edge_emu_buffer + 16;
  959. /* if we deal with intensity compensation we need to scale source blocks */
  960. if (use_ic) {
  961. int i, j;
  962. uint8_t *src, *src2;
  963. src = srcU;
  964. src2 = srcV;
  965. for (j = 0; j < 5; j++) {
  966. int f = (uvsrc_y + (j << fieldmv)) & 1;
  967. for (i = 0; i < 5; i++) {
  968. src[i] = lutuv[f][src[i]];
  969. src2[i] = lutuv[f][src2[i]];
  970. }
  971. src += s->uvlinesize << fieldmv;
  972. src2 += s->uvlinesize << fieldmv;
  973. }
  974. }
  975. }
  976. if (avg) {
  977. if (!v->rnd) {
  978. h264chroma->avg_h264_chroma_pixels_tab[1](s->dest[1] + off, srcU, s->uvlinesize << fieldmv, 4, uvmx_field[i], uvmy_field[i]);
  979. h264chroma->avg_h264_chroma_pixels_tab[1](s->dest[2] + off, srcV, s->uvlinesize << fieldmv, 4, uvmx_field[i], uvmy_field[i]);
  980. } else {
  981. v->vc1dsp.avg_no_rnd_vc1_chroma_pixels_tab[1](s->dest[1] + off, srcU, s->uvlinesize << fieldmv, 4, uvmx_field[i], uvmy_field[i]);
  982. v->vc1dsp.avg_no_rnd_vc1_chroma_pixels_tab[1](s->dest[2] + off, srcV, s->uvlinesize << fieldmv, 4, uvmx_field[i], uvmy_field[i]);
  983. }
  984. } else {
  985. if (!v->rnd) {
  986. h264chroma->put_h264_chroma_pixels_tab[1](s->dest[1] + off, srcU, s->uvlinesize << fieldmv, 4, uvmx_field[i], uvmy_field[i]);
  987. h264chroma->put_h264_chroma_pixels_tab[1](s->dest[2] + off, srcV, s->uvlinesize << fieldmv, 4, uvmx_field[i], uvmy_field[i]);
  988. } else {
  989. v->vc1dsp.put_no_rnd_vc1_chroma_pixels_tab[1](s->dest[1] + off, srcU, s->uvlinesize << fieldmv, 4, uvmx_field[i], uvmy_field[i]);
  990. v->vc1dsp.put_no_rnd_vc1_chroma_pixels_tab[1](s->dest[2] + off, srcV, s->uvlinesize << fieldmv, 4, uvmx_field[i], uvmy_field[i]);
  991. }
  992. }
  993. }
  994. }
  995. /***********************************************************************/
  996. /**
  997. * @name VC-1 Block-level functions
  998. * @see 7.1.4, p91 and 8.1.1.7, p(1)04
  999. * @{
  1000. */
  1001. /**
  1002. * @def GET_MQUANT
  1003. * @brief Get macroblock-level quantizer scale
  1004. */
  1005. #define GET_MQUANT() \
  1006. if (v->dquantfrm) { \
  1007. int edges = 0; \
  1008. if (v->dqprofile == DQPROFILE_ALL_MBS) { \
  1009. if (v->dqbilevel) { \
  1010. mquant = (get_bits1(gb)) ? v->altpq : v->pq; \
  1011. } else { \
  1012. mqdiff = get_bits(gb, 3); \
  1013. if (mqdiff != 7) \
  1014. mquant = v->pq + mqdiff; \
  1015. else \
  1016. mquant = get_bits(gb, 5); \
  1017. } \
  1018. } \
  1019. if (v->dqprofile == DQPROFILE_SINGLE_EDGE) \
  1020. edges = 1 << v->dqsbedge; \
  1021. else if (v->dqprofile == DQPROFILE_DOUBLE_EDGES) \
  1022. edges = (3 << v->dqsbedge) % 15; \
  1023. else if (v->dqprofile == DQPROFILE_FOUR_EDGES) \
  1024. edges = 15; \
  1025. if ((edges&1) && !s->mb_x) \
  1026. mquant = v->altpq; \
  1027. if ((edges&2) && s->first_slice_line) \
  1028. mquant = v->altpq; \
  1029. if ((edges&4) && s->mb_x == (s->mb_width - 1)) \
  1030. mquant = v->altpq; \
  1031. if ((edges&8) && s->mb_y == (s->mb_height - 1)) \
  1032. mquant = v->altpq; \
  1033. if (!mquant || mquant > 31) { \
  1034. av_log(v->s.avctx, AV_LOG_ERROR, \
  1035. "Overriding invalid mquant %d\n", mquant); \
  1036. mquant = 1; \
  1037. } \
  1038. }
  1039. /**
  1040. * @def GET_MVDATA(_dmv_x, _dmv_y)
  1041. * @brief Get MV differentials
  1042. * @see MVDATA decoding from 8.3.5.2, p(1)20
  1043. * @param _dmv_x Horizontal differential for decoded MV
  1044. * @param _dmv_y Vertical differential for decoded MV
  1045. */
  1046. #define GET_MVDATA(_dmv_x, _dmv_y) \
  1047. index = 1 + get_vlc2(gb, ff_vc1_mv_diff_vlc[s->mv_table_index].table, \
  1048. VC1_MV_DIFF_VLC_BITS, 2); \
  1049. if (index > 36) { \
  1050. mb_has_coeffs = 1; \
  1051. index -= 37; \
  1052. } else \
  1053. mb_has_coeffs = 0; \
  1054. s->mb_intra = 0; \
  1055. if (!index) { \
  1056. _dmv_x = _dmv_y = 0; \
  1057. } else if (index == 35) { \
  1058. _dmv_x = get_bits(gb, v->k_x - 1 + s->quarter_sample); \
  1059. _dmv_y = get_bits(gb, v->k_y - 1 + s->quarter_sample); \
  1060. } else if (index == 36) { \
  1061. _dmv_x = 0; \
  1062. _dmv_y = 0; \
  1063. s->mb_intra = 1; \
  1064. } else { \
  1065. index1 = index % 6; \
  1066. if (!s->quarter_sample && index1 == 5) val = 1; \
  1067. else val = 0; \
  1068. if (size_table[index1] - val > 0) \
  1069. val = get_bits(gb, size_table[index1] - val); \
  1070. else val = 0; \
  1071. sign = 0 - (val&1); \
  1072. _dmv_x = (sign ^ ((val>>1) + offset_table[index1])) - sign; \
  1073. \
  1074. index1 = index / 6; \
  1075. if (!s->quarter_sample && index1 == 5) val = 1; \
  1076. else val = 0; \
  1077. if (size_table[index1] - val > 0) \
  1078. val = get_bits(gb, size_table[index1] - val); \
  1079. else val = 0; \
  1080. sign = 0 - (val & 1); \
  1081. _dmv_y = (sign ^ ((val >> 1) + offset_table[index1])) - sign; \
  1082. }
  1083. static av_always_inline void get_mvdata_interlaced(VC1Context *v, int *dmv_x,
  1084. int *dmv_y, int *pred_flag)
  1085. {
  1086. int index, index1;
  1087. int extend_x = 0, extend_y = 0;
  1088. GetBitContext *gb = &v->s.gb;
  1089. int bits, esc;
  1090. int val, sign;
  1091. const int* offs_tab;
  1092. if (v->numref) {
  1093. bits = VC1_2REF_MVDATA_VLC_BITS;
  1094. esc = 125;
  1095. } else {
  1096. bits = VC1_1REF_MVDATA_VLC_BITS;
  1097. esc = 71;
  1098. }
  1099. switch (v->dmvrange) {
  1100. case 1:
  1101. extend_x = 1;
  1102. break;
  1103. case 2:
  1104. extend_y = 1;
  1105. break;
  1106. case 3:
  1107. extend_x = extend_y = 1;
  1108. break;
  1109. }
  1110. index = get_vlc2(gb, v->imv_vlc->table, bits, 3);
  1111. if (index == esc) {
  1112. *dmv_x = get_bits(gb, v->k_x);
  1113. *dmv_y = get_bits(gb, v->k_y);
  1114. if (v->numref) {
  1115. if (pred_flag) {
  1116. *pred_flag = *dmv_y & 1;
  1117. *dmv_y = (*dmv_y + *pred_flag) >> 1;
  1118. } else {
  1119. *dmv_y = (*dmv_y + (*dmv_y & 1)) >> 1;
  1120. }
  1121. }
  1122. }
  1123. else {
  1124. if (extend_x)
  1125. offs_tab = offset_table2;
  1126. else
  1127. offs_tab = offset_table1;
  1128. index1 = (index + 1) % 9;
  1129. if (index1 != 0) {
  1130. val = get_bits(gb, index1 + extend_x);
  1131. sign = 0 -(val & 1);
  1132. *dmv_x = (sign ^ ((val >> 1) + offs_tab[index1])) - sign;
  1133. } else
  1134. *dmv_x = 0;
  1135. if (extend_y)
  1136. offs_tab = offset_table2;
  1137. else
  1138. offs_tab = offset_table1;
  1139. index1 = (index + 1) / 9;
  1140. if (index1 > v->numref) {
  1141. val = get_bits(gb, (index1 + (extend_y << v->numref)) >> v->numref);
  1142. sign = 0 - (val & 1);
  1143. *dmv_y = (sign ^ ((val >> 1) + offs_tab[index1 >> v->numref])) - sign;
  1144. } else
  1145. *dmv_y = 0;
  1146. if (v->numref && pred_flag)
  1147. *pred_flag = index1 & 1;
  1148. }
  1149. }
  1150. static av_always_inline int scaleforsame_x(VC1Context *v, int n /* MV */, int dir)
  1151. {
  1152. int scaledvalue, refdist;
  1153. int scalesame1, scalesame2;
  1154. int scalezone1_x, zone1offset_x;
  1155. int table_index = dir ^ v->second_field;
  1156. if (v->s.pict_type != AV_PICTURE_TYPE_B)
  1157. refdist = v->refdist;
  1158. else
  1159. refdist = dir ? v->brfd : v->frfd;
  1160. if (refdist > 3)
  1161. refdist = 3;
  1162. scalesame1 = ff_vc1_field_mvpred_scales[table_index][1][refdist];
  1163. scalesame2 = ff_vc1_field_mvpred_scales[table_index][2][refdist];
  1164. scalezone1_x = ff_vc1_field_mvpred_scales[table_index][3][refdist];
  1165. zone1offset_x = ff_vc1_field_mvpred_scales[table_index][5][refdist];
  1166. if (FFABS(n) > 255)
  1167. scaledvalue = n;
  1168. else {
  1169. if (FFABS(n) < scalezone1_x)
  1170. scaledvalue = (n * scalesame1) >> 8;
  1171. else {
  1172. if (n < 0)
  1173. scaledvalue = ((n * scalesame2) >> 8) - zone1offset_x;
  1174. else
  1175. scaledvalue = ((n * scalesame2) >> 8) + zone1offset_x;
  1176. }
  1177. }
  1178. return av_clip(scaledvalue, -v->range_x, v->range_x - 1);
  1179. }
  1180. static av_always_inline int scaleforsame_y(VC1Context *v, int i, int n /* MV */, int dir)
  1181. {
  1182. int scaledvalue, refdist;
  1183. int scalesame1, scalesame2;
  1184. int scalezone1_y, zone1offset_y;
  1185. int table_index = dir ^ v->second_field;
  1186. if (v->s.pict_type != AV_PICTURE_TYPE_B)
  1187. refdist = v->refdist;
  1188. else
  1189. refdist = dir ? v->brfd : v->frfd;
  1190. if (refdist > 3)
  1191. refdist = 3;
  1192. scalesame1 = ff_vc1_field_mvpred_scales[table_index][1][refdist];
  1193. scalesame2 = ff_vc1_field_mvpred_scales[table_index][2][refdist];
  1194. scalezone1_y = ff_vc1_field_mvpred_scales[table_index][4][refdist];
  1195. zone1offset_y = ff_vc1_field_mvpred_scales[table_index][6][refdist];
  1196. if (FFABS(n) > 63)
  1197. scaledvalue = n;
  1198. else {
  1199. if (FFABS(n) < scalezone1_y)
  1200. scaledvalue = (n * scalesame1) >> 8;
  1201. else {
  1202. if (n < 0)
  1203. scaledvalue = ((n * scalesame2) >> 8) - zone1offset_y;
  1204. else
  1205. scaledvalue = ((n * scalesame2) >> 8) + zone1offset_y;
  1206. }
  1207. }
  1208. if (v->cur_field_type && !v->ref_field_type[dir])
  1209. return av_clip(scaledvalue, -v->range_y / 2 + 1, v->range_y / 2);
  1210. else
  1211. return av_clip(scaledvalue, -v->range_y / 2, v->range_y / 2 - 1);
  1212. }
  1213. static av_always_inline int scaleforopp_x(VC1Context *v, int n /* MV */)
  1214. {
  1215. int scalezone1_x, zone1offset_x;
  1216. int scaleopp1, scaleopp2, brfd;
  1217. int scaledvalue;
  1218. brfd = FFMIN(v->brfd, 3);
  1219. scalezone1_x = ff_vc1_b_field_mvpred_scales[3][brfd];
  1220. zone1offset_x = ff_vc1_b_field_mvpred_scales[5][brfd];
  1221. scaleopp1 = ff_vc1_b_field_mvpred_scales[1][brfd];
  1222. scaleopp2 = ff_vc1_b_field_mvpred_scales[2][brfd];
  1223. if (FFABS(n) > 255)
  1224. scaledvalue = n;
  1225. else {
  1226. if (FFABS(n) < scalezone1_x)
  1227. scaledvalue = (n * scaleopp1) >> 8;
  1228. else {
  1229. if (n < 0)
  1230. scaledvalue = ((n * scaleopp2) >> 8) - zone1offset_x;
  1231. else
  1232. scaledvalue = ((n * scaleopp2) >> 8) + zone1offset_x;
  1233. }
  1234. }
  1235. return av_clip(scaledvalue, -v->range_x, v->range_x - 1);
  1236. }
  1237. static av_always_inline int scaleforopp_y(VC1Context *v, int n /* MV */, int dir)
  1238. {
  1239. int scalezone1_y, zone1offset_y;
  1240. int scaleopp1, scaleopp2, brfd;
  1241. int scaledvalue;
  1242. brfd = FFMIN(v->brfd, 3);
  1243. scalezone1_y = ff_vc1_b_field_mvpred_scales[4][brfd];
  1244. zone1offset_y = ff_vc1_b_field_mvpred_scales[6][brfd];
  1245. scaleopp1 = ff_vc1_b_field_mvpred_scales[1][brfd];
  1246. scaleopp2 = ff_vc1_b_field_mvpred_scales[2][brfd];
  1247. if (FFABS(n) > 63)
  1248. scaledvalue = n;
  1249. else {
  1250. if (FFABS(n) < scalezone1_y)
  1251. scaledvalue = (n * scaleopp1) >> 8;
  1252. else {
  1253. if (n < 0)
  1254. scaledvalue = ((n * scaleopp2) >> 8) - zone1offset_y;
  1255. else
  1256. scaledvalue = ((n * scaleopp2) >> 8) + zone1offset_y;
  1257. }
  1258. }
  1259. if (v->cur_field_type && !v->ref_field_type[dir]) {
  1260. return av_clip(scaledvalue, -v->range_y / 2 + 1, v->range_y / 2);
  1261. } else {
  1262. return av_clip(scaledvalue, -v->range_y / 2, v->range_y / 2 - 1);
  1263. }
  1264. }
  1265. static av_always_inline int scaleforsame(VC1Context *v, int i, int n /* MV */,
  1266. int dim, int dir)
  1267. {
  1268. int brfd, scalesame;
  1269. int hpel = 1 - v->s.quarter_sample;
  1270. n >>= hpel;
  1271. if (v->s.pict_type != AV_PICTURE_TYPE_B || v->second_field || !dir) {
  1272. if (dim)
  1273. n = scaleforsame_y(v, i, n, dir) << hpel;
  1274. else
  1275. n = scaleforsame_x(v, n, dir) << hpel;
  1276. return n;
  1277. }
  1278. brfd = FFMIN(v->brfd, 3);
  1279. scalesame = ff_vc1_b_field_mvpred_scales[0][brfd];
  1280. n = (n * scalesame >> 8) << hpel;
  1281. return n;
  1282. }
  1283. static av_always_inline int scaleforopp(VC1Context *v, int n /* MV */,
  1284. int dim, int dir)
  1285. {
  1286. int refdist, scaleopp;
  1287. int hpel = 1 - v->s.quarter_sample;
  1288. n >>= hpel;
  1289. if (v->s.pict_type == AV_PICTURE_TYPE_B && !v->second_field && dir == 1) {
  1290. if (dim)
  1291. n = scaleforopp_y(v, n, dir) << hpel;
  1292. else
  1293. n = scaleforopp_x(v, n) << hpel;
  1294. return n;
  1295. }
  1296. if (v->s.pict_type != AV_PICTURE_TYPE_B)
  1297. refdist = FFMIN(v->refdist, 3);
  1298. else
  1299. refdist = dir ? v->brfd : v->frfd;
  1300. scaleopp = ff_vc1_field_mvpred_scales[dir ^ v->second_field][0][refdist];
  1301. n = (n * scaleopp >> 8) << hpel;
  1302. return n;
  1303. }
  1304. /** Predict and set motion vector
  1305. */
  1306. static inline void vc1_pred_mv(VC1Context *v, int n, int dmv_x, int dmv_y,
  1307. int mv1, int r_x, int r_y, uint8_t* is_intra,
  1308. int pred_flag, int dir)
  1309. {
  1310. MpegEncContext *s = &v->s;
  1311. int xy, wrap, off = 0;
  1312. int16_t *A, *B, *C;
  1313. int px, py;
  1314. int sum;
  1315. int mixedmv_pic, num_samefield = 0, num_oppfield = 0;
  1316. int opposite, a_f, b_f, c_f;
  1317. int16_t field_predA[2];
  1318. int16_t field_predB[2];
  1319. int16_t field_predC[2];
  1320. int a_valid, b_valid, c_valid;
  1321. int hybridmv_thresh, y_bias = 0;
  1322. if (v->mv_mode == MV_PMODE_MIXED_MV ||
  1323. ((v->mv_mode == MV_PMODE_INTENSITY_COMP) && (v->mv_mode2 == MV_PMODE_MIXED_MV)))
  1324. mixedmv_pic = 1;
  1325. else
  1326. mixedmv_pic = 0;
  1327. /* scale MV difference to be quad-pel */
  1328. dmv_x <<= 1 - s->quarter_sample;
  1329. dmv_y <<= 1 - s->quarter_sample;
  1330. wrap = s->b8_stride;
  1331. xy = s->block_index[n];
  1332. if (s->mb_intra) {
  1333. s->mv[0][n][0] = s->current_picture.motion_val[0][xy + v->blocks_off][0] = 0;
  1334. s->mv[0][n][1] = s->current_picture.motion_val[0][xy + v->blocks_off][1] = 0;
  1335. s->current_picture.motion_val[1][xy + v->blocks_off][0] = 0;
  1336. s->current_picture.motion_val[1][xy + v->blocks_off][1] = 0;
  1337. if (mv1) { /* duplicate motion data for 1-MV block */
  1338. s->current_picture.motion_val[0][xy + 1 + v->blocks_off][0] = 0;
  1339. s->current_picture.motion_val[0][xy + 1 + v->blocks_off][1] = 0;
  1340. s->current_picture.motion_val[0][xy + wrap + v->blocks_off][0] = 0;
  1341. s->current_picture.motion_val[0][xy + wrap + v->blocks_off][1] = 0;
  1342. s->current_picture.motion_val[0][xy + wrap + 1 + v->blocks_off][0] = 0;
  1343. s->current_picture.motion_val[0][xy + wrap + 1 + v->blocks_off][1] = 0;
  1344. v->luma_mv[s->mb_x][0] = v->luma_mv[s->mb_x][1] = 0;
  1345. s->current_picture.motion_val[1][xy + 1 + v->blocks_off][0] = 0;
  1346. s->current_picture.motion_val[1][xy + 1 + v->blocks_off][1] = 0;
  1347. s->current_picture.motion_val[1][xy + wrap][0] = 0;
  1348. s->current_picture.motion_val[1][xy + wrap + v->blocks_off][1] = 0;
  1349. s->current_picture.motion_val[1][xy + wrap + 1 + v->blocks_off][0] = 0;
  1350. s->current_picture.motion_val[1][xy + wrap + 1 + v->blocks_off][1] = 0;
  1351. }
  1352. return;
  1353. }
  1354. C = s->current_picture.motion_val[dir][xy - 1 + v->blocks_off];
  1355. A = s->current_picture.motion_val[dir][xy - wrap + v->blocks_off];
  1356. if (mv1) {
  1357. if (v->field_mode && mixedmv_pic)
  1358. off = (s->mb_x == (s->mb_width - 1)) ? -2 : 2;
  1359. else
  1360. off = (s->mb_x == (s->mb_width - 1)) ? -1 : 2;
  1361. } else {
  1362. //in 4-MV mode different blocks have different B predictor position
  1363. switch (n) {
  1364. case 0:
  1365. off = (s->mb_x > 0) ? -1 : 1;
  1366. break;
  1367. case 1:
  1368. off = (s->mb_x == (s->mb_width - 1)) ? -1 : 1;
  1369. break;
  1370. case 2:
  1371. off = 1;
  1372. break;
  1373. case 3:
  1374. off = -1;
  1375. }
  1376. }
  1377. B = s->current_picture.motion_val[dir][xy - wrap + off + v->blocks_off];
  1378. a_valid = !s->first_slice_line || (n == 2 || n == 3);
  1379. b_valid = a_valid && (s->mb_width > 1);
  1380. c_valid = s->mb_x || (n == 1 || n == 3);
  1381. if (v->field_mode) {
  1382. a_valid = a_valid && !is_intra[xy - wrap];
  1383. b_valid = b_valid && !is_intra[xy - wrap + off];
  1384. c_valid = c_valid && !is_intra[xy - 1];
  1385. }
  1386. if (a_valid) {
  1387. a_f = v->mv_f[dir][xy - wrap + v->blocks_off];
  1388. num_oppfield += a_f;
  1389. num_samefield += 1 - a_f;
  1390. field_predA[0] = A[0];
  1391. field_predA[1] = A[1];
  1392. } else {
  1393. field_predA[0] = field_predA[1] = 0;
  1394. a_f = 0;
  1395. }
  1396. if (b_valid) {
  1397. b_f = v->mv_f[dir][xy - wrap + off + v->blocks_off];
  1398. num_oppfield += b_f;
  1399. num_samefield += 1 - b_f;
  1400. field_predB[0] = B[0];
  1401. field_predB[1] = B[1];
  1402. } else {
  1403. field_predB[0] = field_predB[1] = 0;
  1404. b_f = 0;
  1405. }
  1406. if (c_valid) {
  1407. c_f = v->mv_f[dir][xy - 1 + v->blocks_off];
  1408. num_oppfield += c_f;
  1409. num_samefield += 1 - c_f;
  1410. field_predC[0] = C[0];
  1411. field_predC[1] = C[1];
  1412. } else {
  1413. field_predC[0] = field_predC[1] = 0;
  1414. c_f = 0;
  1415. }
  1416. if (v->field_mode) {
  1417. if (!v->numref)
  1418. // REFFIELD determines if the last field or the second-last field is
  1419. // to be used as reference
  1420. opposite = 1 - v->reffield;
  1421. else {
  1422. if (num_samefield <= num_oppfield)
  1423. opposite = 1 - pred_flag;
  1424. else
  1425. opposite = pred_flag;
  1426. }
  1427. } else
  1428. opposite = 0;
  1429. if (opposite) {
  1430. if (a_valid && !a_f) {
  1431. field_predA[0] = scaleforopp(v, field_predA[0], 0, dir);
  1432. field_predA[1] = scaleforopp(v, field_predA[1], 1, dir);
  1433. }
  1434. if (b_valid && !b_f) {
  1435. field_predB[0] = scaleforopp(v, field_predB[0], 0, dir);
  1436. field_predB[1] = scaleforopp(v, field_predB[1], 1, dir);
  1437. }
  1438. if (c_valid && !c_f) {
  1439. field_predC[0] = scaleforopp(v, field_predC[0], 0, dir);
  1440. field_predC[1] = scaleforopp(v, field_predC[1], 1, dir);
  1441. }
  1442. v->mv_f[dir][xy + v->blocks_off] = 1;
  1443. v->ref_field_type[dir] = !v->cur_field_type;
  1444. } else {
  1445. if (a_valid && a_f) {
  1446. field_predA[0] = scaleforsame(v, n, field_predA[0], 0, dir);
  1447. field_predA[1] = scaleforsame(v, n, field_predA[1], 1, dir);
  1448. }
  1449. if (b_valid && b_f) {
  1450. field_predB[0] = scaleforsame(v, n, field_predB[0], 0, dir);
  1451. field_predB[1] = scaleforsame(v, n, field_predB[1], 1, dir);
  1452. }
  1453. if (c_valid && c_f) {
  1454. field_predC[0] = scaleforsame(v, n, field_predC[0], 0, dir);
  1455. field_predC[1] = scaleforsame(v, n, field_predC[1], 1, dir);
  1456. }
  1457. v->mv_f[dir][xy + v->blocks_off] = 0;
  1458. v->ref_field_type[dir] = v->cur_field_type;
  1459. }
  1460. if (a_valid) {
  1461. px = field_predA[0];
  1462. py = field_predA[1];
  1463. } else if (c_valid) {
  1464. px = field_predC[0];
  1465. py = field_predC[1];
  1466. } else if (b_valid) {
  1467. px = field_predB[0];
  1468. py = field_predB[1];
  1469. } else {
  1470. px = 0;
  1471. py = 0;
  1472. }
  1473. if (num_samefield + num_oppfield > 1) {
  1474. px = mid_pred(field_predA[0], field_predB[0], field_predC[0]);
  1475. py = mid_pred(field_predA[1], field_predB[1], field_predC[1]);
  1476. }
  1477. /* Pullback MV as specified in 8.3.5.3.4 */
  1478. if (!v->field_mode) {
  1479. int qx, qy, X, Y;
  1480. qx = (s->mb_x << 6) + ((n == 1 || n == 3) ? 32 : 0);
  1481. qy = (s->mb_y << 6) + ((n == 2 || n == 3) ? 32 : 0);
  1482. X = (s->mb_width << 6) - 4;
  1483. Y = (s->mb_height << 6) - 4;
  1484. if (mv1) {
  1485. if (qx + px < -60) px = -60 - qx;
  1486. if (qy + py < -60) py = -60 - qy;
  1487. } else {
  1488. if (qx + px < -28) px = -28 - qx;
  1489. if (qy + py < -28) py = -28 - qy;
  1490. }
  1491. if (qx + px > X) px = X - qx;
  1492. if (qy + py > Y) py = Y - qy;
  1493. }
  1494. if (!v->field_mode || s->pict_type != AV_PICTURE_TYPE_B) {
  1495. /* Calculate hybrid prediction as specified in 8.3.5.3.5 (also 10.3.5.4.3.5) */
  1496. hybridmv_thresh = 32;
  1497. if (a_valid && c_valid) {
  1498. if (is_intra[xy - wrap])
  1499. sum = FFABS(px) + FFABS(py);
  1500. else
  1501. sum = FFABS(px - field_predA[0]) + FFABS(py - field_predA[1]);
  1502. if (sum > hybridmv_thresh) {
  1503. if (get_bits1(&s->gb)) { // read HYBRIDPRED bit
  1504. px = field_predA[0];
  1505. py = field_predA[1];
  1506. } else {
  1507. px = field_predC[0];
  1508. py = field_predC[1];
  1509. }
  1510. } else {
  1511. if (is_intra[xy - 1])
  1512. sum = FFABS(px) + FFABS(py);
  1513. else
  1514. sum = FFABS(px - field_predC[0]) + FFABS(py - field_predC[1]);
  1515. if (sum > hybridmv_thresh) {
  1516. if (get_bits1(&s->gb)) {
  1517. px = field_predA[0];
  1518. py = field_predA[1];
  1519. } else {
  1520. px = field_predC[0];
  1521. py = field_predC[1];
  1522. }
  1523. }
  1524. }
  1525. }
  1526. }
  1527. if (v->field_mode && v->numref)
  1528. r_y >>= 1;
  1529. if (v->field_mode && v->cur_field_type && v->ref_field_type[dir] == 0)
  1530. y_bias = 1;
  1531. /* store MV using signed modulus of MV range defined in 4.11 */
  1532. s->mv[dir][n][0] = s->current_picture.motion_val[dir][xy + v->blocks_off][0] = ((px + dmv_x + r_x) & ((r_x << 1) - 1)) - r_x;
  1533. s->mv[dir][n][1] = s->current_picture.motion_val[dir][xy + v->blocks_off][1] = ((py + dmv_y + r_y - y_bias) & ((r_y << 1) - 1)) - r_y + y_bias;
  1534. if (mv1) { /* duplicate motion data for 1-MV block */
  1535. s->current_picture.motion_val[dir][xy + 1 + v->blocks_off][0] = s->current_picture.motion_val[dir][xy + v->blocks_off][0];
  1536. s->current_picture.motion_val[dir][xy + 1 + v->blocks_off][1] = s->current_picture.motion_val[dir][xy + v->blocks_off][1];
  1537. s->current_picture.motion_val[dir][xy + wrap + v->blocks_off][0] = s->current_picture.motion_val[dir][xy + v->blocks_off][0];
  1538. s->current_picture.motion_val[dir][xy + wrap + v->blocks_off][1] = s->current_picture.motion_val[dir][xy + v->blocks_off][1];
  1539. s->current_picture.motion_val[dir][xy + wrap + 1 + v->blocks_off][0] = s->current_picture.motion_val[dir][xy + v->blocks_off][0];
  1540. s->current_picture.motion_val[dir][xy + wrap + 1 + v->blocks_off][1] = s->current_picture.motion_val[dir][xy + v->blocks_off][1];
  1541. v->mv_f[dir][xy + 1 + v->blocks_off] = v->mv_f[dir][xy + v->blocks_off];
  1542. v->mv_f[dir][xy + wrap + v->blocks_off] = v->mv_f[dir][xy + wrap + 1 + v->blocks_off] = v->mv_f[dir][xy + v->blocks_off];
  1543. }
  1544. }
  1545. /** Predict and set motion vector for interlaced frame picture MBs
  1546. */
  1547. static inline void vc1_pred_mv_intfr(VC1Context *v, int n, int dmv_x, int dmv_y,
  1548. int mvn, int r_x, int r_y, uint8_t* is_intra, int dir)
  1549. {
  1550. MpegEncContext *s = &v->s;
  1551. int xy, wrap, off = 0;
  1552. int A[2], B[2], C[2];
  1553. int px, py;
  1554. int a_valid = 0, b_valid = 0, c_valid = 0;
  1555. int field_a, field_b, field_c; // 0: same, 1: opposit
  1556. int total_valid, num_samefield, num_oppfield;
  1557. int pos_c, pos_b, n_adj;
  1558. wrap = s->b8_stride;
  1559. xy = s->block_index[n];
  1560. if (s->mb_intra) {
  1561. s->mv[0][n][0] = s->current_picture.motion_val[0][xy][0] = 0;
  1562. s->mv[0][n][1] = s->current_picture.motion_val[0][xy][1] = 0;
  1563. s->current_picture.motion_val[1][xy][0] = 0;
  1564. s->current_picture.motion_val[1][xy][1] = 0;
  1565. if (mvn == 1) { /* duplicate motion data for 1-MV block */
  1566. s->current_picture.motion_val[0][xy + 1][0] = 0;
  1567. s->current_picture.motion_val[0][xy + 1][1] = 0;
  1568. s->current_picture.motion_val[0][xy + wrap][0] = 0;
  1569. s->current_picture.motion_val[0][xy + wrap][1] = 0;
  1570. s->current_picture.motion_val[0][xy + wrap + 1][0] = 0;
  1571. s->current_picture.motion_val[0][xy + wrap + 1][1] = 0;
  1572. v->luma_mv[s->mb_x][0] = v->luma_mv[s->mb_x][1] = 0;
  1573. s->current_picture.motion_val[1][xy + 1][0] = 0;
  1574. s->current_picture.motion_val[1][xy + 1][1] = 0;
  1575. s->current_picture.motion_val[1][xy + wrap][0] = 0;
  1576. s->current_picture.motion_val[1][xy + wrap][1] = 0;
  1577. s->current_picture.motion_val[1][xy + wrap + 1][0] = 0;
  1578. s->current_picture.motion_val[1][xy + wrap + 1][1] = 0;
  1579. }
  1580. return;
  1581. }
  1582. off = ((n == 0) || (n == 1)) ? 1 : -1;
  1583. /* predict A */
  1584. if (s->mb_x || (n == 1) || (n == 3)) {
  1585. if ((v->blk_mv_type[xy]) // current block (MB) has a field MV
  1586. || (!v->blk_mv_type[xy] && !v->blk_mv_type[xy - 1])) { // or both have frame MV
  1587. A[0] = s->current_picture.motion_val[dir][xy - 1][0];
  1588. A[1] = s->current_picture.motion_val[dir][xy - 1][1];
  1589. a_valid = 1;
  1590. } else { // current block has frame mv and cand. has field MV (so average)
  1591. A[0] = (s->current_picture.motion_val[dir][xy - 1][0]
  1592. + s->current_picture.motion_val[dir][xy - 1 + off * wrap][0] + 1) >> 1;
  1593. A[1] = (s->current_picture.motion_val[dir][xy - 1][1]
  1594. + s->current_picture.motion_val[dir][xy - 1 + off * wrap][1] + 1) >> 1;
  1595. a_valid = 1;
  1596. }
  1597. if (!(n & 1) && v->is_intra[s->mb_x - 1]) {
  1598. a_valid = 0;
  1599. A[0] = A[1] = 0;
  1600. }
  1601. } else
  1602. A[0] = A[1] = 0;
  1603. /* Predict B and C */
  1604. B[0] = B[1] = C[0] = C[1] = 0;
  1605. if (n == 0 || n == 1 || v->blk_mv_type[xy]) {
  1606. if (!s->first_slice_line) {
  1607. if (!v->is_intra[s->mb_x - s->mb_stride]) {
  1608. b_valid = 1;
  1609. n_adj = n | 2;
  1610. pos_b = s->block_index[n_adj] - 2 * wrap;
  1611. if (v->blk_mv_type[pos_b] && v->blk_mv_type[xy]) {
  1612. n_adj = (n & 2) | (n & 1);
  1613. }
  1614. B[0] = s->current_picture.motion_val[dir][s->block_index[n_adj] - 2 * wrap][0];
  1615. B[1] = s->current_picture.motion_val[dir][s->block_index[n_adj] - 2 * wrap][1];
  1616. if (v->blk_mv_type[pos_b] && !v->blk_mv_type[xy]) {
  1617. B[0] = (B[0] + s->current_picture.motion_val[dir][s->block_index[n_adj ^ 2] - 2 * wrap][0] + 1) >> 1;
  1618. B[1] = (B[1] + s->current_picture.motion_val[dir][s->block_index[n_adj ^ 2] - 2 * wrap][1] + 1) >> 1;
  1619. }
  1620. }
  1621. if (s->mb_width > 1) {
  1622. if (!v->is_intra[s->mb_x - s->mb_stride + 1]) {
  1623. c_valid = 1;
  1624. n_adj = 2;
  1625. pos_c = s->block_index[2] - 2 * wrap + 2;
  1626. if (v->blk_mv_type[pos_c] && v->blk_mv_type[xy]) {
  1627. n_adj = n & 2;
  1628. }
  1629. C[0] = s->current_picture.motion_val[dir][s->block_index[n_adj] - 2 * wrap + 2][0];
  1630. C[1] = s->current_picture.motion_val[dir][s->block_index[n_adj] - 2 * wrap + 2][1];
  1631. if (v->blk_mv_type[pos_c] && !v->blk_mv_type[xy]) {
  1632. C[0] = (1 + C[0] + (s->current_picture.motion_val[dir][s->block_index[n_adj ^ 2] - 2 * wrap + 2][0])) >> 1;
  1633. C[1] = (1 + C[1] + (s->current_picture.motion_val[dir][s->block_index[n_adj ^ 2] - 2 * wrap + 2][1])) >> 1;
  1634. }
  1635. if (s->mb_x == s->mb_width - 1) {
  1636. if (!v->is_intra[s->mb_x - s->mb_stride - 1]) {
  1637. c_valid = 1;
  1638. n_adj = 3;
  1639. pos_c = s->block_index[3] - 2 * wrap - 2;
  1640. if (v->blk_mv_type[pos_c] && v->blk_mv_type[xy]) {
  1641. n_adj = n | 1;
  1642. }
  1643. C[0] = s->current_picture.motion_val[dir][s->block_index[n_adj] - 2 * wrap - 2][0];
  1644. C[1] = s->current_picture.motion_val[dir][s->block_index[n_adj] - 2 * wrap - 2][1];
  1645. if (v->blk_mv_type[pos_c] && !v->blk_mv_type[xy]) {
  1646. C[0] = (1 + C[0] + s->current_picture.motion_val[dir][s->block_index[1] - 2 * wrap - 2][0]) >> 1;
  1647. C[1] = (1 + C[1] + s->current_picture.motion_val[dir][s->block_index[1] - 2 * wrap - 2][1]) >> 1;
  1648. }
  1649. } else
  1650. c_valid = 0;
  1651. }
  1652. }
  1653. }
  1654. }
  1655. } else {
  1656. pos_b = s->block_index[1];
  1657. b_valid = 1;
  1658. B[0] = s->current_picture.motion_val[dir][pos_b][0];
  1659. B[1] = s->current_picture.motion_val[dir][pos_b][1];
  1660. pos_c = s->block_index[0];
  1661. c_valid = 1;
  1662. C[0] = s->current_picture.motion_val[dir][pos_c][0];
  1663. C[1] = s->current_picture.motion_val[dir][pos_c][1];
  1664. }
  1665. total_valid = a_valid + b_valid + c_valid;
  1666. // check if predictor A is out of bounds
  1667. if (!s->mb_x && !(n == 1 || n == 3)) {
  1668. A[0] = A[1] = 0;
  1669. }
  1670. // check if predictor B is out of bounds
  1671. if ((s->first_slice_line && v->blk_mv_type[xy]) || (s->first_slice_line && !(n & 2))) {
  1672. B[0] = B[1] = C[0] = C[1] = 0;
  1673. }
  1674. if (!v->blk_mv_type[xy]) {
  1675. if (s->mb_width == 1) {
  1676. px = B[0];
  1677. py = B[1];
  1678. } else {
  1679. if (total_valid >= 2) {
  1680. px = mid_pred(A[0], B[0], C[0]);
  1681. py = mid_pred(A[1], B[1], C[1]);
  1682. } else if (total_valid) {
  1683. if (a_valid) { px = A[0]; py = A[1]; }
  1684. if (b_valid) { px = B[0]; py = B[1]; }
  1685. if (c_valid) { px = C[0]; py = C[1]; }
  1686. } else
  1687. px = py = 0;
  1688. }
  1689. } else {
  1690. if (a_valid)
  1691. field_a = (A[1] & 4) ? 1 : 0;
  1692. else
  1693. field_a = 0;
  1694. if (b_valid)
  1695. field_b = (B[1] & 4) ? 1 : 0;
  1696. else
  1697. field_b = 0;
  1698. if (c_valid)
  1699. field_c = (C[1] & 4) ? 1 : 0;
  1700. else
  1701. field_c = 0;
  1702. num_oppfield = field_a + field_b + field_c;
  1703. num_samefield = total_valid - num_oppfield;
  1704. if (total_valid == 3) {
  1705. if ((num_samefield == 3) || (num_oppfield == 3)) {
  1706. px = mid_pred(A[0], B[0], C[0]);
  1707. py = mid_pred(A[1], B[1], C[1]);
  1708. } else if (num_samefield >= num_oppfield) {
  1709. /* take one MV from same field set depending on priority
  1710. the check for B may not be necessary */
  1711. px = !field_a ? A[0] : B[0];
  1712. py = !field_a ? A[1] : B[1];
  1713. } else {
  1714. px = field_a ? A[0] : B[0];
  1715. py = field_a ? A[1] : B[1];
  1716. }
  1717. } else if (total_valid == 2) {
  1718. if (num_samefield >= num_oppfield) {
  1719. if (!field_a && a_valid) {
  1720. px = A[0];
  1721. py = A[1];
  1722. } else if (!field_b && b_valid) {
  1723. px = B[0];
  1724. py = B[1];
  1725. } else if (c_valid) {
  1726. px = C[0];
  1727. py = C[1];
  1728. } else px = py = 0;
  1729. } else {
  1730. if (field_a && a_valid) {
  1731. px = A[0];
  1732. py = A[1];
  1733. } else if (field_b && b_valid) {
  1734. px = B[0];
  1735. py = B[1];
  1736. } else if (c_valid) {
  1737. px = C[0];
  1738. py = C[1];
  1739. } else
  1740. px = py = 0;
  1741. }
  1742. } else if (total_valid == 1) {
  1743. px = (a_valid) ? A[0] : ((b_valid) ? B[0] : C[0]);
  1744. py = (a_valid) ? A[1] : ((b_valid) ? B[1] : C[1]);
  1745. } else
  1746. px = py = 0;
  1747. }
  1748. /* store MV using signed modulus of MV range defined in 4.11 */
  1749. s->mv[dir][n][0] = s->current_picture.motion_val[dir][xy][0] = ((px + dmv_x + r_x) & ((r_x << 1) - 1)) - r_x;
  1750. s->mv[dir][n][1] = s->current_picture.motion_val[dir][xy][1] = ((py + dmv_y + r_y) & ((r_y << 1) - 1)) - r_y;
  1751. if (mvn == 1) { /* duplicate motion data for 1-MV block */
  1752. s->current_picture.motion_val[dir][xy + 1 ][0] = s->current_picture.motion_val[dir][xy][0];
  1753. s->current_picture.motion_val[dir][xy + 1 ][1] = s->current_picture.motion_val[dir][xy][1];
  1754. s->current_picture.motion_val[dir][xy + wrap ][0] = s->current_picture.motion_val[dir][xy][0];
  1755. s->current_picture.motion_val[dir][xy + wrap ][1] = s->current_picture.motion_val[dir][xy][1];
  1756. s->current_picture.motion_val[dir][xy + wrap + 1][0] = s->current_picture.motion_val[dir][xy][0];
  1757. s->current_picture.motion_val[dir][xy + wrap + 1][1] = s->current_picture.motion_val[dir][xy][1];
  1758. } else if (mvn == 2) { /* duplicate motion data for 2-Field MV block */
  1759. s->current_picture.motion_val[dir][xy + 1][0] = s->current_picture.motion_val[dir][xy][0];
  1760. s->current_picture.motion_val[dir][xy + 1][1] = s->current_picture.motion_val[dir][xy][1];
  1761. s->mv[dir][n + 1][0] = s->mv[dir][n][0];
  1762. s->mv[dir][n + 1][1] = s->mv[dir][n][1];
  1763. }
  1764. }
  1765. /** Motion compensation for direct or interpolated blocks in B-frames
  1766. */
  1767. static void vc1_interp_mc(VC1Context *v)
  1768. {
  1769. MpegEncContext *s = &v->s;
  1770. H264ChromaContext *h264chroma = &v->h264chroma;
  1771. uint8_t *srcY, *srcU, *srcV;
  1772. int dxy, mx, my, uvmx, uvmy, src_x, src_y, uvsrc_x, uvsrc_y;
  1773. int off, off_uv;
  1774. int v_edge_pos = s->v_edge_pos >> v->field_mode;
  1775. int use_ic = v->next_use_ic;
  1776. if (!v->field_mode && !v->s.next_picture.f->data[0])
  1777. return;
  1778. mx = s->mv[1][0][0];
  1779. my = s->mv[1][0][1];
  1780. uvmx = (mx + ((mx & 3) == 3)) >> 1;
  1781. uvmy = (my + ((my & 3) == 3)) >> 1;
  1782. if (v->field_mode) {
  1783. if (v->cur_field_type != v->ref_field_type[1])
  1784. my = my - 2 + 4 * v->cur_field_type;
  1785. uvmy = uvmy - 2 + 4 * v->cur_field_type;
  1786. }
  1787. if (v->fastuvmc) {
  1788. uvmx = uvmx + ((uvmx < 0) ? -(uvmx & 1) : (uvmx & 1));
  1789. uvmy = uvmy + ((uvmy < 0) ? -(uvmy & 1) : (uvmy & 1));
  1790. }
  1791. srcY = s->next_picture.f->data[0];
  1792. srcU = s->next_picture.f->data[1];
  1793. srcV = s->next_picture.f->data[2];
  1794. src_x = s->mb_x * 16 + (mx >> 2);
  1795. src_y = s->mb_y * 16 + (my >> 2);
  1796. uvsrc_x = s->mb_x * 8 + (uvmx >> 2);
  1797. uvsrc_y = s->mb_y * 8 + (uvmy >> 2);
  1798. if (v->profile != PROFILE_ADVANCED) {
  1799. src_x = av_clip( src_x, -16, s->mb_width * 16);
  1800. src_y = av_clip( src_y, -16, s->mb_height * 16);
  1801. uvsrc_x = av_clip(uvsrc_x, -8, s->mb_width * 8);
  1802. uvsrc_y = av_clip(uvsrc_y, -8, s->mb_height * 8);
  1803. } else {
  1804. src_x = av_clip( src_x, -17, s->avctx->coded_width);
  1805. src_y = av_clip( src_y, -18, s->avctx->coded_height + 1);
  1806. uvsrc_x = av_clip(uvsrc_x, -8, s->avctx->coded_width >> 1);
  1807. uvsrc_y = av_clip(uvsrc_y, -8, s->avctx->coded_height >> 1);
  1808. }
  1809. srcY += src_y * s->linesize + src_x;
  1810. srcU += uvsrc_y * s->uvlinesize + uvsrc_x;
  1811. srcV += uvsrc_y * s->uvlinesize + uvsrc_x;
  1812. if (v->field_mode && v->ref_field_type[1]) {
  1813. srcY += s->current_picture_ptr->f->linesize[0];
  1814. srcU += s->current_picture_ptr->f->linesize[1];
  1815. srcV += s->current_picture_ptr->f->linesize[2];
  1816. }
  1817. /* for grayscale we should not try to read from unknown area */
  1818. if (s->flags & CODEC_FLAG_GRAY) {
  1819. srcU = s->edge_emu_buffer + 18 * s->linesize;
  1820. srcV = s->edge_emu_buffer + 18 * s->linesize;
  1821. }
  1822. if (v->rangeredfrm || s->h_edge_pos < 22 || v_edge_pos < 22 || use_ic
  1823. || (unsigned)(src_x - 1) > s->h_edge_pos - (mx & 3) - 16 - 3
  1824. || (unsigned)(src_y - 1) > v_edge_pos - (my & 3) - 16 - 3) {
  1825. uint8_t *uvbuf = s->edge_emu_buffer + 19 * s->linesize;
  1826. srcY -= s->mspel * (1 + s->linesize);
  1827. s->vdsp.emulated_edge_mc(s->edge_emu_buffer, srcY,
  1828. s->linesize, s->linesize,
  1829. 17 + s->mspel * 2, 17 + s->mspel * 2,
  1830. src_x - s->mspel, src_y - s->mspel,
  1831. s->h_edge_pos, v_edge_pos);
  1832. srcY = s->edge_emu_buffer;
  1833. s->vdsp.emulated_edge_mc(uvbuf, srcU,
  1834. s->uvlinesize, s->uvlinesize,
  1835. 8 + 1, 8 + 1,
  1836. uvsrc_x, uvsrc_y, s->h_edge_pos >> 1, v_edge_pos >> 1);
  1837. s->vdsp.emulated_edge_mc(uvbuf + 16, srcV,
  1838. s->uvlinesize, s->uvlinesize,
  1839. 8 + 1, 8 + 1,
  1840. uvsrc_x, uvsrc_y, s->h_edge_pos >> 1, v_edge_pos >> 1);
  1841. srcU = uvbuf;
  1842. srcV = uvbuf + 16;
  1843. /* if we deal with range reduction we need to scale source blocks */
  1844. if (v->rangeredfrm) {
  1845. int i, j;
  1846. uint8_t *src, *src2;
  1847. src = srcY;
  1848. for (j = 0; j < 17 + s->mspel * 2; j++) {
  1849. for (i = 0; i < 17 + s->mspel * 2; i++)
  1850. src[i] = ((src[i] - 128) >> 1) + 128;
  1851. src += s->linesize;
  1852. }
  1853. src = srcU;
  1854. src2 = srcV;
  1855. for (j = 0; j < 9; j++) {
  1856. for (i = 0; i < 9; i++) {
  1857. src[i] = ((src[i] - 128) >> 1) + 128;
  1858. src2[i] = ((src2[i] - 128) >> 1) + 128;
  1859. }
  1860. src += s->uvlinesize;
  1861. src2 += s->uvlinesize;
  1862. }
  1863. }
  1864. if (use_ic) {
  1865. uint8_t (*luty )[256] = v->next_luty;
  1866. uint8_t (*lutuv)[256] = v->next_lutuv;
  1867. int i, j;
  1868. uint8_t *src, *src2;
  1869. src = srcY;
  1870. for (j = 0; j < 17 + s->mspel * 2; j++) {
  1871. int f = v->field_mode ? v->ref_field_type[1] : ((j+src_y - s->mspel) & 1);
  1872. for (i = 0; i < 17 + s->mspel * 2; i++)
  1873. src[i] = luty[f][src[i]];
  1874. src += s->linesize;
  1875. }
  1876. src = srcU;
  1877. src2 = srcV;
  1878. for (j = 0; j < 9; j++) {
  1879. int f = v->field_mode ? v->ref_field_type[1] : ((j+uvsrc_y) & 1);
  1880. for (i = 0; i < 9; i++) {
  1881. src[i] = lutuv[f][src[i]];
  1882. src2[i] = lutuv[f][src2[i]];
  1883. }
  1884. src += s->uvlinesize;
  1885. src2 += s->uvlinesize;
  1886. }
  1887. }
  1888. srcY += s->mspel * (1 + s->linesize);
  1889. }
  1890. off = 0;
  1891. off_uv = 0;
  1892. if (s->mspel) {
  1893. dxy = ((my & 3) << 2) | (mx & 3);
  1894. v->vc1dsp.avg_vc1_mspel_pixels_tab[dxy](s->dest[0] + off , srcY , s->linesize, v->rnd);
  1895. v->vc1dsp.avg_vc1_mspel_pixels_tab[dxy](s->dest[0] + off + 8, srcY + 8, s->linesize, v->rnd);
  1896. srcY += s->linesize * 8;
  1897. v->vc1dsp.avg_vc1_mspel_pixels_tab[dxy](s->dest[0] + off + 8 * s->linesize , srcY , s->linesize, v->rnd);
  1898. v->vc1dsp.avg_vc1_mspel_pixels_tab[dxy](s->dest[0] + off + 8 * s->linesize + 8, srcY + 8, s->linesize, v->rnd);
  1899. } else { // hpel mc
  1900. dxy = (my & 2) | ((mx & 2) >> 1);
  1901. if (!v->rnd)
  1902. s->hdsp.avg_pixels_tab[0][dxy](s->dest[0] + off, srcY, s->linesize, 16);
  1903. else
  1904. s->hdsp.avg_no_rnd_pixels_tab[dxy](s->dest[0] + off, srcY, s->linesize, 16);
  1905. }
  1906. if (s->flags & CODEC_FLAG_GRAY) return;
  1907. /* Chroma MC always uses qpel blilinear */
  1908. uvmx = (uvmx & 3) << 1;
  1909. uvmy = (uvmy & 3) << 1;
  1910. if (!v->rnd) {
  1911. h264chroma->avg_h264_chroma_pixels_tab[0](s->dest[1] + off_uv, srcU, s->uvlinesize, 8, uvmx, uvmy);
  1912. h264chroma->avg_h264_chroma_pixels_tab[0](s->dest[2] + off_uv, srcV, s->uvlinesize, 8, uvmx, uvmy);
  1913. } else {
  1914. v->vc1dsp.avg_no_rnd_vc1_chroma_pixels_tab[0](s->dest[1] + off_uv, srcU, s->uvlinesize, 8, uvmx, uvmy);
  1915. v->vc1dsp.avg_no_rnd_vc1_chroma_pixels_tab[0](s->dest[2] + off_uv, srcV, s->uvlinesize, 8, uvmx, uvmy);
  1916. }
  1917. }
  1918. static av_always_inline int scale_mv(int value, int bfrac, int inv, int qs)
  1919. {
  1920. int n = bfrac;
  1921. #if B_FRACTION_DEN==256
  1922. if (inv)
  1923. n -= 256;
  1924. if (!qs)
  1925. return 2 * ((value * n + 255) >> 9);
  1926. return (value * n + 128) >> 8;
  1927. #else
  1928. if (inv)
  1929. n -= B_FRACTION_DEN;
  1930. if (!qs)
  1931. return 2 * ((value * n + B_FRACTION_DEN - 1) / (2 * B_FRACTION_DEN));
  1932. return (value * n + B_FRACTION_DEN/2) / B_FRACTION_DEN;
  1933. #endif
  1934. }
  1935. /** Reconstruct motion vector for B-frame and do motion compensation
  1936. */
  1937. static inline void vc1_b_mc(VC1Context *v, int dmv_x[2], int dmv_y[2],
  1938. int direct, int mode)
  1939. {
  1940. if (direct) {
  1941. vc1_mc_1mv(v, 0);
  1942. vc1_interp_mc(v);
  1943. return;
  1944. }
  1945. if (mode == BMV_TYPE_INTERPOLATED) {
  1946. vc1_mc_1mv(v, 0);
  1947. vc1_interp_mc(v);
  1948. return;
  1949. }
  1950. vc1_mc_1mv(v, (mode == BMV_TYPE_BACKWARD));
  1951. }
  1952. static inline void vc1_pred_b_mv(VC1Context *v, int dmv_x[2], int dmv_y[2],
  1953. int direct, int mvtype)
  1954. {
  1955. MpegEncContext *s = &v->s;
  1956. int xy, wrap, off = 0;
  1957. int16_t *A, *B, *C;
  1958. int px, py;
  1959. int sum;
  1960. int r_x, r_y;
  1961. const uint8_t *is_intra = v->mb_type[0];
  1962. r_x = v->range_x;
  1963. r_y = v->range_y;
  1964. /* scale MV difference to be quad-pel */
  1965. dmv_x[0] <<= 1 - s->quarter_sample;
  1966. dmv_y[0] <<= 1 - s->quarter_sample;
  1967. dmv_x[1] <<= 1 - s->quarter_sample;
  1968. dmv_y[1] <<= 1 - s->quarter_sample;
  1969. wrap = s->b8_stride;
  1970. xy = s->block_index[0];
  1971. if (s->mb_intra) {
  1972. s->current_picture.motion_val[0][xy + v->blocks_off][0] =
  1973. s->current_picture.motion_val[0][xy + v->blocks_off][1] =
  1974. s->current_picture.motion_val[1][xy + v->blocks_off][0] =
  1975. s->current_picture.motion_val[1][xy + v->blocks_off][1] = 0;
  1976. return;
  1977. }
  1978. if (!v->field_mode) {
  1979. s->mv[0][0][0] = scale_mv(s->next_picture.motion_val[1][xy][0], v->bfraction, 0, s->quarter_sample);
  1980. s->mv[0][0][1] = scale_mv(s->next_picture.motion_val[1][xy][1], v->bfraction, 0, s->quarter_sample);
  1981. s->mv[1][0][0] = scale_mv(s->next_picture.motion_val[1][xy][0], v->bfraction, 1, s->quarter_sample);
  1982. s->mv[1][0][1] = scale_mv(s->next_picture.motion_val[1][xy][1], v->bfraction, 1, s->quarter_sample);
  1983. /* Pullback predicted motion vectors as specified in 8.4.5.4 */
  1984. s->mv[0][0][0] = av_clip(s->mv[0][0][0], -60 - (s->mb_x << 6), (s->mb_width << 6) - 4 - (s->mb_x << 6));
  1985. s->mv[0][0][1] = av_clip(s->mv[0][0][1], -60 - (s->mb_y << 6), (s->mb_height << 6) - 4 - (s->mb_y << 6));
  1986. s->mv[1][0][0] = av_clip(s->mv[1][0][0], -60 - (s->mb_x << 6), (s->mb_width << 6) - 4 - (s->mb_x << 6));
  1987. s->mv[1][0][1] = av_clip(s->mv[1][0][1], -60 - (s->mb_y << 6), (s->mb_height << 6) - 4 - (s->mb_y << 6));
  1988. }
  1989. if (direct) {
  1990. s->current_picture.motion_val[0][xy + v->blocks_off][0] = s->mv[0][0][0];
  1991. s->current_picture.motion_val[0][xy + v->blocks_off][1] = s->mv[0][0][1];
  1992. s->current_picture.motion_val[1][xy + v->blocks_off][0] = s->mv[1][0][0];
  1993. s->current_picture.motion_val[1][xy + v->blocks_off][1] = s->mv[1][0][1];
  1994. return;
  1995. }
  1996. if ((mvtype == BMV_TYPE_FORWARD) || (mvtype == BMV_TYPE_INTERPOLATED)) {
  1997. C = s->current_picture.motion_val[0][xy - 2];
  1998. A = s->current_picture.motion_val[0][xy - wrap * 2];
  1999. off = (s->mb_x == (s->mb_width - 1)) ? -2 : 2;
  2000. B = s->current_picture.motion_val[0][xy - wrap * 2 + off];
  2001. if (!s->mb_x) C[0] = C[1] = 0;
  2002. if (!s->first_slice_line) { // predictor A is not out of bounds
  2003. if (s->mb_width == 1) {
  2004. px = A[0];
  2005. py = A[1];
  2006. } else {
  2007. px = mid_pred(A[0], B[0], C[0]);
  2008. py = mid_pred(A[1], B[1], C[1]);
  2009. }
  2010. } else if (s->mb_x) { // predictor C is not out of bounds
  2011. px = C[0];
  2012. py = C[1];
  2013. } else {
  2014. px = py = 0;
  2015. }
  2016. /* Pullback MV as specified in 8.3.5.3.4 */
  2017. {
  2018. int qx, qy, X, Y;
  2019. if (v->profile < PROFILE_ADVANCED) {
  2020. qx = (s->mb_x << 5);
  2021. qy = (s->mb_y << 5);
  2022. X = (s->mb_width << 5) - 4;
  2023. Y = (s->mb_height << 5) - 4;
  2024. if (qx + px < -28) px = -28 - qx;
  2025. if (qy + py < -28) py = -28 - qy;
  2026. if (qx + px > X) px = X - qx;
  2027. if (qy + py > Y) py = Y - qy;
  2028. } else {
  2029. qx = (s->mb_x << 6);
  2030. qy = (s->mb_y << 6);
  2031. X = (s->mb_width << 6) - 4;
  2032. Y = (s->mb_height << 6) - 4;
  2033. if (qx + px < -60) px = -60 - qx;
  2034. if (qy + py < -60) py = -60 - qy;
  2035. if (qx + px > X) px = X - qx;
  2036. if (qy + py > Y) py = Y - qy;
  2037. }
  2038. }
  2039. /* Calculate hybrid prediction as specified in 8.3.5.3.5 */
  2040. if (0 && !s->first_slice_line && s->mb_x) {
  2041. if (is_intra[xy - wrap])
  2042. sum = FFABS(px) + FFABS(py);
  2043. else
  2044. sum = FFABS(px - A[0]) + FFABS(py - A[1]);
  2045. if (sum > 32) {
  2046. if (get_bits1(&s->gb)) {
  2047. px = A[0];
  2048. py = A[1];
  2049. } else {
  2050. px = C[0];
  2051. py = C[1];
  2052. }
  2053. } else {
  2054. if (is_intra[xy - 2])
  2055. sum = FFABS(px) + FFABS(py);
  2056. else
  2057. sum = FFABS(px - C[0]) + FFABS(py - C[1]);
  2058. if (sum > 32) {
  2059. if (get_bits1(&s->gb)) {
  2060. px = A[0];
  2061. py = A[1];
  2062. } else {
  2063. px = C[0];
  2064. py = C[1];
  2065. }
  2066. }
  2067. }
  2068. }
  2069. /* store MV using signed modulus of MV range defined in 4.11 */
  2070. s->mv[0][0][0] = ((px + dmv_x[0] + r_x) & ((r_x << 1) - 1)) - r_x;
  2071. s->mv[0][0][1] = ((py + dmv_y[0] + r_y) & ((r_y << 1) - 1)) - r_y;
  2072. }
  2073. if ((mvtype == BMV_TYPE_BACKWARD) || (mvtype == BMV_TYPE_INTERPOLATED)) {
  2074. C = s->current_picture.motion_val[1][xy - 2];
  2075. A = s->current_picture.motion_val[1][xy - wrap * 2];
  2076. off = (s->mb_x == (s->mb_width - 1)) ? -2 : 2;
  2077. B = s->current_picture.motion_val[1][xy - wrap * 2 + off];
  2078. if (!s->mb_x)
  2079. C[0] = C[1] = 0;
  2080. if (!s->first_slice_line) { // predictor A is not out of bounds
  2081. if (s->mb_width == 1) {
  2082. px = A[0];
  2083. py = A[1];
  2084. } else {
  2085. px = mid_pred(A[0], B[0], C[0]);
  2086. py = mid_pred(A[1], B[1], C[1]);
  2087. }
  2088. } else if (s->mb_x) { // predictor C is not out of bounds
  2089. px = C[0];
  2090. py = C[1];
  2091. } else {
  2092. px = py = 0;
  2093. }
  2094. /* Pullback MV as specified in 8.3.5.3.4 */
  2095. {
  2096. int qx, qy, X, Y;
  2097. if (v->profile < PROFILE_ADVANCED) {
  2098. qx = (s->mb_x << 5);
  2099. qy = (s->mb_y << 5);
  2100. X = (s->mb_width << 5) - 4;
  2101. Y = (s->mb_height << 5) - 4;
  2102. if (qx + px < -28) px = -28 - qx;
  2103. if (qy + py < -28) py = -28 - qy;
  2104. if (qx + px > X) px = X - qx;
  2105. if (qy + py > Y) py = Y - qy;
  2106. } else {
  2107. qx = (s->mb_x << 6);
  2108. qy = (s->mb_y << 6);
  2109. X = (s->mb_width << 6) - 4;
  2110. Y = (s->mb_height << 6) - 4;
  2111. if (qx + px < -60) px = -60 - qx;
  2112. if (qy + py < -60) py = -60 - qy;
  2113. if (qx + px > X) px = X - qx;
  2114. if (qy + py > Y) py = Y - qy;
  2115. }
  2116. }
  2117. /* Calculate hybrid prediction as specified in 8.3.5.3.5 */
  2118. if (0 && !s->first_slice_line && s->mb_x) {
  2119. if (is_intra[xy - wrap])
  2120. sum = FFABS(px) + FFABS(py);
  2121. else
  2122. sum = FFABS(px - A[0]) + FFABS(py - A[1]);
  2123. if (sum > 32) {
  2124. if (get_bits1(&s->gb)) {
  2125. px = A[0];
  2126. py = A[1];
  2127. } else {
  2128. px = C[0];
  2129. py = C[1];
  2130. }
  2131. } else {
  2132. if (is_intra[xy - 2])
  2133. sum = FFABS(px) + FFABS(py);
  2134. else
  2135. sum = FFABS(px - C[0]) + FFABS(py - C[1]);
  2136. if (sum > 32) {
  2137. if (get_bits1(&s->gb)) {
  2138. px = A[0];
  2139. py = A[1];
  2140. } else {
  2141. px = C[0];
  2142. py = C[1];
  2143. }
  2144. }
  2145. }
  2146. }
  2147. /* store MV using signed modulus of MV range defined in 4.11 */
  2148. s->mv[1][0][0] = ((px + dmv_x[1] + r_x) & ((r_x << 1) - 1)) - r_x;
  2149. s->mv[1][0][1] = ((py + dmv_y[1] + r_y) & ((r_y << 1) - 1)) - r_y;
  2150. }
  2151. s->current_picture.motion_val[0][xy][0] = s->mv[0][0][0];
  2152. s->current_picture.motion_val[0][xy][1] = s->mv[0][0][1];
  2153. s->current_picture.motion_val[1][xy][0] = s->mv[1][0][0];
  2154. s->current_picture.motion_val[1][xy][1] = s->mv[1][0][1];
  2155. }
  2156. static inline void vc1_pred_b_mv_intfi(VC1Context *v, int n, int *dmv_x, int *dmv_y, int mv1, int *pred_flag)
  2157. {
  2158. int dir = (v->bmvtype == BMV_TYPE_BACKWARD) ? 1 : 0;
  2159. MpegEncContext *s = &v->s;
  2160. int mb_pos = s->mb_x + s->mb_y * s->mb_stride;
  2161. if (v->bmvtype == BMV_TYPE_DIRECT) {
  2162. int total_opp, k, f;
  2163. if (s->next_picture.mb_type[mb_pos + v->mb_off] != MB_TYPE_INTRA) {
  2164. s->mv[0][0][0] = scale_mv(s->next_picture.motion_val[1][s->block_index[0] + v->blocks_off][0],
  2165. v->bfraction, 0, s->quarter_sample);
  2166. s->mv[0][0][1] = scale_mv(s->next_picture.motion_val[1][s->block_index[0] + v->blocks_off][1],
  2167. v->bfraction, 0, s->quarter_sample);
  2168. s->mv[1][0][0] = scale_mv(s->next_picture.motion_val[1][s->block_index[0] + v->blocks_off][0],
  2169. v->bfraction, 1, s->quarter_sample);
  2170. s->mv[1][0][1] = scale_mv(s->next_picture.motion_val[1][s->block_index[0] + v->blocks_off][1],
  2171. v->bfraction, 1, s->quarter_sample);
  2172. total_opp = v->mv_f_next[0][s->block_index[0] + v->blocks_off]
  2173. + v->mv_f_next[0][s->block_index[1] + v->blocks_off]
  2174. + v->mv_f_next[0][s->block_index[2] + v->blocks_off]
  2175. + v->mv_f_next[0][s->block_index[3] + v->blocks_off];
  2176. f = (total_opp > 2) ? 1 : 0;
  2177. } else {
  2178. s->mv[0][0][0] = s->mv[0][0][1] = 0;
  2179. s->mv[1][0][0] = s->mv[1][0][1] = 0;
  2180. f = 0;
  2181. }
  2182. v->ref_field_type[0] = v->ref_field_type[1] = v->cur_field_type ^ f;
  2183. for (k = 0; k < 4; k++) {
  2184. s->current_picture.motion_val[0][s->block_index[k] + v->blocks_off][0] = s->mv[0][0][0];
  2185. s->current_picture.motion_val[0][s->block_index[k] + v->blocks_off][1] = s->mv[0][0][1];
  2186. s->current_picture.motion_val[1][s->block_index[k] + v->blocks_off][0] = s->mv[1][0][0];
  2187. s->current_picture.motion_val[1][s->block_index[k] + v->blocks_off][1] = s->mv[1][0][1];
  2188. v->mv_f[0][s->block_index[k] + v->blocks_off] = f;
  2189. v->mv_f[1][s->block_index[k] + v->blocks_off] = f;
  2190. }
  2191. return;
  2192. }
  2193. if (v->bmvtype == BMV_TYPE_INTERPOLATED) {
  2194. vc1_pred_mv(v, 0, dmv_x[0], dmv_y[0], 1, v->range_x, v->range_y, v->mb_type[0], pred_flag[0], 0);
  2195. vc1_pred_mv(v, 0, dmv_x[1], dmv_y[1], 1, v->range_x, v->range_y, v->mb_type[0], pred_flag[1], 1);
  2196. return;
  2197. }
  2198. if (dir) { // backward
  2199. vc1_pred_mv(v, n, dmv_x[1], dmv_y[1], mv1, v->range_x, v->range_y, v->mb_type[0], pred_flag[1], 1);
  2200. if (n == 3 || mv1) {
  2201. vc1_pred_mv(v, 0, dmv_x[0], dmv_y[0], 1, v->range_x, v->range_y, v->mb_type[0], 0, 0);
  2202. }
  2203. } else { // forward
  2204. vc1_pred_mv(v, n, dmv_x[0], dmv_y[0], mv1, v->range_x, v->range_y, v->mb_type[0], pred_flag[0], 0);
  2205. if (n == 3 || mv1) {
  2206. vc1_pred_mv(v, 0, dmv_x[1], dmv_y[1], 1, v->range_x, v->range_y, v->mb_type[0], 0, 1);
  2207. }
  2208. }
  2209. }
  2210. /** Get predicted DC value for I-frames only
  2211. * prediction dir: left=0, top=1
  2212. * @param s MpegEncContext
  2213. * @param overlap flag indicating that overlap filtering is used
  2214. * @param pq integer part of picture quantizer
  2215. * @param[in] n block index in the current MB
  2216. * @param dc_val_ptr Pointer to DC predictor
  2217. * @param dir_ptr Prediction direction for use in AC prediction
  2218. */
  2219. static inline int vc1_i_pred_dc(MpegEncContext *s, int overlap, int pq, int n,
  2220. int16_t **dc_val_ptr, int *dir_ptr)
  2221. {
  2222. int a, b, c, wrap, pred, scale;
  2223. int16_t *dc_val;
  2224. static const uint16_t dcpred[32] = {
  2225. -1, 1024, 512, 341, 256, 205, 171, 146, 128,
  2226. 114, 102, 93, 85, 79, 73, 68, 64,
  2227. 60, 57, 54, 51, 49, 47, 45, 43,
  2228. 41, 39, 38, 37, 35, 34, 33
  2229. };
  2230. /* find prediction - wmv3_dc_scale always used here in fact */
  2231. if (n < 4) scale = s->y_dc_scale;
  2232. else scale = s->c_dc_scale;
  2233. wrap = s->block_wrap[n];
  2234. dc_val = s->dc_val[0] + s->block_index[n];
  2235. /* B A
  2236. * C X
  2237. */
  2238. c = dc_val[ - 1];
  2239. b = dc_val[ - 1 - wrap];
  2240. a = dc_val[ - wrap];
  2241. if (pq < 9 || !overlap) {
  2242. /* Set outer values */
  2243. if (s->first_slice_line && (n != 2 && n != 3))
  2244. b = a = dcpred[scale];
  2245. if (s->mb_x == 0 && (n != 1 && n != 3))
  2246. b = c = dcpred[scale];
  2247. } else {
  2248. /* Set outer values */
  2249. if (s->first_slice_line && (n != 2 && n != 3))
  2250. b = a = 0;
  2251. if (s->mb_x == 0 && (n != 1 && n != 3))
  2252. b = c = 0;
  2253. }
  2254. if (abs(a - b) <= abs(b - c)) {
  2255. pred = c;
  2256. *dir_ptr = 1; // left
  2257. } else {
  2258. pred = a;
  2259. *dir_ptr = 0; // top
  2260. }
  2261. /* update predictor */
  2262. *dc_val_ptr = &dc_val[0];
  2263. return pred;
  2264. }
  2265. /** Get predicted DC value
  2266. * prediction dir: left=0, top=1
  2267. * @param s MpegEncContext
  2268. * @param overlap flag indicating that overlap filtering is used
  2269. * @param pq integer part of picture quantizer
  2270. * @param[in] n block index in the current MB
  2271. * @param a_avail flag indicating top block availability
  2272. * @param c_avail flag indicating left block availability
  2273. * @param dc_val_ptr Pointer to DC predictor
  2274. * @param dir_ptr Prediction direction for use in AC prediction
  2275. */
  2276. static inline int vc1_pred_dc(MpegEncContext *s, int overlap, int pq, int n,
  2277. int a_avail, int c_avail,
  2278. int16_t **dc_val_ptr, int *dir_ptr)
  2279. {
  2280. int a, b, c, wrap, pred;
  2281. int16_t *dc_val;
  2282. int mb_pos = s->mb_x + s->mb_y * s->mb_stride;
  2283. int q1, q2 = 0;
  2284. int dqscale_index;
  2285. wrap = s->block_wrap[n];
  2286. dc_val = s->dc_val[0] + s->block_index[n];
  2287. /* B A
  2288. * C X
  2289. */
  2290. c = dc_val[ - 1];
  2291. b = dc_val[ - 1 - wrap];
  2292. a = dc_val[ - wrap];
  2293. /* scale predictors if needed */
  2294. q1 = s->current_picture.qscale_table[mb_pos];
  2295. dqscale_index = s->y_dc_scale_table[q1] - 1;
  2296. if (dqscale_index < 0)
  2297. return 0;
  2298. if (c_avail && (n != 1 && n != 3)) {
  2299. q2 = s->current_picture.qscale_table[mb_pos - 1];
  2300. if (q2 && q2 != q1)
  2301. c = (c * s->y_dc_scale_table[q2] * ff_vc1_dqscale[dqscale_index] + 0x20000) >> 18;
  2302. }
  2303. if (a_avail && (n != 2 && n != 3)) {
  2304. q2 = s->current_picture.qscale_table[mb_pos - s->mb_stride];
  2305. if (q2 && q2 != q1)
  2306. a = (a * s->y_dc_scale_table[q2] * ff_vc1_dqscale[dqscale_index] + 0x20000) >> 18;
  2307. }
  2308. if (a_avail && c_avail && (n != 3)) {
  2309. int off = mb_pos;
  2310. if (n != 1)
  2311. off--;
  2312. if (n != 2)
  2313. off -= s->mb_stride;
  2314. q2 = s->current_picture.qscale_table[off];
  2315. if (q2 && q2 != q1)
  2316. b = (b * s->y_dc_scale_table[q2] * ff_vc1_dqscale[dqscale_index] + 0x20000) >> 18;
  2317. }
  2318. if (a_avail && c_avail) {
  2319. if (abs(a - b) <= abs(b - c)) {
  2320. pred = c;
  2321. *dir_ptr = 1; // left
  2322. } else {
  2323. pred = a;
  2324. *dir_ptr = 0; // top
  2325. }
  2326. } else if (a_avail) {
  2327. pred = a;
  2328. *dir_ptr = 0; // top
  2329. } else if (c_avail) {
  2330. pred = c;
  2331. *dir_ptr = 1; // left
  2332. } else {
  2333. pred = 0;
  2334. *dir_ptr = 1; // left
  2335. }
  2336. /* update predictor */
  2337. *dc_val_ptr = &dc_val[0];
  2338. return pred;
  2339. }
  2340. /** @} */ // Block group
  2341. /**
  2342. * @name VC1 Macroblock-level functions in Simple/Main Profiles
  2343. * @see 7.1.4, p91 and 8.1.1.7, p(1)04
  2344. * @{
  2345. */
  2346. static inline int vc1_coded_block_pred(MpegEncContext * s, int n,
  2347. uint8_t **coded_block_ptr)
  2348. {
  2349. int xy, wrap, pred, a, b, c;
  2350. xy = s->block_index[n];
  2351. wrap = s->b8_stride;
  2352. /* B C
  2353. * A X
  2354. */
  2355. a = s->coded_block[xy - 1 ];
  2356. b = s->coded_block[xy - 1 - wrap];
  2357. c = s->coded_block[xy - wrap];
  2358. if (b == c) {
  2359. pred = a;
  2360. } else {
  2361. pred = c;
  2362. }
  2363. /* store value */
  2364. *coded_block_ptr = &s->coded_block[xy];
  2365. return pred;
  2366. }
  2367. /**
  2368. * Decode one AC coefficient
  2369. * @param v The VC1 context
  2370. * @param last Last coefficient
  2371. * @param skip How much zero coefficients to skip
  2372. * @param value Decoded AC coefficient value
  2373. * @param codingset set of VLC to decode data
  2374. * @see 8.1.3.4
  2375. */
  2376. static void vc1_decode_ac_coeff(VC1Context *v, int *last, int *skip,
  2377. int *value, int codingset)
  2378. {
  2379. GetBitContext *gb = &v->s.gb;
  2380. int index, escape, run = 0, level = 0, lst = 0;
  2381. index = get_vlc2(gb, ff_vc1_ac_coeff_table[codingset].table, AC_VLC_BITS, 3);
  2382. if (index != ff_vc1_ac_sizes[codingset] - 1) {
  2383. run = vc1_index_decode_table[codingset][index][0];
  2384. level = vc1_index_decode_table[codingset][index][1];
  2385. lst = index >= vc1_last_decode_table[codingset] || get_bits_left(gb) < 0;
  2386. if (get_bits1(gb))
  2387. level = -level;
  2388. } else {
  2389. escape = decode210(gb);
  2390. if (escape != 2) {
  2391. index = get_vlc2(gb, ff_vc1_ac_coeff_table[codingset].table, AC_VLC_BITS, 3);
  2392. run = vc1_index_decode_table[codingset][index][0];
  2393. level = vc1_index_decode_table[codingset][index][1];
  2394. lst = index >= vc1_last_decode_table[codingset];
  2395. if (escape == 0) {
  2396. if (lst)
  2397. level += vc1_last_delta_level_table[codingset][run];
  2398. else
  2399. level += vc1_delta_level_table[codingset][run];
  2400. } else {
  2401. if (lst)
  2402. run += vc1_last_delta_run_table[codingset][level] + 1;
  2403. else
  2404. run += vc1_delta_run_table[codingset][level] + 1;
  2405. }
  2406. if (get_bits1(gb))
  2407. level = -level;
  2408. } else {
  2409. int sign;
  2410. lst = get_bits1(gb);
  2411. if (v->s.esc3_level_length == 0) {
  2412. if (v->pq < 8 || v->dquantfrm) { // table 59
  2413. v->s.esc3_level_length = get_bits(gb, 3);
  2414. if (!v->s.esc3_level_length)
  2415. v->s.esc3_level_length = get_bits(gb, 2) + 8;
  2416. } else { // table 60
  2417. v->s.esc3_level_length = get_unary(gb, 1, 6) + 2;
  2418. }
  2419. v->s.esc3_run_length = 3 + get_bits(gb, 2);
  2420. }
  2421. run = get_bits(gb, v->s.esc3_run_length);
  2422. sign = get_bits1(gb);
  2423. level = get_bits(gb, v->s.esc3_level_length);
  2424. if (sign)
  2425. level = -level;
  2426. }
  2427. }
  2428. *last = lst;
  2429. *skip = run;
  2430. *value = level;
  2431. }
  2432. /** Decode intra block in intra frames - should be faster than decode_intra_block
  2433. * @param v VC1Context
  2434. * @param block block to decode
  2435. * @param[in] n subblock index
  2436. * @param coded are AC coeffs present or not
  2437. * @param codingset set of VLC to decode data
  2438. */
  2439. static int vc1_decode_i_block(VC1Context *v, int16_t block[64], int n,
  2440. int coded, int codingset)
  2441. {
  2442. GetBitContext *gb = &v->s.gb;
  2443. MpegEncContext *s = &v->s;
  2444. int dc_pred_dir = 0; /* Direction of the DC prediction used */
  2445. int i;
  2446. int16_t *dc_val;
  2447. int16_t *ac_val, *ac_val2;
  2448. int dcdiff;
  2449. /* Get DC differential */
  2450. if (n < 4) {
  2451. dcdiff = get_vlc2(&s->gb, ff_msmp4_dc_luma_vlc[s->dc_table_index].table, DC_VLC_BITS, 3);
  2452. } else {
  2453. dcdiff = get_vlc2(&s->gb, ff_msmp4_dc_chroma_vlc[s->dc_table_index].table, DC_VLC_BITS, 3);
  2454. }
  2455. if (dcdiff < 0) {
  2456. av_log(s->avctx, AV_LOG_ERROR, "Illegal DC VLC\n");
  2457. return -1;
  2458. }
  2459. if (dcdiff) {
  2460. if (dcdiff == 119 /* ESC index value */) {
  2461. /* TODO: Optimize */
  2462. if (v->pq == 1) dcdiff = get_bits(gb, 10);
  2463. else if (v->pq == 2) dcdiff = get_bits(gb, 9);
  2464. else dcdiff = get_bits(gb, 8);
  2465. } else {
  2466. if (v->pq == 1)
  2467. dcdiff = (dcdiff << 2) + get_bits(gb, 2) - 3;
  2468. else if (v->pq == 2)
  2469. dcdiff = (dcdiff << 1) + get_bits1(gb) - 1;
  2470. }
  2471. if (get_bits1(gb))
  2472. dcdiff = -dcdiff;
  2473. }
  2474. /* Prediction */
  2475. dcdiff += vc1_i_pred_dc(&v->s, v->overlap, v->pq, n, &dc_val, &dc_pred_dir);
  2476. *dc_val = dcdiff;
  2477. /* Store the quantized DC coeff, used for prediction */
  2478. if (n < 4) {
  2479. block[0] = dcdiff * s->y_dc_scale;
  2480. } else {
  2481. block[0] = dcdiff * s->c_dc_scale;
  2482. }
  2483. /* Skip ? */
  2484. if (!coded) {
  2485. goto not_coded;
  2486. }
  2487. // AC Decoding
  2488. i = 1;
  2489. {
  2490. int last = 0, skip, value;
  2491. const uint8_t *zz_table;
  2492. int scale;
  2493. int k;
  2494. scale = v->pq * 2 + v->halfpq;
  2495. if (v->s.ac_pred) {
  2496. if (!dc_pred_dir)
  2497. zz_table = v->zz_8x8[2];
  2498. else
  2499. zz_table = v->zz_8x8[3];
  2500. } else
  2501. zz_table = v->zz_8x8[1];
  2502. ac_val = s->ac_val[0][0] + s->block_index[n] * 16;
  2503. ac_val2 = ac_val;
  2504. if (dc_pred_dir) // left
  2505. ac_val -= 16;
  2506. else // top
  2507. ac_val -= 16 * s->block_wrap[n];
  2508. while (!last) {
  2509. vc1_decode_ac_coeff(v, &last, &skip, &value, codingset);
  2510. i += skip;
  2511. if (i > 63)
  2512. break;
  2513. block[zz_table[i++]] = value;
  2514. }
  2515. /* apply AC prediction if needed */
  2516. if (s->ac_pred) {
  2517. if (dc_pred_dir) { // left
  2518. for (k = 1; k < 8; k++)
  2519. block[k << v->left_blk_sh] += ac_val[k];
  2520. } else { // top
  2521. for (k = 1; k < 8; k++)
  2522. block[k << v->top_blk_sh] += ac_val[k + 8];
  2523. }
  2524. }
  2525. /* save AC coeffs for further prediction */
  2526. for (k = 1; k < 8; k++) {
  2527. ac_val2[k] = block[k << v->left_blk_sh];
  2528. ac_val2[k + 8] = block[k << v->top_blk_sh];
  2529. }
  2530. /* scale AC coeffs */
  2531. for (k = 1; k < 64; k++)
  2532. if (block[k]) {
  2533. block[k] *= scale;
  2534. if (!v->pquantizer)
  2535. block[k] += (block[k] < 0) ? -v->pq : v->pq;
  2536. }
  2537. if (s->ac_pred) i = 63;
  2538. }
  2539. not_coded:
  2540. if (!coded) {
  2541. int k, scale;
  2542. ac_val = s->ac_val[0][0] + s->block_index[n] * 16;
  2543. ac_val2 = ac_val;
  2544. i = 0;
  2545. scale = v->pq * 2 + v->halfpq;
  2546. memset(ac_val2, 0, 16 * 2);
  2547. if (dc_pred_dir) { // left
  2548. ac_val -= 16;
  2549. if (s->ac_pred)
  2550. memcpy(ac_val2, ac_val, 8 * 2);
  2551. } else { // top
  2552. ac_val -= 16 * s->block_wrap[n];
  2553. if (s->ac_pred)
  2554. memcpy(ac_val2 + 8, ac_val + 8, 8 * 2);
  2555. }
  2556. /* apply AC prediction if needed */
  2557. if (s->ac_pred) {
  2558. if (dc_pred_dir) { //left
  2559. for (k = 1; k < 8; k++) {
  2560. block[k << v->left_blk_sh] = ac_val[k] * scale;
  2561. if (!v->pquantizer && block[k << v->left_blk_sh])
  2562. block[k << v->left_blk_sh] += (block[k << v->left_blk_sh] < 0) ? -v->pq : v->pq;
  2563. }
  2564. } else { // top
  2565. for (k = 1; k < 8; k++) {
  2566. block[k << v->top_blk_sh] = ac_val[k + 8] * scale;
  2567. if (!v->pquantizer && block[k << v->top_blk_sh])
  2568. block[k << v->top_blk_sh] += (block[k << v->top_blk_sh] < 0) ? -v->pq : v->pq;
  2569. }
  2570. }
  2571. i = 63;
  2572. }
  2573. }
  2574. s->block_last_index[n] = i;
  2575. return 0;
  2576. }
  2577. /** Decode intra block in intra frames - should be faster than decode_intra_block
  2578. * @param v VC1Context
  2579. * @param block block to decode
  2580. * @param[in] n subblock number
  2581. * @param coded are AC coeffs present or not
  2582. * @param codingset set of VLC to decode data
  2583. * @param mquant quantizer value for this macroblock
  2584. */
  2585. static int vc1_decode_i_block_adv(VC1Context *v, int16_t block[64], int n,
  2586. int coded, int codingset, int mquant)
  2587. {
  2588. GetBitContext *gb = &v->s.gb;
  2589. MpegEncContext *s = &v->s;
  2590. int dc_pred_dir = 0; /* Direction of the DC prediction used */
  2591. int i;
  2592. int16_t *dc_val;
  2593. int16_t *ac_val, *ac_val2;
  2594. int dcdiff;
  2595. int a_avail = v->a_avail, c_avail = v->c_avail;
  2596. int use_pred = s->ac_pred;
  2597. int scale;
  2598. int q1, q2 = 0;
  2599. int mb_pos = s->mb_x + s->mb_y * s->mb_stride;
  2600. /* Get DC differential */
  2601. if (n < 4) {
  2602. dcdiff = get_vlc2(&s->gb, ff_msmp4_dc_luma_vlc[s->dc_table_index].table, DC_VLC_BITS, 3);
  2603. } else {
  2604. dcdiff = get_vlc2(&s->gb, ff_msmp4_dc_chroma_vlc[s->dc_table_index].table, DC_VLC_BITS, 3);
  2605. }
  2606. if (dcdiff < 0) {
  2607. av_log(s->avctx, AV_LOG_ERROR, "Illegal DC VLC\n");
  2608. return -1;
  2609. }
  2610. if (dcdiff) {
  2611. if (dcdiff == 119 /* ESC index value */) {
  2612. /* TODO: Optimize */
  2613. if (mquant == 1) dcdiff = get_bits(gb, 10);
  2614. else if (mquant == 2) dcdiff = get_bits(gb, 9);
  2615. else dcdiff = get_bits(gb, 8);
  2616. } else {
  2617. if (mquant == 1)
  2618. dcdiff = (dcdiff << 2) + get_bits(gb, 2) - 3;
  2619. else if (mquant == 2)
  2620. dcdiff = (dcdiff << 1) + get_bits1(gb) - 1;
  2621. }
  2622. if (get_bits1(gb))
  2623. dcdiff = -dcdiff;
  2624. }
  2625. /* Prediction */
  2626. dcdiff += vc1_pred_dc(&v->s, v->overlap, mquant, n, v->a_avail, v->c_avail, &dc_val, &dc_pred_dir);
  2627. *dc_val = dcdiff;
  2628. /* Store the quantized DC coeff, used for prediction */
  2629. if (n < 4) {
  2630. block[0] = dcdiff * s->y_dc_scale;
  2631. } else {
  2632. block[0] = dcdiff * s->c_dc_scale;
  2633. }
  2634. //AC Decoding
  2635. i = 1;
  2636. /* check if AC is needed at all */
  2637. if (!a_avail && !c_avail)
  2638. use_pred = 0;
  2639. ac_val = s->ac_val[0][0] + s->block_index[n] * 16;
  2640. ac_val2 = ac_val;
  2641. scale = mquant * 2 + ((mquant == v->pq) ? v->halfpq : 0);
  2642. if (dc_pred_dir) // left
  2643. ac_val -= 16;
  2644. else // top
  2645. ac_val -= 16 * s->block_wrap[n];
  2646. q1 = s->current_picture.qscale_table[mb_pos];
  2647. if ( dc_pred_dir && c_avail && mb_pos)
  2648. q2 = s->current_picture.qscale_table[mb_pos - 1];
  2649. if (!dc_pred_dir && a_avail && mb_pos >= s->mb_stride)
  2650. q2 = s->current_picture.qscale_table[mb_pos - s->mb_stride];
  2651. if ( dc_pred_dir && n == 1)
  2652. q2 = q1;
  2653. if (!dc_pred_dir && n == 2)
  2654. q2 = q1;
  2655. if (n == 3)
  2656. q2 = q1;
  2657. if (coded) {
  2658. int last = 0, skip, value;
  2659. const uint8_t *zz_table;
  2660. int k;
  2661. if (v->s.ac_pred) {
  2662. if (!use_pred && v->fcm == ILACE_FRAME) {
  2663. zz_table = v->zzi_8x8;
  2664. } else {
  2665. if (!dc_pred_dir) // top
  2666. zz_table = v->zz_8x8[2];
  2667. else // left
  2668. zz_table = v->zz_8x8[3];
  2669. }
  2670. } else {
  2671. if (v->fcm != ILACE_FRAME)
  2672. zz_table = v->zz_8x8[1];
  2673. else
  2674. zz_table = v->zzi_8x8;
  2675. }
  2676. while (!last) {
  2677. vc1_decode_ac_coeff(v, &last, &skip, &value, codingset);
  2678. i += skip;
  2679. if (i > 63)
  2680. break;
  2681. block[zz_table[i++]] = value;
  2682. }
  2683. /* apply AC prediction if needed */
  2684. if (use_pred) {
  2685. /* scale predictors if needed*/
  2686. if (q2 && q1 != q2) {
  2687. q1 = q1 * 2 + ((q1 == v->pq) ? v->halfpq : 0) - 1;
  2688. q2 = q2 * 2 + ((q2 == v->pq) ? v->halfpq : 0) - 1;
  2689. if (q1 < 1)
  2690. return AVERROR_INVALIDDATA;
  2691. if (dc_pred_dir) { // left
  2692. for (k = 1; k < 8; k++)
  2693. block[k << v->left_blk_sh] += (ac_val[k] * q2 * ff_vc1_dqscale[q1 - 1] + 0x20000) >> 18;
  2694. } else { // top
  2695. for (k = 1; k < 8; k++)
  2696. block[k << v->top_blk_sh] += (ac_val[k + 8] * q2 * ff_vc1_dqscale[q1 - 1] + 0x20000) >> 18;
  2697. }
  2698. } else {
  2699. if (dc_pred_dir) { //left
  2700. for (k = 1; k < 8; k++)
  2701. block[k << v->left_blk_sh] += ac_val[k];
  2702. } else { //top
  2703. for (k = 1; k < 8; k++)
  2704. block[k << v->top_blk_sh] += ac_val[k + 8];
  2705. }
  2706. }
  2707. }
  2708. /* save AC coeffs for further prediction */
  2709. for (k = 1; k < 8; k++) {
  2710. ac_val2[k ] = block[k << v->left_blk_sh];
  2711. ac_val2[k + 8] = block[k << v->top_blk_sh];
  2712. }
  2713. /* scale AC coeffs */
  2714. for (k = 1; k < 64; k++)
  2715. if (block[k]) {
  2716. block[k] *= scale;
  2717. if (!v->pquantizer)
  2718. block[k] += (block[k] < 0) ? -mquant : mquant;
  2719. }
  2720. if (use_pred) i = 63;
  2721. } else { // no AC coeffs
  2722. int k;
  2723. memset(ac_val2, 0, 16 * 2);
  2724. if (dc_pred_dir) { // left
  2725. if (use_pred) {
  2726. memcpy(ac_val2, ac_val, 8 * 2);
  2727. if (q2 && q1 != q2) {
  2728. q1 = q1 * 2 + ((q1 == v->pq) ? v->halfpq : 0) - 1;
  2729. q2 = q2 * 2 + ((q2 == v->pq) ? v->halfpq : 0) - 1;
  2730. if (q1 < 1)
  2731. return AVERROR_INVALIDDATA;
  2732. for (k = 1; k < 8; k++)
  2733. ac_val2[k] = (ac_val2[k] * q2 * ff_vc1_dqscale[q1 - 1] + 0x20000) >> 18;
  2734. }
  2735. }
  2736. } else { // top
  2737. if (use_pred) {
  2738. memcpy(ac_val2 + 8, ac_val + 8, 8 * 2);
  2739. if (q2 && q1 != q2) {
  2740. q1 = q1 * 2 + ((q1 == v->pq) ? v->halfpq : 0) - 1;
  2741. q2 = q2 * 2 + ((q2 == v->pq) ? v->halfpq : 0) - 1;
  2742. if (q1 < 1)
  2743. return AVERROR_INVALIDDATA;
  2744. for (k = 1; k < 8; k++)
  2745. ac_val2[k + 8] = (ac_val2[k + 8] * q2 * ff_vc1_dqscale[q1 - 1] + 0x20000) >> 18;
  2746. }
  2747. }
  2748. }
  2749. /* apply AC prediction if needed */
  2750. if (use_pred) {
  2751. if (dc_pred_dir) { // left
  2752. for (k = 1; k < 8; k++) {
  2753. block[k << v->left_blk_sh] = ac_val2[k] * scale;
  2754. if (!v->pquantizer && block[k << v->left_blk_sh])
  2755. block[k << v->left_blk_sh] += (block[k << v->left_blk_sh] < 0) ? -mquant : mquant;
  2756. }
  2757. } else { // top
  2758. for (k = 1; k < 8; k++) {
  2759. block[k << v->top_blk_sh] = ac_val2[k + 8] * scale;
  2760. if (!v->pquantizer && block[k << v->top_blk_sh])
  2761. block[k << v->top_blk_sh] += (block[k << v->top_blk_sh] < 0) ? -mquant : mquant;
  2762. }
  2763. }
  2764. i = 63;
  2765. }
  2766. }
  2767. s->block_last_index[n] = i;
  2768. return 0;
  2769. }
  2770. /** Decode intra block in inter frames - more generic version than vc1_decode_i_block
  2771. * @param v VC1Context
  2772. * @param block block to decode
  2773. * @param[in] n subblock index
  2774. * @param coded are AC coeffs present or not
  2775. * @param mquant block quantizer
  2776. * @param codingset set of VLC to decode data
  2777. */
  2778. static int vc1_decode_intra_block(VC1Context *v, int16_t block[64], int n,
  2779. int coded, int mquant, int codingset)
  2780. {
  2781. GetBitContext *gb = &v->s.gb;
  2782. MpegEncContext *s = &v->s;
  2783. int dc_pred_dir = 0; /* Direction of the DC prediction used */
  2784. int i;
  2785. int16_t *dc_val;
  2786. int16_t *ac_val, *ac_val2;
  2787. int dcdiff;
  2788. int mb_pos = s->mb_x + s->mb_y * s->mb_stride;
  2789. int a_avail = v->a_avail, c_avail = v->c_avail;
  2790. int use_pred = s->ac_pred;
  2791. int scale;
  2792. int q1, q2 = 0;
  2793. s->bdsp.clear_block(block);
  2794. /* XXX: Guard against dumb values of mquant */
  2795. mquant = (mquant < 1) ? 0 : ((mquant > 31) ? 31 : mquant);
  2796. /* Set DC scale - y and c use the same */
  2797. s->y_dc_scale = s->y_dc_scale_table[mquant];
  2798. s->c_dc_scale = s->c_dc_scale_table[mquant];
  2799. /* Get DC differential */
  2800. if (n < 4) {
  2801. dcdiff = get_vlc2(&s->gb, ff_msmp4_dc_luma_vlc[s->dc_table_index].table, DC_VLC_BITS, 3);
  2802. } else {
  2803. dcdiff = get_vlc2(&s->gb, ff_msmp4_dc_chroma_vlc[s->dc_table_index].table, DC_VLC_BITS, 3);
  2804. }
  2805. if (dcdiff < 0) {
  2806. av_log(s->avctx, AV_LOG_ERROR, "Illegal DC VLC\n");
  2807. return -1;
  2808. }
  2809. if (dcdiff) {
  2810. if (dcdiff == 119 /* ESC index value */) {
  2811. /* TODO: Optimize */
  2812. if (mquant == 1) dcdiff = get_bits(gb, 10);
  2813. else if (mquant == 2) dcdiff = get_bits(gb, 9);
  2814. else dcdiff = get_bits(gb, 8);
  2815. } else {
  2816. if (mquant == 1)
  2817. dcdiff = (dcdiff << 2) + get_bits(gb, 2) - 3;
  2818. else if (mquant == 2)
  2819. dcdiff = (dcdiff << 1) + get_bits1(gb) - 1;
  2820. }
  2821. if (get_bits1(gb))
  2822. dcdiff = -dcdiff;
  2823. }
  2824. /* Prediction */
  2825. dcdiff += vc1_pred_dc(&v->s, v->overlap, mquant, n, a_avail, c_avail, &dc_val, &dc_pred_dir);
  2826. *dc_val = dcdiff;
  2827. /* Store the quantized DC coeff, used for prediction */
  2828. if (n < 4) {
  2829. block[0] = dcdiff * s->y_dc_scale;
  2830. } else {
  2831. block[0] = dcdiff * s->c_dc_scale;
  2832. }
  2833. //AC Decoding
  2834. i = 1;
  2835. /* check if AC is needed at all and adjust direction if needed */
  2836. if (!a_avail) dc_pred_dir = 1;
  2837. if (!c_avail) dc_pred_dir = 0;
  2838. if (!a_avail && !c_avail) use_pred = 0;
  2839. ac_val = s->ac_val[0][0] + s->block_index[n] * 16;
  2840. ac_val2 = ac_val;
  2841. scale = mquant * 2 + v->halfpq;
  2842. if (dc_pred_dir) //left
  2843. ac_val -= 16;
  2844. else //top
  2845. ac_val -= 16 * s->block_wrap[n];
  2846. q1 = s->current_picture.qscale_table[mb_pos];
  2847. if (dc_pred_dir && c_avail && mb_pos)
  2848. q2 = s->current_picture.qscale_table[mb_pos - 1];
  2849. if (!dc_pred_dir && a_avail && mb_pos >= s->mb_stride)
  2850. q2 = s->current_picture.qscale_table[mb_pos - s->mb_stride];
  2851. if ( dc_pred_dir && n == 1)
  2852. q2 = q1;
  2853. if (!dc_pred_dir && n == 2)
  2854. q2 = q1;
  2855. if (n == 3) q2 = q1;
  2856. if (coded) {
  2857. int last = 0, skip, value;
  2858. int k;
  2859. while (!last) {
  2860. vc1_decode_ac_coeff(v, &last, &skip, &value, codingset);
  2861. i += skip;
  2862. if (i > 63)
  2863. break;
  2864. if (v->fcm == PROGRESSIVE)
  2865. block[v->zz_8x8[0][i++]] = value;
  2866. else {
  2867. if (use_pred && (v->fcm == ILACE_FRAME)) {
  2868. if (!dc_pred_dir) // top
  2869. block[v->zz_8x8[2][i++]] = value;
  2870. else // left
  2871. block[v->zz_8x8[3][i++]] = value;
  2872. } else {
  2873. block[v->zzi_8x8[i++]] = value;
  2874. }
  2875. }
  2876. }
  2877. /* apply AC prediction if needed */
  2878. if (use_pred) {
  2879. /* scale predictors if needed*/
  2880. if (q2 && q1 != q2) {
  2881. q1 = q1 * 2 + ((q1 == v->pq) ? v->halfpq : 0) - 1;
  2882. q2 = q2 * 2 + ((q2 == v->pq) ? v->halfpq : 0) - 1;
  2883. if (q1 < 1)
  2884. return AVERROR_INVALIDDATA;
  2885. if (dc_pred_dir) { // left
  2886. for (k = 1; k < 8; k++)
  2887. block[k << v->left_blk_sh] += (ac_val[k] * q2 * ff_vc1_dqscale[q1 - 1] + 0x20000) >> 18;
  2888. } else { //top
  2889. for (k = 1; k < 8; k++)
  2890. block[k << v->top_blk_sh] += (ac_val[k + 8] * q2 * ff_vc1_dqscale[q1 - 1] + 0x20000) >> 18;
  2891. }
  2892. } else {
  2893. if (dc_pred_dir) { // left
  2894. for (k = 1; k < 8; k++)
  2895. block[k << v->left_blk_sh] += ac_val[k];
  2896. } else { // top
  2897. for (k = 1; k < 8; k++)
  2898. block[k << v->top_blk_sh] += ac_val[k + 8];
  2899. }
  2900. }
  2901. }
  2902. /* save AC coeffs for further prediction */
  2903. for (k = 1; k < 8; k++) {
  2904. ac_val2[k ] = block[k << v->left_blk_sh];
  2905. ac_val2[k + 8] = block[k << v->top_blk_sh];
  2906. }
  2907. /* scale AC coeffs */
  2908. for (k = 1; k < 64; k++)
  2909. if (block[k]) {
  2910. block[k] *= scale;
  2911. if (!v->pquantizer)
  2912. block[k] += (block[k] < 0) ? -mquant : mquant;
  2913. }
  2914. if (use_pred) i = 63;
  2915. } else { // no AC coeffs
  2916. int k;
  2917. memset(ac_val2, 0, 16 * 2);
  2918. if (dc_pred_dir) { // left
  2919. if (use_pred) {
  2920. memcpy(ac_val2, ac_val, 8 * 2);
  2921. if (q2 && q1 != q2) {
  2922. q1 = q1 * 2 + ((q1 == v->pq) ? v->halfpq : 0) - 1;
  2923. q2 = q2 * 2 + ((q2 == v->pq) ? v->halfpq : 0) - 1;
  2924. if (q1 < 1)
  2925. return AVERROR_INVALIDDATA;
  2926. for (k = 1; k < 8; k++)
  2927. ac_val2[k] = (ac_val2[k] * q2 * ff_vc1_dqscale[q1 - 1] + 0x20000) >> 18;
  2928. }
  2929. }
  2930. } else { // top
  2931. if (use_pred) {
  2932. memcpy(ac_val2 + 8, ac_val + 8, 8 * 2);
  2933. if (q2 && q1 != q2) {
  2934. q1 = q1 * 2 + ((q1 == v->pq) ? v->halfpq : 0) - 1;
  2935. q2 = q2 * 2 + ((q2 == v->pq) ? v->halfpq : 0) - 1;
  2936. if (q1 < 1)
  2937. return AVERROR_INVALIDDATA;
  2938. for (k = 1; k < 8; k++)
  2939. ac_val2[k + 8] = (ac_val2[k + 8] * q2 * ff_vc1_dqscale[q1 - 1] + 0x20000) >> 18;
  2940. }
  2941. }
  2942. }
  2943. /* apply AC prediction if needed */
  2944. if (use_pred) {
  2945. if (dc_pred_dir) { // left
  2946. for (k = 1; k < 8; k++) {
  2947. block[k << v->left_blk_sh] = ac_val2[k] * scale;
  2948. if (!v->pquantizer && block[k << v->left_blk_sh])
  2949. block[k << v->left_blk_sh] += (block[k << v->left_blk_sh] < 0) ? -mquant : mquant;
  2950. }
  2951. } else { // top
  2952. for (k = 1; k < 8; k++) {
  2953. block[k << v->top_blk_sh] = ac_val2[k + 8] * scale;
  2954. if (!v->pquantizer && block[k << v->top_blk_sh])
  2955. block[k << v->top_blk_sh] += (block[k << v->top_blk_sh] < 0) ? -mquant : mquant;
  2956. }
  2957. }
  2958. i = 63;
  2959. }
  2960. }
  2961. s->block_last_index[n] = i;
  2962. return 0;
  2963. }
  2964. /** Decode P block
  2965. */
  2966. static int vc1_decode_p_block(VC1Context *v, int16_t block[64], int n,
  2967. int mquant, int ttmb, int first_block,
  2968. uint8_t *dst, int linesize, int skip_block,
  2969. int *ttmb_out)
  2970. {
  2971. MpegEncContext *s = &v->s;
  2972. GetBitContext *gb = &s->gb;
  2973. int i, j;
  2974. int subblkpat = 0;
  2975. int scale, off, idx, last, skip, value;
  2976. int ttblk = ttmb & 7;
  2977. int pat = 0;
  2978. s->bdsp.clear_block(block);
  2979. if (ttmb == -1) {
  2980. ttblk = ff_vc1_ttblk_to_tt[v->tt_index][get_vlc2(gb, ff_vc1_ttblk_vlc[v->tt_index].table, VC1_TTBLK_VLC_BITS, 1)];
  2981. }
  2982. if (ttblk == TT_4X4) {
  2983. subblkpat = ~(get_vlc2(gb, ff_vc1_subblkpat_vlc[v->tt_index].table, VC1_SUBBLKPAT_VLC_BITS, 1) + 1);
  2984. }
  2985. if ((ttblk != TT_8X8 && ttblk != TT_4X4)
  2986. && ((v->ttmbf || (ttmb != -1 && (ttmb & 8) && !first_block))
  2987. || (!v->res_rtm_flag && !first_block))) {
  2988. subblkpat = decode012(gb);
  2989. if (subblkpat)
  2990. subblkpat ^= 3; // swap decoded pattern bits
  2991. if (ttblk == TT_8X4_TOP || ttblk == TT_8X4_BOTTOM)
  2992. ttblk = TT_8X4;
  2993. if (ttblk == TT_4X8_RIGHT || ttblk == TT_4X8_LEFT)
  2994. ttblk = TT_4X8;
  2995. }
  2996. scale = 2 * mquant + ((v->pq == mquant) ? v->halfpq : 0);
  2997. // convert transforms like 8X4_TOP to generic TT and SUBBLKPAT
  2998. if (ttblk == TT_8X4_TOP || ttblk == TT_8X4_BOTTOM) {
  2999. subblkpat = 2 - (ttblk == TT_8X4_TOP);
  3000. ttblk = TT_8X4;
  3001. }
  3002. if (ttblk == TT_4X8_RIGHT || ttblk == TT_4X8_LEFT) {
  3003. subblkpat = 2 - (ttblk == TT_4X8_LEFT);
  3004. ttblk = TT_4X8;
  3005. }
  3006. switch (ttblk) {
  3007. case TT_8X8:
  3008. pat = 0xF;
  3009. i = 0;
  3010. last = 0;
  3011. while (!last) {
  3012. vc1_decode_ac_coeff(v, &last, &skip, &value, v->codingset2);
  3013. i += skip;
  3014. if (i > 63)
  3015. break;
  3016. if (!v->fcm)
  3017. idx = v->zz_8x8[0][i++];
  3018. else
  3019. idx = v->zzi_8x8[i++];
  3020. block[idx] = value * scale;
  3021. if (!v->pquantizer)
  3022. block[idx] += (block[idx] < 0) ? -mquant : mquant;
  3023. }
  3024. if (!skip_block) {
  3025. if (i == 1)
  3026. v->vc1dsp.vc1_inv_trans_8x8_dc(dst, linesize, block);
  3027. else {
  3028. v->vc1dsp.vc1_inv_trans_8x8(block);
  3029. s->idsp.add_pixels_clamped(block, dst, linesize);
  3030. }
  3031. }
  3032. break;
  3033. case TT_4X4:
  3034. pat = ~subblkpat & 0xF;
  3035. for (j = 0; j < 4; j++) {
  3036. last = subblkpat & (1 << (3 - j));
  3037. i = 0;
  3038. off = (j & 1) * 4 + (j & 2) * 16;
  3039. while (!last) {
  3040. vc1_decode_ac_coeff(v, &last, &skip, &value, v->codingset2);
  3041. i += skip;
  3042. if (i > 15)
  3043. break;
  3044. if (!v->fcm)
  3045. idx = ff_vc1_simple_progressive_4x4_zz[i++];
  3046. else
  3047. idx = ff_vc1_adv_interlaced_4x4_zz[i++];
  3048. block[idx + off] = value * scale;
  3049. if (!v->pquantizer)
  3050. block[idx + off] += (block[idx + off] < 0) ? -mquant : mquant;
  3051. }
  3052. if (!(subblkpat & (1 << (3 - j))) && !skip_block) {
  3053. if (i == 1)
  3054. v->vc1dsp.vc1_inv_trans_4x4_dc(dst + (j & 1) * 4 + (j & 2) * 2 * linesize, linesize, block + off);
  3055. else
  3056. v->vc1dsp.vc1_inv_trans_4x4(dst + (j & 1) * 4 + (j & 2) * 2 * linesize, linesize, block + off);
  3057. }
  3058. }
  3059. break;
  3060. case TT_8X4:
  3061. pat = ~((subblkpat & 2) * 6 + (subblkpat & 1) * 3) & 0xF;
  3062. for (j = 0; j < 2; j++) {
  3063. last = subblkpat & (1 << (1 - j));
  3064. i = 0;
  3065. off = j * 32;
  3066. while (!last) {
  3067. vc1_decode_ac_coeff(v, &last, &skip, &value, v->codingset2);
  3068. i += skip;
  3069. if (i > 31)
  3070. break;
  3071. if (!v->fcm)
  3072. idx = v->zz_8x4[i++] + off;
  3073. else
  3074. idx = ff_vc1_adv_interlaced_8x4_zz[i++] + off;
  3075. block[idx] = value * scale;
  3076. if (!v->pquantizer)
  3077. block[idx] += (block[idx] < 0) ? -mquant : mquant;
  3078. }
  3079. if (!(subblkpat & (1 << (1 - j))) && !skip_block) {
  3080. if (i == 1)
  3081. v->vc1dsp.vc1_inv_trans_8x4_dc(dst + j * 4 * linesize, linesize, block + off);
  3082. else
  3083. v->vc1dsp.vc1_inv_trans_8x4(dst + j * 4 * linesize, linesize, block + off);
  3084. }
  3085. }
  3086. break;
  3087. case TT_4X8:
  3088. pat = ~(subblkpat * 5) & 0xF;
  3089. for (j = 0; j < 2; j++) {
  3090. last = subblkpat & (1 << (1 - j));
  3091. i = 0;
  3092. off = j * 4;
  3093. while (!last) {
  3094. vc1_decode_ac_coeff(v, &last, &skip, &value, v->codingset2);
  3095. i += skip;
  3096. if (i > 31)
  3097. break;
  3098. if (!v->fcm)
  3099. idx = v->zz_4x8[i++] + off;
  3100. else
  3101. idx = ff_vc1_adv_interlaced_4x8_zz[i++] + off;
  3102. block[idx] = value * scale;
  3103. if (!v->pquantizer)
  3104. block[idx] += (block[idx] < 0) ? -mquant : mquant;
  3105. }
  3106. if (!(subblkpat & (1 << (1 - j))) && !skip_block) {
  3107. if (i == 1)
  3108. v->vc1dsp.vc1_inv_trans_4x8_dc(dst + j * 4, linesize, block + off);
  3109. else
  3110. v->vc1dsp.vc1_inv_trans_4x8(dst + j*4, linesize, block + off);
  3111. }
  3112. }
  3113. break;
  3114. }
  3115. if (ttmb_out)
  3116. *ttmb_out |= ttblk << (n * 4);
  3117. return pat;
  3118. }
  3119. /** @} */ // Macroblock group
  3120. static const int size_table [6] = { 0, 2, 3, 4, 5, 8 };
  3121. static const int offset_table[6] = { 0, 1, 3, 7, 15, 31 };
  3122. static av_always_inline void vc1_apply_p_v_loop_filter(VC1Context *v, int block_num)
  3123. {
  3124. MpegEncContext *s = &v->s;
  3125. int mb_cbp = v->cbp[s->mb_x - s->mb_stride],
  3126. block_cbp = mb_cbp >> (block_num * 4), bottom_cbp,
  3127. mb_is_intra = v->is_intra[s->mb_x - s->mb_stride],
  3128. block_is_intra = mb_is_intra >> (block_num * 4), bottom_is_intra;
  3129. int idx, linesize = block_num > 3 ? s->uvlinesize : s->linesize, ttblk;
  3130. uint8_t *dst;
  3131. if (block_num > 3) {
  3132. dst = s->dest[block_num - 3];
  3133. } else {
  3134. dst = s->dest[0] + (block_num & 1) * 8 + ((block_num & 2) * 4 - 8) * linesize;
  3135. }
  3136. if (s->mb_y != s->end_mb_y || block_num < 2) {
  3137. int16_t (*mv)[2];
  3138. int mv_stride;
  3139. if (block_num > 3) {
  3140. bottom_cbp = v->cbp[s->mb_x] >> (block_num * 4);
  3141. bottom_is_intra = v->is_intra[s->mb_x] >> (block_num * 4);
  3142. mv = &v->luma_mv[s->mb_x - s->mb_stride];
  3143. mv_stride = s->mb_stride;
  3144. } else {
  3145. bottom_cbp = (block_num < 2) ? (mb_cbp >> ((block_num + 2) * 4))
  3146. : (v->cbp[s->mb_x] >> ((block_num - 2) * 4));
  3147. bottom_is_intra = (block_num < 2) ? (mb_is_intra >> ((block_num + 2) * 4))
  3148. : (v->is_intra[s->mb_x] >> ((block_num - 2) * 4));
  3149. mv_stride = s->b8_stride;
  3150. mv = &s->current_picture.motion_val[0][s->block_index[block_num] - 2 * mv_stride];
  3151. }
  3152. if (bottom_is_intra & 1 || block_is_intra & 1 ||
  3153. mv[0][0] != mv[mv_stride][0] || mv[0][1] != mv[mv_stride][1]) {
  3154. v->vc1dsp.vc1_v_loop_filter8(dst, linesize, v->pq);
  3155. } else {
  3156. idx = ((bottom_cbp >> 2) | block_cbp) & 3;
  3157. if (idx == 3) {
  3158. v->vc1dsp.vc1_v_loop_filter8(dst, linesize, v->pq);
  3159. } else if (idx) {
  3160. if (idx == 1)
  3161. v->vc1dsp.vc1_v_loop_filter4(dst + 4, linesize, v->pq);
  3162. else
  3163. v->vc1dsp.vc1_v_loop_filter4(dst, linesize, v->pq);
  3164. }
  3165. }
  3166. }
  3167. dst -= 4 * linesize;
  3168. ttblk = (v->ttblk[s->mb_x - s->mb_stride] >> (block_num * 4)) & 0xF;
  3169. if (ttblk == TT_4X4 || ttblk == TT_8X4) {
  3170. idx = (block_cbp | (block_cbp >> 2)) & 3;
  3171. if (idx == 3) {
  3172. v->vc1dsp.vc1_v_loop_filter8(dst, linesize, v->pq);
  3173. } else if (idx) {
  3174. if (idx == 1)
  3175. v->vc1dsp.vc1_v_loop_filter4(dst + 4, linesize, v->pq);
  3176. else
  3177. v->vc1dsp.vc1_v_loop_filter4(dst, linesize, v->pq);
  3178. }
  3179. }
  3180. }
  3181. static av_always_inline void vc1_apply_p_h_loop_filter(VC1Context *v, int block_num)
  3182. {
  3183. MpegEncContext *s = &v->s;
  3184. int mb_cbp = v->cbp[s->mb_x - 1 - s->mb_stride],
  3185. block_cbp = mb_cbp >> (block_num * 4), right_cbp,
  3186. mb_is_intra = v->is_intra[s->mb_x - 1 - s->mb_stride],
  3187. block_is_intra = mb_is_intra >> (block_num * 4), right_is_intra;
  3188. int idx, linesize = block_num > 3 ? s->uvlinesize : s->linesize, ttblk;
  3189. uint8_t *dst;
  3190. if (block_num > 3) {
  3191. dst = s->dest[block_num - 3] - 8 * linesize;
  3192. } else {
  3193. dst = s->dest[0] + (block_num & 1) * 8 + ((block_num & 2) * 4 - 16) * linesize - 8;
  3194. }
  3195. if (s->mb_x != s->mb_width || !(block_num & 5)) {
  3196. int16_t (*mv)[2];
  3197. if (block_num > 3) {
  3198. right_cbp = v->cbp[s->mb_x - s->mb_stride] >> (block_num * 4);
  3199. right_is_intra = v->is_intra[s->mb_x - s->mb_stride] >> (block_num * 4);
  3200. mv = &v->luma_mv[s->mb_x - s->mb_stride - 1];
  3201. } else {
  3202. right_cbp = (block_num & 1) ? (v->cbp[s->mb_x - s->mb_stride] >> ((block_num - 1) * 4))
  3203. : (mb_cbp >> ((block_num + 1) * 4));
  3204. right_is_intra = (block_num & 1) ? (v->is_intra[s->mb_x - s->mb_stride] >> ((block_num - 1) * 4))
  3205. : (mb_is_intra >> ((block_num + 1) * 4));
  3206. mv = &s->current_picture.motion_val[0][s->block_index[block_num] - s->b8_stride * 2 - 2];
  3207. }
  3208. if (block_is_intra & 1 || right_is_intra & 1 || mv[0][0] != mv[1][0] || mv[0][1] != mv[1][1]) {
  3209. v->vc1dsp.vc1_h_loop_filter8(dst, linesize, v->pq);
  3210. } else {
  3211. idx = ((right_cbp >> 1) | block_cbp) & 5; // FIXME check
  3212. if (idx == 5) {
  3213. v->vc1dsp.vc1_h_loop_filter8(dst, linesize, v->pq);
  3214. } else if (idx) {
  3215. if (idx == 1)
  3216. v->vc1dsp.vc1_h_loop_filter4(dst + 4 * linesize, linesize, v->pq);
  3217. else
  3218. v->vc1dsp.vc1_h_loop_filter4(dst, linesize, v->pq);
  3219. }
  3220. }
  3221. }
  3222. dst -= 4;
  3223. ttblk = (v->ttblk[s->mb_x - s->mb_stride - 1] >> (block_num * 4)) & 0xf;
  3224. if (ttblk == TT_4X4 || ttblk == TT_4X8) {
  3225. idx = (block_cbp | (block_cbp >> 1)) & 5;
  3226. if (idx == 5) {
  3227. v->vc1dsp.vc1_h_loop_filter8(dst, linesize, v->pq);
  3228. } else if (idx) {
  3229. if (idx == 1)
  3230. v->vc1dsp.vc1_h_loop_filter4(dst + linesize * 4, linesize, v->pq);
  3231. else
  3232. v->vc1dsp.vc1_h_loop_filter4(dst, linesize, v->pq);
  3233. }
  3234. }
  3235. }
  3236. static void vc1_apply_p_loop_filter(VC1Context *v)
  3237. {
  3238. MpegEncContext *s = &v->s;
  3239. int i;
  3240. for (i = 0; i < 6; i++) {
  3241. vc1_apply_p_v_loop_filter(v, i);
  3242. }
  3243. /* V always precedes H, therefore we run H one MB before V;
  3244. * at the end of a row, we catch up to complete the row */
  3245. if (s->mb_x) {
  3246. for (i = 0; i < 6; i++) {
  3247. vc1_apply_p_h_loop_filter(v, i);
  3248. }
  3249. if (s->mb_x == s->mb_width - 1) {
  3250. s->mb_x++;
  3251. ff_update_block_index(s);
  3252. for (i = 0; i < 6; i++) {
  3253. vc1_apply_p_h_loop_filter(v, i);
  3254. }
  3255. }
  3256. }
  3257. }
  3258. /** Decode one P-frame MB
  3259. */
  3260. static int vc1_decode_p_mb(VC1Context *v)
  3261. {
  3262. MpegEncContext *s = &v->s;
  3263. GetBitContext *gb = &s->gb;
  3264. int i, j;
  3265. int mb_pos = s->mb_x + s->mb_y * s->mb_stride;
  3266. int cbp; /* cbp decoding stuff */
  3267. int mqdiff, mquant; /* MB quantization */
  3268. int ttmb = v->ttfrm; /* MB Transform type */
  3269. int mb_has_coeffs = 1; /* last_flag */
  3270. int dmv_x, dmv_y; /* Differential MV components */
  3271. int index, index1; /* LUT indexes */
  3272. int val, sign; /* temp values */
  3273. int first_block = 1;
  3274. int dst_idx, off;
  3275. int skipped, fourmv;
  3276. int block_cbp = 0, pat, block_tt = 0, block_intra = 0;
  3277. mquant = v->pq; /* lossy initialization */
  3278. if (v->mv_type_is_raw)
  3279. fourmv = get_bits1(gb);
  3280. else
  3281. fourmv = v->mv_type_mb_plane[mb_pos];
  3282. if (v->skip_is_raw)
  3283. skipped = get_bits1(gb);
  3284. else
  3285. skipped = v->s.mbskip_table[mb_pos];
  3286. if (!fourmv) { /* 1MV mode */
  3287. if (!skipped) {
  3288. GET_MVDATA(dmv_x, dmv_y);
  3289. if (s->mb_intra) {
  3290. s->current_picture.motion_val[1][s->block_index[0]][0] = 0;
  3291. s->current_picture.motion_val[1][s->block_index[0]][1] = 0;
  3292. }
  3293. s->current_picture.mb_type[mb_pos] = s->mb_intra ? MB_TYPE_INTRA : MB_TYPE_16x16;
  3294. vc1_pred_mv(v, 0, dmv_x, dmv_y, 1, v->range_x, v->range_y, v->mb_type[0], 0, 0);
  3295. /* FIXME Set DC val for inter block ? */
  3296. if (s->mb_intra && !mb_has_coeffs) {
  3297. GET_MQUANT();
  3298. s->ac_pred = get_bits1(gb);
  3299. cbp = 0;
  3300. } else if (mb_has_coeffs) {
  3301. if (s->mb_intra)
  3302. s->ac_pred = get_bits1(gb);
  3303. cbp = get_vlc2(&v->s.gb, v->cbpcy_vlc->table, VC1_CBPCY_P_VLC_BITS, 2);
  3304. GET_MQUANT();
  3305. } else {
  3306. mquant = v->pq;
  3307. cbp = 0;
  3308. }
  3309. s->current_picture.qscale_table[mb_pos] = mquant;
  3310. if (!v->ttmbf && !s->mb_intra && mb_has_coeffs)
  3311. ttmb = get_vlc2(gb, ff_vc1_ttmb_vlc[v->tt_index].table,
  3312. VC1_TTMB_VLC_BITS, 2);
  3313. if (!s->mb_intra) vc1_mc_1mv(v, 0);
  3314. dst_idx = 0;
  3315. for (i = 0; i < 6; i++) {
  3316. s->dc_val[0][s->block_index[i]] = 0;
  3317. dst_idx += i >> 2;
  3318. val = ((cbp >> (5 - i)) & 1);
  3319. off = (i & 4) ? 0 : ((i & 1) * 8 + (i & 2) * 4 * s->linesize);
  3320. v->mb_type[0][s->block_index[i]] = s->mb_intra;
  3321. if (s->mb_intra) {
  3322. /* check if prediction blocks A and C are available */
  3323. v->a_avail = v->c_avail = 0;
  3324. if (i == 2 || i == 3 || !s->first_slice_line)
  3325. v->a_avail = v->mb_type[0][s->block_index[i] - s->block_wrap[i]];
  3326. if (i == 1 || i == 3 || s->mb_x)
  3327. v->c_avail = v->mb_type[0][s->block_index[i] - 1];
  3328. vc1_decode_intra_block(v, s->block[i], i, val, mquant,
  3329. (i & 4) ? v->codingset2 : v->codingset);
  3330. if ((i>3) && (s->flags & CODEC_FLAG_GRAY))
  3331. continue;
  3332. v->vc1dsp.vc1_inv_trans_8x8(s->block[i]);
  3333. if (v->rangeredfrm)
  3334. for (j = 0; j < 64; j++)
  3335. s->block[i][j] <<= 1;
  3336. s->idsp.put_signed_pixels_clamped(s->block[i],
  3337. s->dest[dst_idx] + off,
  3338. i & 4 ? s->uvlinesize
  3339. : s->linesize);
  3340. if (v->pq >= 9 && v->overlap) {
  3341. if (v->c_avail)
  3342. v->vc1dsp.vc1_h_overlap(s->dest[dst_idx] + off, i & 4 ? s->uvlinesize : s->linesize);
  3343. if (v->a_avail)
  3344. v->vc1dsp.vc1_v_overlap(s->dest[dst_idx] + off, i & 4 ? s->uvlinesize : s->linesize);
  3345. }
  3346. block_cbp |= 0xF << (i << 2);
  3347. block_intra |= 1 << i;
  3348. } else if (val) {
  3349. pat = vc1_decode_p_block(v, s->block[i], i, mquant, ttmb, first_block,
  3350. s->dest[dst_idx] + off, (i & 4) ? s->uvlinesize : s->linesize,
  3351. (i & 4) && (s->flags & CODEC_FLAG_GRAY), &block_tt);
  3352. block_cbp |= pat << (i << 2);
  3353. if (!v->ttmbf && ttmb < 8)
  3354. ttmb = -1;
  3355. first_block = 0;
  3356. }
  3357. }
  3358. } else { // skipped
  3359. s->mb_intra = 0;
  3360. for (i = 0; i < 6; i++) {
  3361. v->mb_type[0][s->block_index[i]] = 0;
  3362. s->dc_val[0][s->block_index[i]] = 0;
  3363. }
  3364. s->current_picture.mb_type[mb_pos] = MB_TYPE_SKIP;
  3365. s->current_picture.qscale_table[mb_pos] = 0;
  3366. vc1_pred_mv(v, 0, 0, 0, 1, v->range_x, v->range_y, v->mb_type[0], 0, 0);
  3367. vc1_mc_1mv(v, 0);
  3368. }
  3369. } else { // 4MV mode
  3370. if (!skipped /* unskipped MB */) {
  3371. int intra_count = 0, coded_inter = 0;
  3372. int is_intra[6], is_coded[6];
  3373. /* Get CBPCY */
  3374. cbp = get_vlc2(&v->s.gb, v->cbpcy_vlc->table, VC1_CBPCY_P_VLC_BITS, 2);
  3375. for (i = 0; i < 6; i++) {
  3376. val = ((cbp >> (5 - i)) & 1);
  3377. s->dc_val[0][s->block_index[i]] = 0;
  3378. s->mb_intra = 0;
  3379. if (i < 4) {
  3380. dmv_x = dmv_y = 0;
  3381. s->mb_intra = 0;
  3382. mb_has_coeffs = 0;
  3383. if (val) {
  3384. GET_MVDATA(dmv_x, dmv_y);
  3385. }
  3386. vc1_pred_mv(v, i, dmv_x, dmv_y, 0, v->range_x, v->range_y, v->mb_type[0], 0, 0);
  3387. if (!s->mb_intra)
  3388. vc1_mc_4mv_luma(v, i, 0, 0);
  3389. intra_count += s->mb_intra;
  3390. is_intra[i] = s->mb_intra;
  3391. is_coded[i] = mb_has_coeffs;
  3392. }
  3393. if (i & 4) {
  3394. is_intra[i] = (intra_count >= 3);
  3395. is_coded[i] = val;
  3396. }
  3397. if (i == 4)
  3398. vc1_mc_4mv_chroma(v, 0);
  3399. v->mb_type[0][s->block_index[i]] = is_intra[i];
  3400. if (!coded_inter)
  3401. coded_inter = !is_intra[i] & is_coded[i];
  3402. }
  3403. // if there are no coded blocks then don't do anything more
  3404. dst_idx = 0;
  3405. if (!intra_count && !coded_inter)
  3406. goto end;
  3407. GET_MQUANT();
  3408. s->current_picture.qscale_table[mb_pos] = mquant;
  3409. /* test if block is intra and has pred */
  3410. {
  3411. int intrapred = 0;
  3412. for (i = 0; i < 6; i++)
  3413. if (is_intra[i]) {
  3414. if (((!s->first_slice_line || (i == 2 || i == 3)) && v->mb_type[0][s->block_index[i] - s->block_wrap[i]])
  3415. || ((s->mb_x || (i == 1 || i == 3)) && v->mb_type[0][s->block_index[i] - 1])) {
  3416. intrapred = 1;
  3417. break;
  3418. }
  3419. }
  3420. if (intrapred)
  3421. s->ac_pred = get_bits1(gb);
  3422. else
  3423. s->ac_pred = 0;
  3424. }
  3425. if (!v->ttmbf && coded_inter)
  3426. ttmb = get_vlc2(gb, ff_vc1_ttmb_vlc[v->tt_index].table, VC1_TTMB_VLC_BITS, 2);
  3427. for (i = 0; i < 6; i++) {
  3428. dst_idx += i >> 2;
  3429. off = (i & 4) ? 0 : ((i & 1) * 8 + (i & 2) * 4 * s->linesize);
  3430. s->mb_intra = is_intra[i];
  3431. if (is_intra[i]) {
  3432. /* check if prediction blocks A and C are available */
  3433. v->a_avail = v->c_avail = 0;
  3434. if (i == 2 || i == 3 || !s->first_slice_line)
  3435. v->a_avail = v->mb_type[0][s->block_index[i] - s->block_wrap[i]];
  3436. if (i == 1 || i == 3 || s->mb_x)
  3437. v->c_avail = v->mb_type[0][s->block_index[i] - 1];
  3438. vc1_decode_intra_block(v, s->block[i], i, is_coded[i], mquant,
  3439. (i & 4) ? v->codingset2 : v->codingset);
  3440. if ((i>3) && (s->flags & CODEC_FLAG_GRAY))
  3441. continue;
  3442. v->vc1dsp.vc1_inv_trans_8x8(s->block[i]);
  3443. if (v->rangeredfrm)
  3444. for (j = 0; j < 64; j++)
  3445. s->block[i][j] <<= 1;
  3446. s->idsp.put_signed_pixels_clamped(s->block[i],
  3447. s->dest[dst_idx] + off,
  3448. (i & 4) ? s->uvlinesize
  3449. : s->linesize);
  3450. if (v->pq >= 9 && v->overlap) {
  3451. if (v->c_avail)
  3452. v->vc1dsp.vc1_h_overlap(s->dest[dst_idx] + off, i & 4 ? s->uvlinesize : s->linesize);
  3453. if (v->a_avail)
  3454. v->vc1dsp.vc1_v_overlap(s->dest[dst_idx] + off, i & 4 ? s->uvlinesize : s->linesize);
  3455. }
  3456. block_cbp |= 0xF << (i << 2);
  3457. block_intra |= 1 << i;
  3458. } else if (is_coded[i]) {
  3459. pat = vc1_decode_p_block(v, s->block[i], i, mquant, ttmb,
  3460. first_block, s->dest[dst_idx] + off,
  3461. (i & 4) ? s->uvlinesize : s->linesize,
  3462. (i & 4) && (s->flags & CODEC_FLAG_GRAY),
  3463. &block_tt);
  3464. block_cbp |= pat << (i << 2);
  3465. if (!v->ttmbf && ttmb < 8)
  3466. ttmb = -1;
  3467. first_block = 0;
  3468. }
  3469. }
  3470. } else { // skipped MB
  3471. s->mb_intra = 0;
  3472. s->current_picture.qscale_table[mb_pos] = 0;
  3473. for (i = 0; i < 6; i++) {
  3474. v->mb_type[0][s->block_index[i]] = 0;
  3475. s->dc_val[0][s->block_index[i]] = 0;
  3476. }
  3477. for (i = 0; i < 4; i++) {
  3478. vc1_pred_mv(v, i, 0, 0, 0, v->range_x, v->range_y, v->mb_type[0], 0, 0);
  3479. vc1_mc_4mv_luma(v, i, 0, 0);
  3480. }
  3481. vc1_mc_4mv_chroma(v, 0);
  3482. s->current_picture.qscale_table[mb_pos] = 0;
  3483. }
  3484. }
  3485. end:
  3486. v->cbp[s->mb_x] = block_cbp;
  3487. v->ttblk[s->mb_x] = block_tt;
  3488. v->is_intra[s->mb_x] = block_intra;
  3489. return 0;
  3490. }
  3491. /* Decode one macroblock in an interlaced frame p picture */
  3492. static int vc1_decode_p_mb_intfr(VC1Context *v)
  3493. {
  3494. MpegEncContext *s = &v->s;
  3495. GetBitContext *gb = &s->gb;
  3496. int i;
  3497. int mb_pos = s->mb_x + s->mb_y * s->mb_stride;
  3498. int cbp = 0; /* cbp decoding stuff */
  3499. int mqdiff, mquant; /* MB quantization */
  3500. int ttmb = v->ttfrm; /* MB Transform type */
  3501. int mb_has_coeffs = 1; /* last_flag */
  3502. int dmv_x, dmv_y; /* Differential MV components */
  3503. int val; /* temp value */
  3504. int first_block = 1;
  3505. int dst_idx, off;
  3506. int skipped, fourmv = 0, twomv = 0;
  3507. int block_cbp = 0, pat, block_tt = 0;
  3508. int idx_mbmode = 0, mvbp;
  3509. int stride_y, fieldtx;
  3510. mquant = v->pq; /* Loosy initialization */
  3511. if (v->skip_is_raw)
  3512. skipped = get_bits1(gb);
  3513. else
  3514. skipped = v->s.mbskip_table[mb_pos];
  3515. if (!skipped) {
  3516. if (v->fourmvswitch)
  3517. idx_mbmode = get_vlc2(gb, v->mbmode_vlc->table, VC1_INTFR_4MV_MBMODE_VLC_BITS, 2); // try getting this done
  3518. else
  3519. idx_mbmode = get_vlc2(gb, v->mbmode_vlc->table, VC1_INTFR_NON4MV_MBMODE_VLC_BITS, 2); // in a single line
  3520. switch (ff_vc1_mbmode_intfrp[v->fourmvswitch][idx_mbmode][0]) {
  3521. /* store the motion vector type in a flag (useful later) */
  3522. case MV_PMODE_INTFR_4MV:
  3523. fourmv = 1;
  3524. v->blk_mv_type[s->block_index[0]] = 0;
  3525. v->blk_mv_type[s->block_index[1]] = 0;
  3526. v->blk_mv_type[s->block_index[2]] = 0;
  3527. v->blk_mv_type[s->block_index[3]] = 0;
  3528. break;
  3529. case MV_PMODE_INTFR_4MV_FIELD:
  3530. fourmv = 1;
  3531. v->blk_mv_type[s->block_index[0]] = 1;
  3532. v->blk_mv_type[s->block_index[1]] = 1;
  3533. v->blk_mv_type[s->block_index[2]] = 1;
  3534. v->blk_mv_type[s->block_index[3]] = 1;
  3535. break;
  3536. case MV_PMODE_INTFR_2MV_FIELD:
  3537. twomv = 1;
  3538. v->blk_mv_type[s->block_index[0]] = 1;
  3539. v->blk_mv_type[s->block_index[1]] = 1;
  3540. v->blk_mv_type[s->block_index[2]] = 1;
  3541. v->blk_mv_type[s->block_index[3]] = 1;
  3542. break;
  3543. case MV_PMODE_INTFR_1MV:
  3544. v->blk_mv_type[s->block_index[0]] = 0;
  3545. v->blk_mv_type[s->block_index[1]] = 0;
  3546. v->blk_mv_type[s->block_index[2]] = 0;
  3547. v->blk_mv_type[s->block_index[3]] = 0;
  3548. break;
  3549. }
  3550. if (ff_vc1_mbmode_intfrp[v->fourmvswitch][idx_mbmode][0] == MV_PMODE_INTFR_INTRA) { // intra MB
  3551. for (i = 0; i < 4; i++) {
  3552. s->current_picture.motion_val[1][s->block_index[i]][0] = 0;
  3553. s->current_picture.motion_val[1][s->block_index[i]][1] = 0;
  3554. }
  3555. s->current_picture.mb_type[mb_pos] = MB_TYPE_INTRA;
  3556. s->mb_intra = v->is_intra[s->mb_x] = 1;
  3557. for (i = 0; i < 6; i++)
  3558. v->mb_type[0][s->block_index[i]] = 1;
  3559. fieldtx = v->fieldtx_plane[mb_pos] = get_bits1(gb);
  3560. mb_has_coeffs = get_bits1(gb);
  3561. if (mb_has_coeffs)
  3562. cbp = 1 + get_vlc2(&v->s.gb, v->cbpcy_vlc->table, VC1_CBPCY_P_VLC_BITS, 2);
  3563. v->s.ac_pred = v->acpred_plane[mb_pos] = get_bits1(gb);
  3564. GET_MQUANT();
  3565. s->current_picture.qscale_table[mb_pos] = mquant;
  3566. /* Set DC scale - y and c use the same (not sure if necessary here) */
  3567. s->y_dc_scale = s->y_dc_scale_table[mquant];
  3568. s->c_dc_scale = s->c_dc_scale_table[mquant];
  3569. dst_idx = 0;
  3570. for (i = 0; i < 6; i++) {
  3571. s->dc_val[0][s->block_index[i]] = 0;
  3572. dst_idx += i >> 2;
  3573. val = ((cbp >> (5 - i)) & 1);
  3574. v->mb_type[0][s->block_index[i]] = s->mb_intra;
  3575. v->a_avail = v->c_avail = 0;
  3576. if (i == 2 || i == 3 || !s->first_slice_line)
  3577. v->a_avail = v->mb_type[0][s->block_index[i] - s->block_wrap[i]];
  3578. if (i == 1 || i == 3 || s->mb_x)
  3579. v->c_avail = v->mb_type[0][s->block_index[i] - 1];
  3580. vc1_decode_intra_block(v, s->block[i], i, val, mquant,
  3581. (i & 4) ? v->codingset2 : v->codingset);
  3582. if ((i>3) && (s->flags & CODEC_FLAG_GRAY)) continue;
  3583. v->vc1dsp.vc1_inv_trans_8x8(s->block[i]);
  3584. if (i < 4) {
  3585. stride_y = s->linesize << fieldtx;
  3586. off = (fieldtx) ? ((i & 1) * 8) + ((i & 2) >> 1) * s->linesize : (i & 1) * 8 + 4 * (i & 2) * s->linesize;
  3587. } else {
  3588. stride_y = s->uvlinesize;
  3589. off = 0;
  3590. }
  3591. s->idsp.put_signed_pixels_clamped(s->block[i],
  3592. s->dest[dst_idx] + off,
  3593. stride_y);
  3594. //TODO: loop filter
  3595. }
  3596. } else { // inter MB
  3597. mb_has_coeffs = ff_vc1_mbmode_intfrp[v->fourmvswitch][idx_mbmode][3];
  3598. if (mb_has_coeffs)
  3599. cbp = 1 + get_vlc2(&v->s.gb, v->cbpcy_vlc->table, VC1_CBPCY_P_VLC_BITS, 2);
  3600. if (ff_vc1_mbmode_intfrp[v->fourmvswitch][idx_mbmode][0] == MV_PMODE_INTFR_2MV_FIELD) {
  3601. v->twomvbp = get_vlc2(gb, v->twomvbp_vlc->table, VC1_2MV_BLOCK_PATTERN_VLC_BITS, 1);
  3602. } else {
  3603. if ((ff_vc1_mbmode_intfrp[v->fourmvswitch][idx_mbmode][0] == MV_PMODE_INTFR_4MV)
  3604. || (ff_vc1_mbmode_intfrp[v->fourmvswitch][idx_mbmode][0] == MV_PMODE_INTFR_4MV_FIELD)) {
  3605. v->fourmvbp = get_vlc2(gb, v->fourmvbp_vlc->table, VC1_4MV_BLOCK_PATTERN_VLC_BITS, 1);
  3606. }
  3607. }
  3608. s->mb_intra = v->is_intra[s->mb_x] = 0;
  3609. for (i = 0; i < 6; i++)
  3610. v->mb_type[0][s->block_index[i]] = 0;
  3611. fieldtx = v->fieldtx_plane[mb_pos] = ff_vc1_mbmode_intfrp[v->fourmvswitch][idx_mbmode][1];
  3612. /* for all motion vector read MVDATA and motion compensate each block */
  3613. dst_idx = 0;
  3614. if (fourmv) {
  3615. mvbp = v->fourmvbp;
  3616. for (i = 0; i < 6; i++) {
  3617. if (i < 4) {
  3618. dmv_x = dmv_y = 0;
  3619. val = ((mvbp >> (3 - i)) & 1);
  3620. if (val) {
  3621. get_mvdata_interlaced(v, &dmv_x, &dmv_y, 0);
  3622. }
  3623. vc1_pred_mv_intfr(v, i, dmv_x, dmv_y, 0, v->range_x, v->range_y, v->mb_type[0], 0);
  3624. vc1_mc_4mv_luma(v, i, 0, 0);
  3625. } else if (i == 4) {
  3626. vc1_mc_4mv_chroma4(v, 0, 0, 0);
  3627. }
  3628. }
  3629. } else if (twomv) {
  3630. mvbp = v->twomvbp;
  3631. dmv_x = dmv_y = 0;
  3632. if (mvbp & 2) {
  3633. get_mvdata_interlaced(v, &dmv_x, &dmv_y, 0);
  3634. }
  3635. vc1_pred_mv_intfr(v, 0, dmv_x, dmv_y, 2, v->range_x, v->range_y, v->mb_type[0], 0);
  3636. vc1_mc_4mv_luma(v, 0, 0, 0);
  3637. vc1_mc_4mv_luma(v, 1, 0, 0);
  3638. dmv_x = dmv_y = 0;
  3639. if (mvbp & 1) {
  3640. get_mvdata_interlaced(v, &dmv_x, &dmv_y, 0);
  3641. }
  3642. vc1_pred_mv_intfr(v, 2, dmv_x, dmv_y, 2, v->range_x, v->range_y, v->mb_type[0], 0);
  3643. vc1_mc_4mv_luma(v, 2, 0, 0);
  3644. vc1_mc_4mv_luma(v, 3, 0, 0);
  3645. vc1_mc_4mv_chroma4(v, 0, 0, 0);
  3646. } else {
  3647. mvbp = ff_vc1_mbmode_intfrp[v->fourmvswitch][idx_mbmode][2];
  3648. dmv_x = dmv_y = 0;
  3649. if (mvbp) {
  3650. get_mvdata_interlaced(v, &dmv_x, &dmv_y, 0);
  3651. }
  3652. vc1_pred_mv_intfr(v, 0, dmv_x, dmv_y, 1, v->range_x, v->range_y, v->mb_type[0], 0);
  3653. vc1_mc_1mv(v, 0);
  3654. }
  3655. if (cbp)
  3656. GET_MQUANT(); // p. 227
  3657. s->current_picture.qscale_table[mb_pos] = mquant;
  3658. if (!v->ttmbf && cbp)
  3659. ttmb = get_vlc2(gb, ff_vc1_ttmb_vlc[v->tt_index].table, VC1_TTMB_VLC_BITS, 2);
  3660. for (i = 0; i < 6; i++) {
  3661. s->dc_val[0][s->block_index[i]] = 0;
  3662. dst_idx += i >> 2;
  3663. val = ((cbp >> (5 - i)) & 1);
  3664. if (!fieldtx)
  3665. off = (i & 4) ? 0 : ((i & 1) * 8 + (i & 2) * 4 * s->linesize);
  3666. else
  3667. off = (i & 4) ? 0 : ((i & 1) * 8 + ((i > 1) * s->linesize));
  3668. if (val) {
  3669. pat = vc1_decode_p_block(v, s->block[i], i, mquant, ttmb,
  3670. first_block, s->dest[dst_idx] + off,
  3671. (i & 4) ? s->uvlinesize : (s->linesize << fieldtx),
  3672. (i & 4) && (s->flags & CODEC_FLAG_GRAY), &block_tt);
  3673. block_cbp |= pat << (i << 2);
  3674. if (!v->ttmbf && ttmb < 8)
  3675. ttmb = -1;
  3676. first_block = 0;
  3677. }
  3678. }
  3679. }
  3680. } else { // skipped
  3681. s->mb_intra = v->is_intra[s->mb_x] = 0;
  3682. for (i = 0; i < 6; i++) {
  3683. v->mb_type[0][s->block_index[i]] = 0;
  3684. s->dc_val[0][s->block_index[i]] = 0;
  3685. }
  3686. s->current_picture.mb_type[mb_pos] = MB_TYPE_SKIP;
  3687. s->current_picture.qscale_table[mb_pos] = 0;
  3688. v->blk_mv_type[s->block_index[0]] = 0;
  3689. v->blk_mv_type[s->block_index[1]] = 0;
  3690. v->blk_mv_type[s->block_index[2]] = 0;
  3691. v->blk_mv_type[s->block_index[3]] = 0;
  3692. vc1_pred_mv_intfr(v, 0, 0, 0, 1, v->range_x, v->range_y, v->mb_type[0], 0);
  3693. vc1_mc_1mv(v, 0);
  3694. }
  3695. if (s->mb_x == s->mb_width - 1)
  3696. memmove(v->is_intra_base, v->is_intra, sizeof(v->is_intra_base[0])*s->mb_stride);
  3697. return 0;
  3698. }
  3699. static int vc1_decode_p_mb_intfi(VC1Context *v)
  3700. {
  3701. MpegEncContext *s = &v->s;
  3702. GetBitContext *gb = &s->gb;
  3703. int i;
  3704. int mb_pos = s->mb_x + s->mb_y * s->mb_stride;
  3705. int cbp = 0; /* cbp decoding stuff */
  3706. int mqdiff, mquant; /* MB quantization */
  3707. int ttmb = v->ttfrm; /* MB Transform type */
  3708. int mb_has_coeffs = 1; /* last_flag */
  3709. int dmv_x, dmv_y; /* Differential MV components */
  3710. int val; /* temp values */
  3711. int first_block = 1;
  3712. int dst_idx, off;
  3713. int pred_flag;
  3714. int block_cbp = 0, pat, block_tt = 0;
  3715. int idx_mbmode = 0;
  3716. mquant = v->pq; /* Loosy initialization */
  3717. idx_mbmode = get_vlc2(gb, v->mbmode_vlc->table, VC1_IF_MBMODE_VLC_BITS, 2);
  3718. if (idx_mbmode <= 1) { // intra MB
  3719. s->mb_intra = v->is_intra[s->mb_x] = 1;
  3720. s->current_picture.motion_val[1][s->block_index[0] + v->blocks_off][0] = 0;
  3721. s->current_picture.motion_val[1][s->block_index[0] + v->blocks_off][1] = 0;
  3722. s->current_picture.mb_type[mb_pos + v->mb_off] = MB_TYPE_INTRA;
  3723. GET_MQUANT();
  3724. s->current_picture.qscale_table[mb_pos] = mquant;
  3725. /* Set DC scale - y and c use the same (not sure if necessary here) */
  3726. s->y_dc_scale = s->y_dc_scale_table[mquant];
  3727. s->c_dc_scale = s->c_dc_scale_table[mquant];
  3728. v->s.ac_pred = v->acpred_plane[mb_pos] = get_bits1(gb);
  3729. mb_has_coeffs = idx_mbmode & 1;
  3730. if (mb_has_coeffs)
  3731. cbp = 1 + get_vlc2(&v->s.gb, v->cbpcy_vlc->table, VC1_ICBPCY_VLC_BITS, 2);
  3732. dst_idx = 0;
  3733. for (i = 0; i < 6; i++) {
  3734. s->dc_val[0][s->block_index[i]] = 0;
  3735. v->mb_type[0][s->block_index[i]] = 1;
  3736. dst_idx += i >> 2;
  3737. val = ((cbp >> (5 - i)) & 1);
  3738. v->a_avail = v->c_avail = 0;
  3739. if (i == 2 || i == 3 || !s->first_slice_line)
  3740. v->a_avail = v->mb_type[0][s->block_index[i] - s->block_wrap[i]];
  3741. if (i == 1 || i == 3 || s->mb_x)
  3742. v->c_avail = v->mb_type[0][s->block_index[i] - 1];
  3743. vc1_decode_intra_block(v, s->block[i], i, val, mquant,
  3744. (i & 4) ? v->codingset2 : v->codingset);
  3745. if ((i>3) && (s->flags & CODEC_FLAG_GRAY))
  3746. continue;
  3747. v->vc1dsp.vc1_inv_trans_8x8(s->block[i]);
  3748. off = (i & 4) ? 0 : ((i & 1) * 8 + (i & 2) * 4 * s->linesize);
  3749. s->idsp.put_signed_pixels_clamped(s->block[i],
  3750. s->dest[dst_idx] + off,
  3751. (i & 4) ? s->uvlinesize
  3752. : s->linesize);
  3753. // TODO: loop filter
  3754. }
  3755. } else {
  3756. s->mb_intra = v->is_intra[s->mb_x] = 0;
  3757. s->current_picture.mb_type[mb_pos + v->mb_off] = MB_TYPE_16x16;
  3758. for (i = 0; i < 6; i++) v->mb_type[0][s->block_index[i]] = 0;
  3759. if (idx_mbmode <= 5) { // 1-MV
  3760. dmv_x = dmv_y = pred_flag = 0;
  3761. if (idx_mbmode & 1) {
  3762. get_mvdata_interlaced(v, &dmv_x, &dmv_y, &pred_flag);
  3763. }
  3764. vc1_pred_mv(v, 0, dmv_x, dmv_y, 1, v->range_x, v->range_y, v->mb_type[0], pred_flag, 0);
  3765. vc1_mc_1mv(v, 0);
  3766. mb_has_coeffs = !(idx_mbmode & 2);
  3767. } else { // 4-MV
  3768. v->fourmvbp = get_vlc2(gb, v->fourmvbp_vlc->table, VC1_4MV_BLOCK_PATTERN_VLC_BITS, 1);
  3769. for (i = 0; i < 6; i++) {
  3770. if (i < 4) {
  3771. dmv_x = dmv_y = pred_flag = 0;
  3772. val = ((v->fourmvbp >> (3 - i)) & 1);
  3773. if (val) {
  3774. get_mvdata_interlaced(v, &dmv_x, &dmv_y, &pred_flag);
  3775. }
  3776. vc1_pred_mv(v, i, dmv_x, dmv_y, 0, v->range_x, v->range_y, v->mb_type[0], pred_flag, 0);
  3777. vc1_mc_4mv_luma(v, i, 0, 0);
  3778. } else if (i == 4)
  3779. vc1_mc_4mv_chroma(v, 0);
  3780. }
  3781. mb_has_coeffs = idx_mbmode & 1;
  3782. }
  3783. if (mb_has_coeffs)
  3784. cbp = 1 + get_vlc2(&v->s.gb, v->cbpcy_vlc->table, VC1_CBPCY_P_VLC_BITS, 2);
  3785. if (cbp) {
  3786. GET_MQUANT();
  3787. }
  3788. s->current_picture.qscale_table[mb_pos] = mquant;
  3789. if (!v->ttmbf && cbp) {
  3790. ttmb = get_vlc2(gb, ff_vc1_ttmb_vlc[v->tt_index].table, VC1_TTMB_VLC_BITS, 2);
  3791. }
  3792. dst_idx = 0;
  3793. for (i = 0; i < 6; i++) {
  3794. s->dc_val[0][s->block_index[i]] = 0;
  3795. dst_idx += i >> 2;
  3796. val = ((cbp >> (5 - i)) & 1);
  3797. off = (i & 4) ? 0 : (i & 1) * 8 + (i & 2) * 4 * s->linesize;
  3798. if (val) {
  3799. pat = vc1_decode_p_block(v, s->block[i], i, mquant, ttmb,
  3800. first_block, s->dest[dst_idx] + off,
  3801. (i & 4) ? s->uvlinesize : s->linesize,
  3802. (i & 4) && (s->flags & CODEC_FLAG_GRAY),
  3803. &block_tt);
  3804. block_cbp |= pat << (i << 2);
  3805. if (!v->ttmbf && ttmb < 8) ttmb = -1;
  3806. first_block = 0;
  3807. }
  3808. }
  3809. }
  3810. if (s->mb_x == s->mb_width - 1)
  3811. memmove(v->is_intra_base, v->is_intra, sizeof(v->is_intra_base[0]) * s->mb_stride);
  3812. return 0;
  3813. }
  3814. /** Decode one B-frame MB (in Main profile)
  3815. */
  3816. static void vc1_decode_b_mb(VC1Context *v)
  3817. {
  3818. MpegEncContext *s = &v->s;
  3819. GetBitContext *gb = &s->gb;
  3820. int i, j;
  3821. int mb_pos = s->mb_x + s->mb_y * s->mb_stride;
  3822. int cbp = 0; /* cbp decoding stuff */
  3823. int mqdiff, mquant; /* MB quantization */
  3824. int ttmb = v->ttfrm; /* MB Transform type */
  3825. int mb_has_coeffs = 0; /* last_flag */
  3826. int index, index1; /* LUT indexes */
  3827. int val, sign; /* temp values */
  3828. int first_block = 1;
  3829. int dst_idx, off;
  3830. int skipped, direct;
  3831. int dmv_x[2], dmv_y[2];
  3832. int bmvtype = BMV_TYPE_BACKWARD;
  3833. mquant = v->pq; /* lossy initialization */
  3834. s->mb_intra = 0;
  3835. if (v->dmb_is_raw)
  3836. direct = get_bits1(gb);
  3837. else
  3838. direct = v->direct_mb_plane[mb_pos];
  3839. if (v->skip_is_raw)
  3840. skipped = get_bits1(gb);
  3841. else
  3842. skipped = v->s.mbskip_table[mb_pos];
  3843. dmv_x[0] = dmv_x[1] = dmv_y[0] = dmv_y[1] = 0;
  3844. for (i = 0; i < 6; i++) {
  3845. v->mb_type[0][s->block_index[i]] = 0;
  3846. s->dc_val[0][s->block_index[i]] = 0;
  3847. }
  3848. s->current_picture.qscale_table[mb_pos] = 0;
  3849. if (!direct) {
  3850. if (!skipped) {
  3851. GET_MVDATA(dmv_x[0], dmv_y[0]);
  3852. dmv_x[1] = dmv_x[0];
  3853. dmv_y[1] = dmv_y[0];
  3854. }
  3855. if (skipped || !s->mb_intra) {
  3856. bmvtype = decode012(gb);
  3857. switch (bmvtype) {
  3858. case 0:
  3859. bmvtype = (v->bfraction >= (B_FRACTION_DEN/2)) ? BMV_TYPE_BACKWARD : BMV_TYPE_FORWARD;
  3860. break;
  3861. case 1:
  3862. bmvtype = (v->bfraction >= (B_FRACTION_DEN/2)) ? BMV_TYPE_FORWARD : BMV_TYPE_BACKWARD;
  3863. break;
  3864. case 2:
  3865. bmvtype = BMV_TYPE_INTERPOLATED;
  3866. dmv_x[0] = dmv_y[0] = 0;
  3867. }
  3868. }
  3869. }
  3870. for (i = 0; i < 6; i++)
  3871. v->mb_type[0][s->block_index[i]] = s->mb_intra;
  3872. if (skipped) {
  3873. if (direct)
  3874. bmvtype = BMV_TYPE_INTERPOLATED;
  3875. vc1_pred_b_mv(v, dmv_x, dmv_y, direct, bmvtype);
  3876. vc1_b_mc(v, dmv_x, dmv_y, direct, bmvtype);
  3877. return;
  3878. }
  3879. if (direct) {
  3880. cbp = get_vlc2(&v->s.gb, v->cbpcy_vlc->table, VC1_CBPCY_P_VLC_BITS, 2);
  3881. GET_MQUANT();
  3882. s->mb_intra = 0;
  3883. s->current_picture.qscale_table[mb_pos] = mquant;
  3884. if (!v->ttmbf)
  3885. ttmb = get_vlc2(gb, ff_vc1_ttmb_vlc[v->tt_index].table, VC1_TTMB_VLC_BITS, 2);
  3886. dmv_x[0] = dmv_y[0] = dmv_x[1] = dmv_y[1] = 0;
  3887. vc1_pred_b_mv(v, dmv_x, dmv_y, direct, bmvtype);
  3888. vc1_b_mc(v, dmv_x, dmv_y, direct, bmvtype);
  3889. } else {
  3890. if (!mb_has_coeffs && !s->mb_intra) {
  3891. /* no coded blocks - effectively skipped */
  3892. vc1_pred_b_mv(v, dmv_x, dmv_y, direct, bmvtype);
  3893. vc1_b_mc(v, dmv_x, dmv_y, direct, bmvtype);
  3894. return;
  3895. }
  3896. if (s->mb_intra && !mb_has_coeffs) {
  3897. GET_MQUANT();
  3898. s->current_picture.qscale_table[mb_pos] = mquant;
  3899. s->ac_pred = get_bits1(gb);
  3900. cbp = 0;
  3901. vc1_pred_b_mv(v, dmv_x, dmv_y, direct, bmvtype);
  3902. } else {
  3903. if (bmvtype == BMV_TYPE_INTERPOLATED) {
  3904. GET_MVDATA(dmv_x[0], dmv_y[0]);
  3905. if (!mb_has_coeffs) {
  3906. /* interpolated skipped block */
  3907. vc1_pred_b_mv(v, dmv_x, dmv_y, direct, bmvtype);
  3908. vc1_b_mc(v, dmv_x, dmv_y, direct, bmvtype);
  3909. return;
  3910. }
  3911. }
  3912. vc1_pred_b_mv(v, dmv_x, dmv_y, direct, bmvtype);
  3913. if (!s->mb_intra) {
  3914. vc1_b_mc(v, dmv_x, dmv_y, direct, bmvtype);
  3915. }
  3916. if (s->mb_intra)
  3917. s->ac_pred = get_bits1(gb);
  3918. cbp = get_vlc2(&v->s.gb, v->cbpcy_vlc->table, VC1_CBPCY_P_VLC_BITS, 2);
  3919. GET_MQUANT();
  3920. s->current_picture.qscale_table[mb_pos] = mquant;
  3921. if (!v->ttmbf && !s->mb_intra && mb_has_coeffs)
  3922. ttmb = get_vlc2(gb, ff_vc1_ttmb_vlc[v->tt_index].table, VC1_TTMB_VLC_BITS, 2);
  3923. }
  3924. }
  3925. dst_idx = 0;
  3926. for (i = 0; i < 6; i++) {
  3927. s->dc_val[0][s->block_index[i]] = 0;
  3928. dst_idx += i >> 2;
  3929. val = ((cbp >> (5 - i)) & 1);
  3930. off = (i & 4) ? 0 : ((i & 1) * 8 + (i & 2) * 4 * s->linesize);
  3931. v->mb_type[0][s->block_index[i]] = s->mb_intra;
  3932. if (s->mb_intra) {
  3933. /* check if prediction blocks A and C are available */
  3934. v->a_avail = v->c_avail = 0;
  3935. if (i == 2 || i == 3 || !s->first_slice_line)
  3936. v->a_avail = v->mb_type[0][s->block_index[i] - s->block_wrap[i]];
  3937. if (i == 1 || i == 3 || s->mb_x)
  3938. v->c_avail = v->mb_type[0][s->block_index[i] - 1];
  3939. vc1_decode_intra_block(v, s->block[i], i, val, mquant,
  3940. (i & 4) ? v->codingset2 : v->codingset);
  3941. if ((i>3) && (s->flags & CODEC_FLAG_GRAY))
  3942. continue;
  3943. v->vc1dsp.vc1_inv_trans_8x8(s->block[i]);
  3944. if (v->rangeredfrm)
  3945. for (j = 0; j < 64; j++)
  3946. s->block[i][j] <<= 1;
  3947. s->idsp.put_signed_pixels_clamped(s->block[i],
  3948. s->dest[dst_idx] + off,
  3949. i & 4 ? s->uvlinesize
  3950. : s->linesize);
  3951. } else if (val) {
  3952. vc1_decode_p_block(v, s->block[i], i, mquant, ttmb,
  3953. first_block, s->dest[dst_idx] + off,
  3954. (i & 4) ? s->uvlinesize : s->linesize,
  3955. (i & 4) && (s->flags & CODEC_FLAG_GRAY), NULL);
  3956. if (!v->ttmbf && ttmb < 8)
  3957. ttmb = -1;
  3958. first_block = 0;
  3959. }
  3960. }
  3961. }
  3962. /** Decode one B-frame MB (in interlaced field B picture)
  3963. */
  3964. static void vc1_decode_b_mb_intfi(VC1Context *v)
  3965. {
  3966. MpegEncContext *s = &v->s;
  3967. GetBitContext *gb = &s->gb;
  3968. int i, j;
  3969. int mb_pos = s->mb_x + s->mb_y * s->mb_stride;
  3970. int cbp = 0; /* cbp decoding stuff */
  3971. int mqdiff, mquant; /* MB quantization */
  3972. int ttmb = v->ttfrm; /* MB Transform type */
  3973. int mb_has_coeffs = 0; /* last_flag */
  3974. int val; /* temp value */
  3975. int first_block = 1;
  3976. int dst_idx, off;
  3977. int fwd;
  3978. int dmv_x[2], dmv_y[2], pred_flag[2];
  3979. int bmvtype = BMV_TYPE_BACKWARD;
  3980. int idx_mbmode, interpmvp;
  3981. mquant = v->pq; /* Loosy initialization */
  3982. s->mb_intra = 0;
  3983. idx_mbmode = get_vlc2(gb, v->mbmode_vlc->table, VC1_IF_MBMODE_VLC_BITS, 2);
  3984. if (idx_mbmode <= 1) { // intra MB
  3985. s->mb_intra = v->is_intra[s->mb_x] = 1;
  3986. s->current_picture.motion_val[1][s->block_index[0]][0] = 0;
  3987. s->current_picture.motion_val[1][s->block_index[0]][1] = 0;
  3988. s->current_picture.mb_type[mb_pos + v->mb_off] = MB_TYPE_INTRA;
  3989. GET_MQUANT();
  3990. s->current_picture.qscale_table[mb_pos] = mquant;
  3991. /* Set DC scale - y and c use the same (not sure if necessary here) */
  3992. s->y_dc_scale = s->y_dc_scale_table[mquant];
  3993. s->c_dc_scale = s->c_dc_scale_table[mquant];
  3994. v->s.ac_pred = v->acpred_plane[mb_pos] = get_bits1(gb);
  3995. mb_has_coeffs = idx_mbmode & 1;
  3996. if (mb_has_coeffs)
  3997. cbp = 1 + get_vlc2(&v->s.gb, v->cbpcy_vlc->table, VC1_ICBPCY_VLC_BITS, 2);
  3998. dst_idx = 0;
  3999. for (i = 0; i < 6; i++) {
  4000. s->dc_val[0][s->block_index[i]] = 0;
  4001. dst_idx += i >> 2;
  4002. val = ((cbp >> (5 - i)) & 1);
  4003. v->mb_type[0][s->block_index[i]] = s->mb_intra;
  4004. v->a_avail = v->c_avail = 0;
  4005. if (i == 2 || i == 3 || !s->first_slice_line)
  4006. v->a_avail = v->mb_type[0][s->block_index[i] - s->block_wrap[i]];
  4007. if (i == 1 || i == 3 || s->mb_x)
  4008. v->c_avail = v->mb_type[0][s->block_index[i] - 1];
  4009. vc1_decode_intra_block(v, s->block[i], i, val, mquant,
  4010. (i & 4) ? v->codingset2 : v->codingset);
  4011. if ((i>3) && (s->flags & CODEC_FLAG_GRAY))
  4012. continue;
  4013. v->vc1dsp.vc1_inv_trans_8x8(s->block[i]);
  4014. if (v->rangeredfrm)
  4015. for (j = 0; j < 64; j++)
  4016. s->block[i][j] <<= 1;
  4017. off = (i & 4) ? 0 : ((i & 1) * 8 + (i & 2) * 4 * s->linesize);
  4018. s->idsp.put_signed_pixels_clamped(s->block[i],
  4019. s->dest[dst_idx] + off,
  4020. (i & 4) ? s->uvlinesize
  4021. : s->linesize);
  4022. // TODO: yet to perform loop filter
  4023. }
  4024. } else {
  4025. s->mb_intra = v->is_intra[s->mb_x] = 0;
  4026. s->current_picture.mb_type[mb_pos + v->mb_off] = MB_TYPE_16x16;
  4027. for (i = 0; i < 6; i++) v->mb_type[0][s->block_index[i]] = 0;
  4028. if (v->fmb_is_raw)
  4029. fwd = v->forward_mb_plane[mb_pos] = get_bits1(gb);
  4030. else
  4031. fwd = v->forward_mb_plane[mb_pos];
  4032. if (idx_mbmode <= 5) { // 1-MV
  4033. dmv_x[0] = dmv_x[1] = dmv_y[0] = dmv_y[1] = 0;
  4034. pred_flag[0] = pred_flag[1] = 0;
  4035. if (fwd)
  4036. bmvtype = BMV_TYPE_FORWARD;
  4037. else {
  4038. bmvtype = decode012(gb);
  4039. switch (bmvtype) {
  4040. case 0:
  4041. bmvtype = BMV_TYPE_BACKWARD;
  4042. break;
  4043. case 1:
  4044. bmvtype = BMV_TYPE_DIRECT;
  4045. break;
  4046. case 2:
  4047. bmvtype = BMV_TYPE_INTERPOLATED;
  4048. interpmvp = get_bits1(gb);
  4049. }
  4050. }
  4051. v->bmvtype = bmvtype;
  4052. if (bmvtype != BMV_TYPE_DIRECT && idx_mbmode & 1) {
  4053. get_mvdata_interlaced(v, &dmv_x[bmvtype == BMV_TYPE_BACKWARD], &dmv_y[bmvtype == BMV_TYPE_BACKWARD], &pred_flag[bmvtype == BMV_TYPE_BACKWARD]);
  4054. }
  4055. if (bmvtype == BMV_TYPE_INTERPOLATED && interpmvp) {
  4056. get_mvdata_interlaced(v, &dmv_x[1], &dmv_y[1], &pred_flag[1]);
  4057. }
  4058. if (bmvtype == BMV_TYPE_DIRECT) {
  4059. dmv_x[0] = dmv_y[0] = pred_flag[0] = 0;
  4060. dmv_x[1] = dmv_y[1] = pred_flag[0] = 0;
  4061. }
  4062. vc1_pred_b_mv_intfi(v, 0, dmv_x, dmv_y, 1, pred_flag);
  4063. vc1_b_mc(v, dmv_x, dmv_y, (bmvtype == BMV_TYPE_DIRECT), bmvtype);
  4064. mb_has_coeffs = !(idx_mbmode & 2);
  4065. } else { // 4-MV
  4066. if (fwd)
  4067. bmvtype = BMV_TYPE_FORWARD;
  4068. v->bmvtype = bmvtype;
  4069. v->fourmvbp = get_vlc2(gb, v->fourmvbp_vlc->table, VC1_4MV_BLOCK_PATTERN_VLC_BITS, 1);
  4070. for (i = 0; i < 6; i++) {
  4071. if (i < 4) {
  4072. dmv_x[0] = dmv_y[0] = pred_flag[0] = 0;
  4073. dmv_x[1] = dmv_y[1] = pred_flag[1] = 0;
  4074. val = ((v->fourmvbp >> (3 - i)) & 1);
  4075. if (val) {
  4076. get_mvdata_interlaced(v, &dmv_x[bmvtype == BMV_TYPE_BACKWARD],
  4077. &dmv_y[bmvtype == BMV_TYPE_BACKWARD],
  4078. &pred_flag[bmvtype == BMV_TYPE_BACKWARD]);
  4079. }
  4080. vc1_pred_b_mv_intfi(v, i, dmv_x, dmv_y, 0, pred_flag);
  4081. vc1_mc_4mv_luma(v, i, bmvtype == BMV_TYPE_BACKWARD, 0);
  4082. } else if (i == 4)
  4083. vc1_mc_4mv_chroma(v, bmvtype == BMV_TYPE_BACKWARD);
  4084. }
  4085. mb_has_coeffs = idx_mbmode & 1;
  4086. }
  4087. if (mb_has_coeffs)
  4088. cbp = 1 + get_vlc2(&v->s.gb, v->cbpcy_vlc->table, VC1_CBPCY_P_VLC_BITS, 2);
  4089. if (cbp) {
  4090. GET_MQUANT();
  4091. }
  4092. s->current_picture.qscale_table[mb_pos] = mquant;
  4093. if (!v->ttmbf && cbp) {
  4094. ttmb = get_vlc2(gb, ff_vc1_ttmb_vlc[v->tt_index].table, VC1_TTMB_VLC_BITS, 2);
  4095. }
  4096. dst_idx = 0;
  4097. for (i = 0; i < 6; i++) {
  4098. s->dc_val[0][s->block_index[i]] = 0;
  4099. dst_idx += i >> 2;
  4100. val = ((cbp >> (5 - i)) & 1);
  4101. off = (i & 4) ? 0 : (i & 1) * 8 + (i & 2) * 4 * s->linesize;
  4102. if (val) {
  4103. vc1_decode_p_block(v, s->block[i], i, mquant, ttmb,
  4104. first_block, s->dest[dst_idx] + off,
  4105. (i & 4) ? s->uvlinesize : s->linesize,
  4106. (i & 4) && (s->flags & CODEC_FLAG_GRAY), NULL);
  4107. if (!v->ttmbf && ttmb < 8)
  4108. ttmb = -1;
  4109. first_block = 0;
  4110. }
  4111. }
  4112. }
  4113. }
  4114. /** Decode one B-frame MB (in interlaced frame B picture)
  4115. */
  4116. static int vc1_decode_b_mb_intfr(VC1Context *v)
  4117. {
  4118. MpegEncContext *s = &v->s;
  4119. GetBitContext *gb = &s->gb;
  4120. int i, j;
  4121. int mb_pos = s->mb_x + s->mb_y * s->mb_stride;
  4122. int cbp = 0; /* cbp decoding stuff */
  4123. int mqdiff, mquant; /* MB quantization */
  4124. int ttmb = v->ttfrm; /* MB Transform type */
  4125. int mvsw = 0; /* motion vector switch */
  4126. int mb_has_coeffs = 1; /* last_flag */
  4127. int dmv_x, dmv_y; /* Differential MV components */
  4128. int val; /* temp value */
  4129. int first_block = 1;
  4130. int dst_idx, off;
  4131. int skipped, direct, twomv = 0;
  4132. int block_cbp = 0, pat, block_tt = 0;
  4133. int idx_mbmode = 0, mvbp;
  4134. int stride_y, fieldtx;
  4135. int bmvtype = BMV_TYPE_BACKWARD;
  4136. int dir, dir2;
  4137. mquant = v->pq; /* Lossy initialization */
  4138. s->mb_intra = 0;
  4139. if (v->skip_is_raw)
  4140. skipped = get_bits1(gb);
  4141. else
  4142. skipped = v->s.mbskip_table[mb_pos];
  4143. if (!skipped) {
  4144. idx_mbmode = get_vlc2(gb, v->mbmode_vlc->table, VC1_INTFR_NON4MV_MBMODE_VLC_BITS, 2);
  4145. if (ff_vc1_mbmode_intfrp[0][idx_mbmode][0] == MV_PMODE_INTFR_2MV_FIELD) {
  4146. twomv = 1;
  4147. v->blk_mv_type[s->block_index[0]] = 1;
  4148. v->blk_mv_type[s->block_index[1]] = 1;
  4149. v->blk_mv_type[s->block_index[2]] = 1;
  4150. v->blk_mv_type[s->block_index[3]] = 1;
  4151. } else {
  4152. v->blk_mv_type[s->block_index[0]] = 0;
  4153. v->blk_mv_type[s->block_index[1]] = 0;
  4154. v->blk_mv_type[s->block_index[2]] = 0;
  4155. v->blk_mv_type[s->block_index[3]] = 0;
  4156. }
  4157. }
  4158. if (v->dmb_is_raw)
  4159. direct = get_bits1(gb);
  4160. else
  4161. direct = v->direct_mb_plane[mb_pos];
  4162. if (direct) {
  4163. s->mv[0][0][0] = s->current_picture.motion_val[0][s->block_index[0]][0] = scale_mv(s->next_picture.motion_val[1][s->block_index[0]][0], v->bfraction, 0, s->quarter_sample);
  4164. s->mv[0][0][1] = s->current_picture.motion_val[0][s->block_index[0]][1] = scale_mv(s->next_picture.motion_val[1][s->block_index[0]][1], v->bfraction, 0, s->quarter_sample);
  4165. s->mv[1][0][0] = s->current_picture.motion_val[1][s->block_index[0]][0] = scale_mv(s->next_picture.motion_val[1][s->block_index[0]][0], v->bfraction, 1, s->quarter_sample);
  4166. s->mv[1][0][1] = s->current_picture.motion_val[1][s->block_index[0]][1] = scale_mv(s->next_picture.motion_val[1][s->block_index[0]][1], v->bfraction, 1, s->quarter_sample);
  4167. if (twomv) {
  4168. s->mv[0][2][0] = s->current_picture.motion_val[0][s->block_index[2]][0] = scale_mv(s->next_picture.motion_val[1][s->block_index[2]][0], v->bfraction, 0, s->quarter_sample);
  4169. s->mv[0][2][1] = s->current_picture.motion_val[0][s->block_index[2]][1] = scale_mv(s->next_picture.motion_val[1][s->block_index[2]][1], v->bfraction, 0, s->quarter_sample);
  4170. s->mv[1][2][0] = s->current_picture.motion_val[1][s->block_index[2]][0] = scale_mv(s->next_picture.motion_val[1][s->block_index[2]][0], v->bfraction, 1, s->quarter_sample);
  4171. s->mv[1][2][1] = s->current_picture.motion_val[1][s->block_index[2]][1] = scale_mv(s->next_picture.motion_val[1][s->block_index[2]][1], v->bfraction, 1, s->quarter_sample);
  4172. for (i = 1; i < 4; i += 2) {
  4173. s->mv[0][i][0] = s->current_picture.motion_val[0][s->block_index[i]][0] = s->mv[0][i-1][0];
  4174. s->mv[0][i][1] = s->current_picture.motion_val[0][s->block_index[i]][1] = s->mv[0][i-1][1];
  4175. s->mv[1][i][0] = s->current_picture.motion_val[1][s->block_index[i]][0] = s->mv[1][i-1][0];
  4176. s->mv[1][i][1] = s->current_picture.motion_val[1][s->block_index[i]][1] = s->mv[1][i-1][1];
  4177. }
  4178. } else {
  4179. for (i = 1; i < 4; i++) {
  4180. s->mv[0][i][0] = s->current_picture.motion_val[0][s->block_index[i]][0] = s->mv[0][0][0];
  4181. s->mv[0][i][1] = s->current_picture.motion_val[0][s->block_index[i]][1] = s->mv[0][0][1];
  4182. s->mv[1][i][0] = s->current_picture.motion_val[1][s->block_index[i]][0] = s->mv[1][0][0];
  4183. s->mv[1][i][1] = s->current_picture.motion_val[1][s->block_index[i]][1] = s->mv[1][0][1];
  4184. }
  4185. }
  4186. }
  4187. if (ff_vc1_mbmode_intfrp[0][idx_mbmode][0] == MV_PMODE_INTFR_INTRA) { // intra MB
  4188. for (i = 0; i < 4; i++) {
  4189. s->mv[0][i][0] = s->current_picture.motion_val[0][s->block_index[i]][0] = 0;
  4190. s->mv[0][i][1] = s->current_picture.motion_val[0][s->block_index[i]][1] = 0;
  4191. s->mv[1][i][0] = s->current_picture.motion_val[1][s->block_index[i]][0] = 0;
  4192. s->mv[1][i][1] = s->current_picture.motion_val[1][s->block_index[i]][1] = 0;
  4193. }
  4194. s->current_picture.mb_type[mb_pos] = MB_TYPE_INTRA;
  4195. s->mb_intra = v->is_intra[s->mb_x] = 1;
  4196. for (i = 0; i < 6; i++)
  4197. v->mb_type[0][s->block_index[i]] = 1;
  4198. fieldtx = v->fieldtx_plane[mb_pos] = get_bits1(gb);
  4199. mb_has_coeffs = get_bits1(gb);
  4200. if (mb_has_coeffs)
  4201. cbp = 1 + get_vlc2(&v->s.gb, v->cbpcy_vlc->table, VC1_CBPCY_P_VLC_BITS, 2);
  4202. v->s.ac_pred = v->acpred_plane[mb_pos] = get_bits1(gb);
  4203. GET_MQUANT();
  4204. s->current_picture.qscale_table[mb_pos] = mquant;
  4205. /* Set DC scale - y and c use the same (not sure if necessary here) */
  4206. s->y_dc_scale = s->y_dc_scale_table[mquant];
  4207. s->c_dc_scale = s->c_dc_scale_table[mquant];
  4208. dst_idx = 0;
  4209. for (i = 0; i < 6; i++) {
  4210. s->dc_val[0][s->block_index[i]] = 0;
  4211. dst_idx += i >> 2;
  4212. val = ((cbp >> (5 - i)) & 1);
  4213. v->mb_type[0][s->block_index[i]] = s->mb_intra;
  4214. v->a_avail = v->c_avail = 0;
  4215. if (i == 2 || i == 3 || !s->first_slice_line)
  4216. v->a_avail = v->mb_type[0][s->block_index[i] - s->block_wrap[i]];
  4217. if (i == 1 || i == 3 || s->mb_x)
  4218. v->c_avail = v->mb_type[0][s->block_index[i] - 1];
  4219. vc1_decode_intra_block(v, s->block[i], i, val, mquant,
  4220. (i & 4) ? v->codingset2 : v->codingset);
  4221. if (i > 3 && (s->flags & CODEC_FLAG_GRAY))
  4222. continue;
  4223. v->vc1dsp.vc1_inv_trans_8x8(s->block[i]);
  4224. if (i < 4) {
  4225. stride_y = s->linesize << fieldtx;
  4226. off = (fieldtx) ? ((i & 1) * 8) + ((i & 2) >> 1) * s->linesize : (i & 1) * 8 + 4 * (i & 2) * s->linesize;
  4227. } else {
  4228. stride_y = s->uvlinesize;
  4229. off = 0;
  4230. }
  4231. s->idsp.put_signed_pixels_clamped(s->block[i],
  4232. s->dest[dst_idx] + off,
  4233. stride_y);
  4234. }
  4235. } else {
  4236. s->mb_intra = v->is_intra[s->mb_x] = 0;
  4237. if (!direct) {
  4238. if (skipped || !s->mb_intra) {
  4239. bmvtype = decode012(gb);
  4240. switch (bmvtype) {
  4241. case 0:
  4242. bmvtype = (v->bfraction >= (B_FRACTION_DEN/2)) ? BMV_TYPE_BACKWARD : BMV_TYPE_FORWARD;
  4243. break;
  4244. case 1:
  4245. bmvtype = (v->bfraction >= (B_FRACTION_DEN/2)) ? BMV_TYPE_FORWARD : BMV_TYPE_BACKWARD;
  4246. break;
  4247. case 2:
  4248. bmvtype = BMV_TYPE_INTERPOLATED;
  4249. }
  4250. }
  4251. if (twomv && bmvtype != BMV_TYPE_INTERPOLATED)
  4252. mvsw = get_bits1(gb);
  4253. }
  4254. if (!skipped) { // inter MB
  4255. mb_has_coeffs = ff_vc1_mbmode_intfrp[0][idx_mbmode][3];
  4256. if (mb_has_coeffs)
  4257. cbp = 1 + get_vlc2(&v->s.gb, v->cbpcy_vlc->table, VC1_CBPCY_P_VLC_BITS, 2);
  4258. if (!direct) {
  4259. if (bmvtype == BMV_TYPE_INTERPOLATED & twomv) {
  4260. v->fourmvbp = get_vlc2(gb, v->fourmvbp_vlc->table, VC1_4MV_BLOCK_PATTERN_VLC_BITS, 1);
  4261. } else if (bmvtype == BMV_TYPE_INTERPOLATED | twomv) {
  4262. v->twomvbp = get_vlc2(gb, v->twomvbp_vlc->table, VC1_2MV_BLOCK_PATTERN_VLC_BITS, 1);
  4263. }
  4264. }
  4265. for (i = 0; i < 6; i++)
  4266. v->mb_type[0][s->block_index[i]] = 0;
  4267. fieldtx = v->fieldtx_plane[mb_pos] = ff_vc1_mbmode_intfrp[0][idx_mbmode][1];
  4268. /* for all motion vector read MVDATA and motion compensate each block */
  4269. dst_idx = 0;
  4270. if (direct) {
  4271. if (twomv) {
  4272. for (i = 0; i < 4; i++) {
  4273. vc1_mc_4mv_luma(v, i, 0, 0);
  4274. vc1_mc_4mv_luma(v, i, 1, 1);
  4275. }
  4276. vc1_mc_4mv_chroma4(v, 0, 0, 0);
  4277. vc1_mc_4mv_chroma4(v, 1, 1, 1);
  4278. } else {
  4279. vc1_mc_1mv(v, 0);
  4280. vc1_interp_mc(v);
  4281. }
  4282. } else if (twomv && bmvtype == BMV_TYPE_INTERPOLATED) {
  4283. mvbp = v->fourmvbp;
  4284. for (i = 0; i < 4; i++) {
  4285. dir = i==1 || i==3;
  4286. dmv_x = dmv_y = 0;
  4287. val = ((mvbp >> (3 - i)) & 1);
  4288. if (val)
  4289. get_mvdata_interlaced(v, &dmv_x, &dmv_y, 0);
  4290. j = i > 1 ? 2 : 0;
  4291. vc1_pred_mv_intfr(v, j, dmv_x, dmv_y, 2, v->range_x, v->range_y, v->mb_type[0], dir);
  4292. vc1_mc_4mv_luma(v, j, dir, dir);
  4293. vc1_mc_4mv_luma(v, j+1, dir, dir);
  4294. }
  4295. vc1_mc_4mv_chroma4(v, 0, 0, 0);
  4296. vc1_mc_4mv_chroma4(v, 1, 1, 1);
  4297. } else if (bmvtype == BMV_TYPE_INTERPOLATED) {
  4298. mvbp = v->twomvbp;
  4299. dmv_x = dmv_y = 0;
  4300. if (mvbp & 2)
  4301. get_mvdata_interlaced(v, &dmv_x, &dmv_y, 0);
  4302. vc1_pred_mv_intfr(v, 0, dmv_x, dmv_y, 1, v->range_x, v->range_y, v->mb_type[0], 0);
  4303. vc1_mc_1mv(v, 0);
  4304. dmv_x = dmv_y = 0;
  4305. if (mvbp & 1)
  4306. get_mvdata_interlaced(v, &dmv_x, &dmv_y, 0);
  4307. vc1_pred_mv_intfr(v, 0, dmv_x, dmv_y, 1, v->range_x, v->range_y, v->mb_type[0], 1);
  4308. vc1_interp_mc(v);
  4309. } else if (twomv) {
  4310. dir = bmvtype == BMV_TYPE_BACKWARD;
  4311. dir2 = dir;
  4312. if (mvsw)
  4313. dir2 = !dir;
  4314. mvbp = v->twomvbp;
  4315. dmv_x = dmv_y = 0;
  4316. if (mvbp & 2)
  4317. get_mvdata_interlaced(v, &dmv_x, &dmv_y, 0);
  4318. vc1_pred_mv_intfr(v, 0, dmv_x, dmv_y, 2, v->range_x, v->range_y, v->mb_type[0], dir);
  4319. dmv_x = dmv_y = 0;
  4320. if (mvbp & 1)
  4321. get_mvdata_interlaced(v, &dmv_x, &dmv_y, 0);
  4322. vc1_pred_mv_intfr(v, 2, dmv_x, dmv_y, 2, v->range_x, v->range_y, v->mb_type[0], dir2);
  4323. if (mvsw) {
  4324. for (i = 0; i < 2; i++) {
  4325. s->mv[dir][i+2][0] = s->mv[dir][i][0] = s->current_picture.motion_val[dir][s->block_index[i+2]][0] = s->current_picture.motion_val[dir][s->block_index[i]][0];
  4326. s->mv[dir][i+2][1] = s->mv[dir][i][1] = s->current_picture.motion_val[dir][s->block_index[i+2]][1] = s->current_picture.motion_val[dir][s->block_index[i]][1];
  4327. s->mv[dir2][i+2][0] = s->mv[dir2][i][0] = s->current_picture.motion_val[dir2][s->block_index[i]][0] = s->current_picture.motion_val[dir2][s->block_index[i+2]][0];
  4328. s->mv[dir2][i+2][1] = s->mv[dir2][i][1] = s->current_picture.motion_val[dir2][s->block_index[i]][1] = s->current_picture.motion_val[dir2][s->block_index[i+2]][1];
  4329. }
  4330. } else {
  4331. vc1_pred_mv_intfr(v, 0, 0, 0, 2, v->range_x, v->range_y, v->mb_type[0], !dir);
  4332. vc1_pred_mv_intfr(v, 2, 0, 0, 2, v->range_x, v->range_y, v->mb_type[0], !dir);
  4333. }
  4334. vc1_mc_4mv_luma(v, 0, dir, 0);
  4335. vc1_mc_4mv_luma(v, 1, dir, 0);
  4336. vc1_mc_4mv_luma(v, 2, dir2, 0);
  4337. vc1_mc_4mv_luma(v, 3, dir2, 0);
  4338. vc1_mc_4mv_chroma4(v, dir, dir2, 0);
  4339. } else {
  4340. dir = bmvtype == BMV_TYPE_BACKWARD;
  4341. mvbp = ff_vc1_mbmode_intfrp[0][idx_mbmode][2];
  4342. dmv_x = dmv_y = 0;
  4343. if (mvbp)
  4344. get_mvdata_interlaced(v, &dmv_x, &dmv_y, 0);
  4345. vc1_pred_mv_intfr(v, 0, dmv_x, dmv_y, 1, v->range_x, v->range_y, v->mb_type[0], dir);
  4346. v->blk_mv_type[s->block_index[0]] = 1;
  4347. v->blk_mv_type[s->block_index[1]] = 1;
  4348. v->blk_mv_type[s->block_index[2]] = 1;
  4349. v->blk_mv_type[s->block_index[3]] = 1;
  4350. vc1_pred_mv_intfr(v, 0, 0, 0, 2, v->range_x, v->range_y, 0, !dir);
  4351. for (i = 0; i < 2; i++) {
  4352. s->mv[!dir][i+2][0] = s->mv[!dir][i][0] = s->current_picture.motion_val[!dir][s->block_index[i+2]][0] = s->current_picture.motion_val[!dir][s->block_index[i]][0];
  4353. s->mv[!dir][i+2][1] = s->mv[!dir][i][1] = s->current_picture.motion_val[!dir][s->block_index[i+2]][1] = s->current_picture.motion_val[!dir][s->block_index[i]][1];
  4354. }
  4355. vc1_mc_1mv(v, dir);
  4356. }
  4357. if (cbp)
  4358. GET_MQUANT(); // p. 227
  4359. s->current_picture.qscale_table[mb_pos] = mquant;
  4360. if (!v->ttmbf && cbp)
  4361. ttmb = get_vlc2(gb, ff_vc1_ttmb_vlc[v->tt_index].table, VC1_TTMB_VLC_BITS, 2);
  4362. for (i = 0; i < 6; i++) {
  4363. s->dc_val[0][s->block_index[i]] = 0;
  4364. dst_idx += i >> 2;
  4365. val = ((cbp >> (5 - i)) & 1);
  4366. if (!fieldtx)
  4367. off = (i & 4) ? 0 : ((i & 1) * 8 + (i & 2) * 4 * s->linesize);
  4368. else
  4369. off = (i & 4) ? 0 : ((i & 1) * 8 + ((i > 1) * s->linesize));
  4370. if (val) {
  4371. pat = vc1_decode_p_block(v, s->block[i], i, mquant, ttmb,
  4372. first_block, s->dest[dst_idx] + off,
  4373. (i & 4) ? s->uvlinesize : (s->linesize << fieldtx),
  4374. (i & 4) && (s->flags & CODEC_FLAG_GRAY), &block_tt);
  4375. block_cbp |= pat << (i << 2);
  4376. if (!v->ttmbf && ttmb < 8)
  4377. ttmb = -1;
  4378. first_block = 0;
  4379. }
  4380. }
  4381. } else { // skipped
  4382. dir = 0;
  4383. for (i = 0; i < 6; i++) {
  4384. v->mb_type[0][s->block_index[i]] = 0;
  4385. s->dc_val[0][s->block_index[i]] = 0;
  4386. }
  4387. s->current_picture.mb_type[mb_pos] = MB_TYPE_SKIP;
  4388. s->current_picture.qscale_table[mb_pos] = 0;
  4389. v->blk_mv_type[s->block_index[0]] = 0;
  4390. v->blk_mv_type[s->block_index[1]] = 0;
  4391. v->blk_mv_type[s->block_index[2]] = 0;
  4392. v->blk_mv_type[s->block_index[3]] = 0;
  4393. if (!direct) {
  4394. if (bmvtype == BMV_TYPE_INTERPOLATED) {
  4395. vc1_pred_mv_intfr(v, 0, 0, 0, 1, v->range_x, v->range_y, v->mb_type[0], 0);
  4396. vc1_pred_mv_intfr(v, 0, 0, 0, 1, v->range_x, v->range_y, v->mb_type[0], 1);
  4397. } else {
  4398. dir = bmvtype == BMV_TYPE_BACKWARD;
  4399. vc1_pred_mv_intfr(v, 0, 0, 0, 1, v->range_x, v->range_y, v->mb_type[0], dir);
  4400. if (mvsw) {
  4401. int dir2 = dir;
  4402. if (mvsw)
  4403. dir2 = !dir;
  4404. for (i = 0; i < 2; i++) {
  4405. s->mv[dir][i+2][0] = s->mv[dir][i][0] = s->current_picture.motion_val[dir][s->block_index[i+2]][0] = s->current_picture.motion_val[dir][s->block_index[i]][0];
  4406. s->mv[dir][i+2][1] = s->mv[dir][i][1] = s->current_picture.motion_val[dir][s->block_index[i+2]][1] = s->current_picture.motion_val[dir][s->block_index[i]][1];
  4407. s->mv[dir2][i+2][0] = s->mv[dir2][i][0] = s->current_picture.motion_val[dir2][s->block_index[i]][0] = s->current_picture.motion_val[dir2][s->block_index[i+2]][0];
  4408. s->mv[dir2][i+2][1] = s->mv[dir2][i][1] = s->current_picture.motion_val[dir2][s->block_index[i]][1] = s->current_picture.motion_val[dir2][s->block_index[i+2]][1];
  4409. }
  4410. } else {
  4411. v->blk_mv_type[s->block_index[0]] = 1;
  4412. v->blk_mv_type[s->block_index[1]] = 1;
  4413. v->blk_mv_type[s->block_index[2]] = 1;
  4414. v->blk_mv_type[s->block_index[3]] = 1;
  4415. vc1_pred_mv_intfr(v, 0, 0, 0, 2, v->range_x, v->range_y, 0, !dir);
  4416. for (i = 0; i < 2; i++) {
  4417. s->mv[!dir][i+2][0] = s->mv[!dir][i][0] = s->current_picture.motion_val[!dir][s->block_index[i+2]][0] = s->current_picture.motion_val[!dir][s->block_index[i]][0];
  4418. s->mv[!dir][i+2][1] = s->mv[!dir][i][1] = s->current_picture.motion_val[!dir][s->block_index[i+2]][1] = s->current_picture.motion_val[!dir][s->block_index[i]][1];
  4419. }
  4420. }
  4421. }
  4422. }
  4423. vc1_mc_1mv(v, dir);
  4424. if (direct || bmvtype == BMV_TYPE_INTERPOLATED) {
  4425. vc1_interp_mc(v);
  4426. }
  4427. }
  4428. }
  4429. if (s->mb_x == s->mb_width - 1)
  4430. memmove(v->is_intra_base, v->is_intra, sizeof(v->is_intra_base[0]) * s->mb_stride);
  4431. v->cbp[s->mb_x] = block_cbp;
  4432. v->ttblk[s->mb_x] = block_tt;
  4433. return 0;
  4434. }
  4435. /** Decode blocks of I-frame
  4436. */
  4437. static void vc1_decode_i_blocks(VC1Context *v)
  4438. {
  4439. int k, j;
  4440. MpegEncContext *s = &v->s;
  4441. int cbp, val;
  4442. uint8_t *coded_val;
  4443. int mb_pos;
  4444. /* select codingmode used for VLC tables selection */
  4445. switch (v->y_ac_table_index) {
  4446. case 0:
  4447. v->codingset = (v->pqindex <= 8) ? CS_HIGH_RATE_INTRA : CS_LOW_MOT_INTRA;
  4448. break;
  4449. case 1:
  4450. v->codingset = CS_HIGH_MOT_INTRA;
  4451. break;
  4452. case 2:
  4453. v->codingset = CS_MID_RATE_INTRA;
  4454. break;
  4455. }
  4456. switch (v->c_ac_table_index) {
  4457. case 0:
  4458. v->codingset2 = (v->pqindex <= 8) ? CS_HIGH_RATE_INTER : CS_LOW_MOT_INTER;
  4459. break;
  4460. case 1:
  4461. v->codingset2 = CS_HIGH_MOT_INTER;
  4462. break;
  4463. case 2:
  4464. v->codingset2 = CS_MID_RATE_INTER;
  4465. break;
  4466. }
  4467. /* Set DC scale - y and c use the same */
  4468. s->y_dc_scale = s->y_dc_scale_table[v->pq];
  4469. s->c_dc_scale = s->c_dc_scale_table[v->pq];
  4470. //do frame decode
  4471. s->mb_x = s->mb_y = 0;
  4472. s->mb_intra = 1;
  4473. s->first_slice_line = 1;
  4474. for (s->mb_y = 0; s->mb_y < s->end_mb_y; s->mb_y++) {
  4475. s->mb_x = 0;
  4476. init_block_index(v);
  4477. for (; s->mb_x < v->end_mb_x; s->mb_x++) {
  4478. uint8_t *dst[6];
  4479. ff_update_block_index(s);
  4480. dst[0] = s->dest[0];
  4481. dst[1] = dst[0] + 8;
  4482. dst[2] = s->dest[0] + s->linesize * 8;
  4483. dst[3] = dst[2] + 8;
  4484. dst[4] = s->dest[1];
  4485. dst[5] = s->dest[2];
  4486. s->bdsp.clear_blocks(s->block[0]);
  4487. mb_pos = s->mb_x + s->mb_y * s->mb_width;
  4488. s->current_picture.mb_type[mb_pos] = MB_TYPE_INTRA;
  4489. s->current_picture.qscale_table[mb_pos] = v->pq;
  4490. s->current_picture.motion_val[1][s->block_index[0]][0] = 0;
  4491. s->current_picture.motion_val[1][s->block_index[0]][1] = 0;
  4492. // do actual MB decoding and displaying
  4493. cbp = get_vlc2(&v->s.gb, ff_msmp4_mb_i_vlc.table, MB_INTRA_VLC_BITS, 2);
  4494. v->s.ac_pred = get_bits1(&v->s.gb);
  4495. for (k = 0; k < 6; k++) {
  4496. val = ((cbp >> (5 - k)) & 1);
  4497. if (k < 4) {
  4498. int pred = vc1_coded_block_pred(&v->s, k, &coded_val);
  4499. val = val ^ pred;
  4500. *coded_val = val;
  4501. }
  4502. cbp |= val << (5 - k);
  4503. vc1_decode_i_block(v, s->block[k], k, val, (k < 4) ? v->codingset : v->codingset2);
  4504. if (k > 3 && (s->flags & CODEC_FLAG_GRAY))
  4505. continue;
  4506. v->vc1dsp.vc1_inv_trans_8x8(s->block[k]);
  4507. if (v->pq >= 9 && v->overlap) {
  4508. if (v->rangeredfrm)
  4509. for (j = 0; j < 64; j++)
  4510. s->block[k][j] <<= 1;
  4511. s->idsp.put_signed_pixels_clamped(s->block[k], dst[k],
  4512. k & 4 ? s->uvlinesize
  4513. : s->linesize);
  4514. } else {
  4515. if (v->rangeredfrm)
  4516. for (j = 0; j < 64; j++)
  4517. s->block[k][j] = (s->block[k][j] - 64) << 1;
  4518. s->idsp.put_pixels_clamped(s->block[k], dst[k],
  4519. k & 4 ? s->uvlinesize
  4520. : s->linesize);
  4521. }
  4522. }
  4523. if (v->pq >= 9 && v->overlap) {
  4524. if (s->mb_x) {
  4525. v->vc1dsp.vc1_h_overlap(s->dest[0], s->linesize);
  4526. v->vc1dsp.vc1_h_overlap(s->dest[0] + 8 * s->linesize, s->linesize);
  4527. if (!(s->flags & CODEC_FLAG_GRAY)) {
  4528. v->vc1dsp.vc1_h_overlap(s->dest[1], s->uvlinesize);
  4529. v->vc1dsp.vc1_h_overlap(s->dest[2], s->uvlinesize);
  4530. }
  4531. }
  4532. v->vc1dsp.vc1_h_overlap(s->dest[0] + 8, s->linesize);
  4533. v->vc1dsp.vc1_h_overlap(s->dest[0] + 8 * s->linesize + 8, s->linesize);
  4534. if (!s->first_slice_line) {
  4535. v->vc1dsp.vc1_v_overlap(s->dest[0], s->linesize);
  4536. v->vc1dsp.vc1_v_overlap(s->dest[0] + 8, s->linesize);
  4537. if (!(s->flags & CODEC_FLAG_GRAY)) {
  4538. v->vc1dsp.vc1_v_overlap(s->dest[1], s->uvlinesize);
  4539. v->vc1dsp.vc1_v_overlap(s->dest[2], s->uvlinesize);
  4540. }
  4541. }
  4542. v->vc1dsp.vc1_v_overlap(s->dest[0] + 8 * s->linesize, s->linesize);
  4543. v->vc1dsp.vc1_v_overlap(s->dest[0] + 8 * s->linesize + 8, s->linesize);
  4544. }
  4545. if (v->s.loop_filter) vc1_loop_filter_iblk(v, v->pq);
  4546. if (get_bits_count(&s->gb) > v->bits) {
  4547. ff_er_add_slice(&s->er, 0, 0, s->mb_x, s->mb_y, ER_MB_ERROR);
  4548. av_log(s->avctx, AV_LOG_ERROR, "Bits overconsumption: %i > %i\n",
  4549. get_bits_count(&s->gb), v->bits);
  4550. return;
  4551. }
  4552. }
  4553. if (!v->s.loop_filter)
  4554. ff_mpeg_draw_horiz_band(s, s->mb_y * 16, 16);
  4555. else if (s->mb_y)
  4556. ff_mpeg_draw_horiz_band(s, (s->mb_y - 1) * 16, 16);
  4557. s->first_slice_line = 0;
  4558. }
  4559. if (v->s.loop_filter)
  4560. ff_mpeg_draw_horiz_band(s, (s->end_mb_y - 1) * 16, 16);
  4561. /* This is intentionally mb_height and not end_mb_y - unlike in advanced
  4562. * profile, these only differ are when decoding MSS2 rectangles. */
  4563. ff_er_add_slice(&s->er, 0, 0, s->mb_width - 1, s->mb_height - 1, ER_MB_END);
  4564. }
  4565. /** Decode blocks of I-frame for advanced profile
  4566. */
  4567. static void vc1_decode_i_blocks_adv(VC1Context *v)
  4568. {
  4569. int k;
  4570. MpegEncContext *s = &v->s;
  4571. int cbp, val;
  4572. uint8_t *coded_val;
  4573. int mb_pos;
  4574. int mquant = v->pq;
  4575. int mqdiff;
  4576. GetBitContext *gb = &s->gb;
  4577. /* select codingmode used for VLC tables selection */
  4578. switch (v->y_ac_table_index) {
  4579. case 0:
  4580. v->codingset = (v->pqindex <= 8) ? CS_HIGH_RATE_INTRA : CS_LOW_MOT_INTRA;
  4581. break;
  4582. case 1:
  4583. v->codingset = CS_HIGH_MOT_INTRA;
  4584. break;
  4585. case 2:
  4586. v->codingset = CS_MID_RATE_INTRA;
  4587. break;
  4588. }
  4589. switch (v->c_ac_table_index) {
  4590. case 0:
  4591. v->codingset2 = (v->pqindex <= 8) ? CS_HIGH_RATE_INTER : CS_LOW_MOT_INTER;
  4592. break;
  4593. case 1:
  4594. v->codingset2 = CS_HIGH_MOT_INTER;
  4595. break;
  4596. case 2:
  4597. v->codingset2 = CS_MID_RATE_INTER;
  4598. break;
  4599. }
  4600. // do frame decode
  4601. s->mb_x = s->mb_y = 0;
  4602. s->mb_intra = 1;
  4603. s->first_slice_line = 1;
  4604. s->mb_y = s->start_mb_y;
  4605. if (s->start_mb_y) {
  4606. s->mb_x = 0;
  4607. init_block_index(v);
  4608. memset(&s->coded_block[s->block_index[0] - s->b8_stride], 0,
  4609. (1 + s->b8_stride) * sizeof(*s->coded_block));
  4610. }
  4611. for (; s->mb_y < s->end_mb_y; s->mb_y++) {
  4612. s->mb_x = 0;
  4613. init_block_index(v);
  4614. for (;s->mb_x < s->mb_width; s->mb_x++) {
  4615. int16_t (*block)[64] = v->block[v->cur_blk_idx];
  4616. ff_update_block_index(s);
  4617. s->bdsp.clear_blocks(block[0]);
  4618. mb_pos = s->mb_x + s->mb_y * s->mb_stride;
  4619. s->current_picture.mb_type[mb_pos + v->mb_off] = MB_TYPE_INTRA;
  4620. s->current_picture.motion_val[1][s->block_index[0] + v->blocks_off][0] = 0;
  4621. s->current_picture.motion_val[1][s->block_index[0] + v->blocks_off][1] = 0;
  4622. // do actual MB decoding and displaying
  4623. if (v->fieldtx_is_raw)
  4624. v->fieldtx_plane[mb_pos] = get_bits1(&v->s.gb);
  4625. cbp = get_vlc2(&v->s.gb, ff_msmp4_mb_i_vlc.table, MB_INTRA_VLC_BITS, 2);
  4626. if ( v->acpred_is_raw)
  4627. v->s.ac_pred = get_bits1(&v->s.gb);
  4628. else
  4629. v->s.ac_pred = v->acpred_plane[mb_pos];
  4630. if (v->condover == CONDOVER_SELECT && v->overflg_is_raw)
  4631. v->over_flags_plane[mb_pos] = get_bits1(&v->s.gb);
  4632. GET_MQUANT();
  4633. s->current_picture.qscale_table[mb_pos] = mquant;
  4634. /* Set DC scale - y and c use the same */
  4635. s->y_dc_scale = s->y_dc_scale_table[mquant];
  4636. s->c_dc_scale = s->c_dc_scale_table[mquant];
  4637. for (k = 0; k < 6; k++) {
  4638. val = ((cbp >> (5 - k)) & 1);
  4639. if (k < 4) {
  4640. int pred = vc1_coded_block_pred(&v->s, k, &coded_val);
  4641. val = val ^ pred;
  4642. *coded_val = val;
  4643. }
  4644. cbp |= val << (5 - k);
  4645. v->a_avail = !s->first_slice_line || (k == 2 || k == 3);
  4646. v->c_avail = !!s->mb_x || (k == 1 || k == 3);
  4647. vc1_decode_i_block_adv(v, block[k], k, val,
  4648. (k < 4) ? v->codingset : v->codingset2, mquant);
  4649. if (k > 3 && (s->flags & CODEC_FLAG_GRAY))
  4650. continue;
  4651. v->vc1dsp.vc1_inv_trans_8x8(block[k]);
  4652. }
  4653. vc1_smooth_overlap_filter_iblk(v);
  4654. vc1_put_signed_blocks_clamped(v);
  4655. if (v->s.loop_filter) vc1_loop_filter_iblk_delayed(v, v->pq);
  4656. if (get_bits_count(&s->gb) > v->bits) {
  4657. // TODO: may need modification to handle slice coding
  4658. ff_er_add_slice(&s->er, 0, s->start_mb_y, s->mb_x, s->mb_y, ER_MB_ERROR);
  4659. av_log(s->avctx, AV_LOG_ERROR, "Bits overconsumption: %i > %i\n",
  4660. get_bits_count(&s->gb), v->bits);
  4661. return;
  4662. }
  4663. }
  4664. if (!v->s.loop_filter)
  4665. ff_mpeg_draw_horiz_band(s, s->mb_y * 16, 16);
  4666. else if (s->mb_y)
  4667. ff_mpeg_draw_horiz_band(s, (s->mb_y-1) * 16, 16);
  4668. s->first_slice_line = 0;
  4669. }
  4670. /* raw bottom MB row */
  4671. s->mb_x = 0;
  4672. init_block_index(v);
  4673. for (;s->mb_x < s->mb_width; s->mb_x++) {
  4674. ff_update_block_index(s);
  4675. vc1_put_signed_blocks_clamped(v);
  4676. if (v->s.loop_filter)
  4677. vc1_loop_filter_iblk_delayed(v, v->pq);
  4678. }
  4679. if (v->s.loop_filter)
  4680. ff_mpeg_draw_horiz_band(s, (s->end_mb_y-1)*16, 16);
  4681. ff_er_add_slice(&s->er, 0, s->start_mb_y << v->field_mode, s->mb_width - 1,
  4682. (s->end_mb_y << v->field_mode) - 1, ER_MB_END);
  4683. }
  4684. static void vc1_decode_p_blocks(VC1Context *v)
  4685. {
  4686. MpegEncContext *s = &v->s;
  4687. int apply_loop_filter;
  4688. /* select codingmode used for VLC tables selection */
  4689. switch (v->c_ac_table_index) {
  4690. case 0:
  4691. v->codingset = (v->pqindex <= 8) ? CS_HIGH_RATE_INTRA : CS_LOW_MOT_INTRA;
  4692. break;
  4693. case 1:
  4694. v->codingset = CS_HIGH_MOT_INTRA;
  4695. break;
  4696. case 2:
  4697. v->codingset = CS_MID_RATE_INTRA;
  4698. break;
  4699. }
  4700. switch (v->c_ac_table_index) {
  4701. case 0:
  4702. v->codingset2 = (v->pqindex <= 8) ? CS_HIGH_RATE_INTER : CS_LOW_MOT_INTER;
  4703. break;
  4704. case 1:
  4705. v->codingset2 = CS_HIGH_MOT_INTER;
  4706. break;
  4707. case 2:
  4708. v->codingset2 = CS_MID_RATE_INTER;
  4709. break;
  4710. }
  4711. apply_loop_filter = s->loop_filter && !(s->avctx->skip_loop_filter >= AVDISCARD_NONKEY) &&
  4712. v->fcm == PROGRESSIVE;
  4713. s->first_slice_line = 1;
  4714. memset(v->cbp_base, 0, sizeof(v->cbp_base[0])*2*s->mb_stride);
  4715. for (s->mb_y = s->start_mb_y; s->mb_y < s->end_mb_y; s->mb_y++) {
  4716. s->mb_x = 0;
  4717. init_block_index(v);
  4718. for (; s->mb_x < s->mb_width; s->mb_x++) {
  4719. ff_update_block_index(s);
  4720. if (v->fcm == ILACE_FIELD)
  4721. vc1_decode_p_mb_intfi(v);
  4722. else if (v->fcm == ILACE_FRAME)
  4723. vc1_decode_p_mb_intfr(v);
  4724. else vc1_decode_p_mb(v);
  4725. if (s->mb_y != s->start_mb_y && apply_loop_filter)
  4726. vc1_apply_p_loop_filter(v);
  4727. if (get_bits_count(&s->gb) > v->bits || get_bits_count(&s->gb) < 0) {
  4728. // TODO: may need modification to handle slice coding
  4729. ff_er_add_slice(&s->er, 0, s->start_mb_y, s->mb_x, s->mb_y, ER_MB_ERROR);
  4730. av_log(s->avctx, AV_LOG_ERROR, "Bits overconsumption: %i > %i at %ix%i\n",
  4731. get_bits_count(&s->gb), v->bits, s->mb_x, s->mb_y);
  4732. return;
  4733. }
  4734. }
  4735. memmove(v->cbp_base, v->cbp, sizeof(v->cbp_base[0]) * s->mb_stride);
  4736. memmove(v->ttblk_base, v->ttblk, sizeof(v->ttblk_base[0]) * s->mb_stride);
  4737. memmove(v->is_intra_base, v->is_intra, sizeof(v->is_intra_base[0]) * s->mb_stride);
  4738. memmove(v->luma_mv_base, v->luma_mv, sizeof(v->luma_mv_base[0]) * s->mb_stride);
  4739. if (s->mb_y != s->start_mb_y) ff_mpeg_draw_horiz_band(s, (s->mb_y - 1) * 16, 16);
  4740. s->first_slice_line = 0;
  4741. }
  4742. if (apply_loop_filter) {
  4743. s->mb_x = 0;
  4744. init_block_index(v);
  4745. for (; s->mb_x < s->mb_width; s->mb_x++) {
  4746. ff_update_block_index(s);
  4747. vc1_apply_p_loop_filter(v);
  4748. }
  4749. }
  4750. if (s->end_mb_y >= s->start_mb_y)
  4751. ff_mpeg_draw_horiz_band(s, (s->end_mb_y - 1) * 16, 16);
  4752. ff_er_add_slice(&s->er, 0, s->start_mb_y << v->field_mode, s->mb_width - 1,
  4753. (s->end_mb_y << v->field_mode) - 1, ER_MB_END);
  4754. }
  4755. static void vc1_decode_b_blocks(VC1Context *v)
  4756. {
  4757. MpegEncContext *s = &v->s;
  4758. /* select codingmode used for VLC tables selection */
  4759. switch (v->c_ac_table_index) {
  4760. case 0:
  4761. v->codingset = (v->pqindex <= 8) ? CS_HIGH_RATE_INTRA : CS_LOW_MOT_INTRA;
  4762. break;
  4763. case 1:
  4764. v->codingset = CS_HIGH_MOT_INTRA;
  4765. break;
  4766. case 2:
  4767. v->codingset = CS_MID_RATE_INTRA;
  4768. break;
  4769. }
  4770. switch (v->c_ac_table_index) {
  4771. case 0:
  4772. v->codingset2 = (v->pqindex <= 8) ? CS_HIGH_RATE_INTER : CS_LOW_MOT_INTER;
  4773. break;
  4774. case 1:
  4775. v->codingset2 = CS_HIGH_MOT_INTER;
  4776. break;
  4777. case 2:
  4778. v->codingset2 = CS_MID_RATE_INTER;
  4779. break;
  4780. }
  4781. s->first_slice_line = 1;
  4782. for (s->mb_y = s->start_mb_y; s->mb_y < s->end_mb_y; s->mb_y++) {
  4783. s->mb_x = 0;
  4784. init_block_index(v);
  4785. for (; s->mb_x < s->mb_width; s->mb_x++) {
  4786. ff_update_block_index(s);
  4787. if (v->fcm == ILACE_FIELD)
  4788. vc1_decode_b_mb_intfi(v);
  4789. else if (v->fcm == ILACE_FRAME)
  4790. vc1_decode_b_mb_intfr(v);
  4791. else
  4792. vc1_decode_b_mb(v);
  4793. if (get_bits_count(&s->gb) > v->bits || get_bits_count(&s->gb) < 0) {
  4794. // TODO: may need modification to handle slice coding
  4795. ff_er_add_slice(&s->er, 0, s->start_mb_y, s->mb_x, s->mb_y, ER_MB_ERROR);
  4796. av_log(s->avctx, AV_LOG_ERROR, "Bits overconsumption: %i > %i at %ix%i\n",
  4797. get_bits_count(&s->gb), v->bits, s->mb_x, s->mb_y);
  4798. return;
  4799. }
  4800. if (v->s.loop_filter) vc1_loop_filter_iblk(v, v->pq);
  4801. }
  4802. if (!v->s.loop_filter)
  4803. ff_mpeg_draw_horiz_band(s, s->mb_y * 16, 16);
  4804. else if (s->mb_y)
  4805. ff_mpeg_draw_horiz_band(s, (s->mb_y - 1) * 16, 16);
  4806. s->first_slice_line = 0;
  4807. }
  4808. if (v->s.loop_filter)
  4809. ff_mpeg_draw_horiz_band(s, (s->end_mb_y - 1) * 16, 16);
  4810. ff_er_add_slice(&s->er, 0, s->start_mb_y << v->field_mode, s->mb_width - 1,
  4811. (s->end_mb_y << v->field_mode) - 1, ER_MB_END);
  4812. }
  4813. static void vc1_decode_skip_blocks(VC1Context *v)
  4814. {
  4815. MpegEncContext *s = &v->s;
  4816. if (!v->s.last_picture.f->data[0])
  4817. return;
  4818. ff_er_add_slice(&s->er, 0, s->start_mb_y, s->mb_width - 1, s->end_mb_y - 1, ER_MB_END);
  4819. s->first_slice_line = 1;
  4820. for (s->mb_y = s->start_mb_y; s->mb_y < s->end_mb_y; s->mb_y++) {
  4821. s->mb_x = 0;
  4822. init_block_index(v);
  4823. ff_update_block_index(s);
  4824. memcpy(s->dest[0], s->last_picture.f->data[0] + s->mb_y * 16 * s->linesize, s->linesize * 16);
  4825. memcpy(s->dest[1], s->last_picture.f->data[1] + s->mb_y * 8 * s->uvlinesize, s->uvlinesize * 8);
  4826. memcpy(s->dest[2], s->last_picture.f->data[2] + s->mb_y * 8 * s->uvlinesize, s->uvlinesize * 8);
  4827. ff_mpeg_draw_horiz_band(s, s->mb_y * 16, 16);
  4828. s->first_slice_line = 0;
  4829. }
  4830. s->pict_type = AV_PICTURE_TYPE_P;
  4831. }
  4832. void ff_vc1_decode_blocks(VC1Context *v)
  4833. {
  4834. v->s.esc3_level_length = 0;
  4835. if (v->x8_type) {
  4836. ff_intrax8_decode_picture(&v->x8, 2*v->pq + v->halfpq, v->pq * !v->pquantizer);
  4837. } else {
  4838. v->cur_blk_idx = 0;
  4839. v->left_blk_idx = -1;
  4840. v->topleft_blk_idx = 1;
  4841. v->top_blk_idx = 2;
  4842. switch (v->s.pict_type) {
  4843. case AV_PICTURE_TYPE_I:
  4844. if (v->profile == PROFILE_ADVANCED)
  4845. vc1_decode_i_blocks_adv(v);
  4846. else
  4847. vc1_decode_i_blocks(v);
  4848. break;
  4849. case AV_PICTURE_TYPE_P:
  4850. if (v->p_frame_skipped)
  4851. vc1_decode_skip_blocks(v);
  4852. else
  4853. vc1_decode_p_blocks(v);
  4854. break;
  4855. case AV_PICTURE_TYPE_B:
  4856. if (v->bi_type) {
  4857. if (v->profile == PROFILE_ADVANCED)
  4858. vc1_decode_i_blocks_adv(v);
  4859. else
  4860. vc1_decode_i_blocks(v);
  4861. } else
  4862. vc1_decode_b_blocks(v);
  4863. break;
  4864. }
  4865. }
  4866. }
  4867. #if CONFIG_WMV3IMAGE_DECODER || CONFIG_VC1IMAGE_DECODER
  4868. typedef struct {
  4869. /**
  4870. * Transform coefficients for both sprites in 16.16 fixed point format,
  4871. * in the order they appear in the bitstream:
  4872. * x scale
  4873. * rotation 1 (unused)
  4874. * x offset
  4875. * rotation 2 (unused)
  4876. * y scale
  4877. * y offset
  4878. * alpha
  4879. */
  4880. int coefs[2][7];
  4881. int effect_type, effect_flag;
  4882. int effect_pcount1, effect_pcount2; ///< amount of effect parameters stored in effect_params
  4883. int effect_params1[15], effect_params2[10]; ///< effect parameters in 16.16 fixed point format
  4884. } SpriteData;
  4885. static inline int get_fp_val(GetBitContext* gb)
  4886. {
  4887. return (get_bits_long(gb, 30) - (1 << 29)) << 1;
  4888. }
  4889. static void vc1_sprite_parse_transform(GetBitContext* gb, int c[7])
  4890. {
  4891. c[1] = c[3] = 0;
  4892. switch (get_bits(gb, 2)) {
  4893. case 0:
  4894. c[0] = 1 << 16;
  4895. c[2] = get_fp_val(gb);
  4896. c[4] = 1 << 16;
  4897. break;
  4898. case 1:
  4899. c[0] = c[4] = get_fp_val(gb);
  4900. c[2] = get_fp_val(gb);
  4901. break;
  4902. case 2:
  4903. c[0] = get_fp_val(gb);
  4904. c[2] = get_fp_val(gb);
  4905. c[4] = get_fp_val(gb);
  4906. break;
  4907. case 3:
  4908. c[0] = get_fp_val(gb);
  4909. c[1] = get_fp_val(gb);
  4910. c[2] = get_fp_val(gb);
  4911. c[3] = get_fp_val(gb);
  4912. c[4] = get_fp_val(gb);
  4913. break;
  4914. }
  4915. c[5] = get_fp_val(gb);
  4916. if (get_bits1(gb))
  4917. c[6] = get_fp_val(gb);
  4918. else
  4919. c[6] = 1 << 16;
  4920. }
  4921. static void vc1_parse_sprites(VC1Context *v, GetBitContext* gb, SpriteData* sd)
  4922. {
  4923. AVCodecContext *avctx = v->s.avctx;
  4924. int sprite, i;
  4925. for (sprite = 0; sprite <= v->two_sprites; sprite++) {
  4926. vc1_sprite_parse_transform(gb, sd->coefs[sprite]);
  4927. if (sd->coefs[sprite][1] || sd->coefs[sprite][3])
  4928. avpriv_request_sample(avctx, "Non-zero rotation coefficients");
  4929. av_log(avctx, AV_LOG_DEBUG, sprite ? "S2:" : "S1:");
  4930. for (i = 0; i < 7; i++)
  4931. av_log(avctx, AV_LOG_DEBUG, " %d.%.3d",
  4932. sd->coefs[sprite][i] / (1<<16),
  4933. (abs(sd->coefs[sprite][i]) & 0xFFFF) * 1000 / (1 << 16));
  4934. av_log(avctx, AV_LOG_DEBUG, "\n");
  4935. }
  4936. skip_bits(gb, 2);
  4937. if (sd->effect_type = get_bits_long(gb, 30)) {
  4938. switch (sd->effect_pcount1 = get_bits(gb, 4)) {
  4939. case 7:
  4940. vc1_sprite_parse_transform(gb, sd->effect_params1);
  4941. break;
  4942. case 14:
  4943. vc1_sprite_parse_transform(gb, sd->effect_params1);
  4944. vc1_sprite_parse_transform(gb, sd->effect_params1 + 7);
  4945. break;
  4946. default:
  4947. for (i = 0; i < sd->effect_pcount1; i++)
  4948. sd->effect_params1[i] = get_fp_val(gb);
  4949. }
  4950. if (sd->effect_type != 13 || sd->effect_params1[0] != sd->coefs[0][6]) {
  4951. // effect 13 is simple alpha blending and matches the opacity above
  4952. av_log(avctx, AV_LOG_DEBUG, "Effect: %d; params: ", sd->effect_type);
  4953. for (i = 0; i < sd->effect_pcount1; i++)
  4954. av_log(avctx, AV_LOG_DEBUG, " %d.%.2d",
  4955. sd->effect_params1[i] / (1 << 16),
  4956. (abs(sd->effect_params1[i]) & 0xFFFF) * 1000 / (1 << 16));
  4957. av_log(avctx, AV_LOG_DEBUG, "\n");
  4958. }
  4959. sd->effect_pcount2 = get_bits(gb, 16);
  4960. if (sd->effect_pcount2 > 10) {
  4961. av_log(avctx, AV_LOG_ERROR, "Too many effect parameters\n");
  4962. return;
  4963. } else if (sd->effect_pcount2) {
  4964. i = -1;
  4965. av_log(avctx, AV_LOG_DEBUG, "Effect params 2: ");
  4966. while (++i < sd->effect_pcount2) {
  4967. sd->effect_params2[i] = get_fp_val(gb);
  4968. av_log(avctx, AV_LOG_DEBUG, " %d.%.2d",
  4969. sd->effect_params2[i] / (1 << 16),
  4970. (abs(sd->effect_params2[i]) & 0xFFFF) * 1000 / (1 << 16));
  4971. }
  4972. av_log(avctx, AV_LOG_DEBUG, "\n");
  4973. }
  4974. }
  4975. if (sd->effect_flag = get_bits1(gb))
  4976. av_log(avctx, AV_LOG_DEBUG, "Effect flag set\n");
  4977. if (get_bits_count(gb) >= gb->size_in_bits +
  4978. (avctx->codec_id == AV_CODEC_ID_WMV3IMAGE ? 64 : 0))
  4979. av_log(avctx, AV_LOG_ERROR, "Buffer overrun\n");
  4980. if (get_bits_count(gb) < gb->size_in_bits - 8)
  4981. av_log(avctx, AV_LOG_WARNING, "Buffer not fully read\n");
  4982. }
  4983. static void vc1_draw_sprites(VC1Context *v, SpriteData* sd)
  4984. {
  4985. int i, plane, row, sprite;
  4986. int sr_cache[2][2] = { { -1, -1 }, { -1, -1 } };
  4987. uint8_t* src_h[2][2];
  4988. int xoff[2], xadv[2], yoff[2], yadv[2], alpha;
  4989. int ysub[2];
  4990. MpegEncContext *s = &v->s;
  4991. for (i = 0; i < 2; i++) {
  4992. xoff[i] = av_clip(sd->coefs[i][2], 0, v->sprite_width-1 << 16);
  4993. xadv[i] = sd->coefs[i][0];
  4994. if (xadv[i] != 1<<16 || (v->sprite_width << 16) - (v->output_width << 16) - xoff[i])
  4995. xadv[i] = av_clip(xadv[i], 0, ((v->sprite_width<<16) - xoff[i] - 1) / v->output_width);
  4996. yoff[i] = av_clip(sd->coefs[i][5], 0, v->sprite_height-1 << 16);
  4997. yadv[i] = av_clip(sd->coefs[i][4], 0, ((v->sprite_height << 16) - yoff[i]) / v->output_height);
  4998. }
  4999. alpha = av_clip(sd->coefs[1][6], 0, (1<<16) - 1);
  5000. for (plane = 0; plane < (s->flags&CODEC_FLAG_GRAY ? 1 : 3); plane++) {
  5001. int width = v->output_width>>!!plane;
  5002. for (row = 0; row < v->output_height>>!!plane; row++) {
  5003. uint8_t *dst = v->sprite_output_frame->data[plane] +
  5004. v->sprite_output_frame->linesize[plane] * row;
  5005. for (sprite = 0; sprite <= v->two_sprites; sprite++) {
  5006. uint8_t *iplane = s->current_picture.f->data[plane];
  5007. int iline = s->current_picture.f->linesize[plane];
  5008. int ycoord = yoff[sprite] + yadv[sprite] * row;
  5009. int yline = ycoord >> 16;
  5010. int next_line;
  5011. ysub[sprite] = ycoord & 0xFFFF;
  5012. if (sprite) {
  5013. iplane = s->last_picture.f->data[plane];
  5014. iline = s->last_picture.f->linesize[plane];
  5015. }
  5016. next_line = FFMIN(yline + 1, (v->sprite_height >> !!plane) - 1) * iline;
  5017. if (!(xoff[sprite] & 0xFFFF) && xadv[sprite] == 1 << 16) {
  5018. src_h[sprite][0] = iplane + (xoff[sprite] >> 16) + yline * iline;
  5019. if (ysub[sprite])
  5020. src_h[sprite][1] = iplane + (xoff[sprite] >> 16) + next_line;
  5021. } else {
  5022. if (sr_cache[sprite][0] != yline) {
  5023. if (sr_cache[sprite][1] == yline) {
  5024. FFSWAP(uint8_t*, v->sr_rows[sprite][0], v->sr_rows[sprite][1]);
  5025. FFSWAP(int, sr_cache[sprite][0], sr_cache[sprite][1]);
  5026. } else {
  5027. v->vc1dsp.sprite_h(v->sr_rows[sprite][0], iplane + yline * iline, xoff[sprite], xadv[sprite], width);
  5028. sr_cache[sprite][0] = yline;
  5029. }
  5030. }
  5031. if (ysub[sprite] && sr_cache[sprite][1] != yline + 1) {
  5032. v->vc1dsp.sprite_h(v->sr_rows[sprite][1],
  5033. iplane + next_line, xoff[sprite],
  5034. xadv[sprite], width);
  5035. sr_cache[sprite][1] = yline + 1;
  5036. }
  5037. src_h[sprite][0] = v->sr_rows[sprite][0];
  5038. src_h[sprite][1] = v->sr_rows[sprite][1];
  5039. }
  5040. }
  5041. if (!v->two_sprites) {
  5042. if (ysub[0]) {
  5043. v->vc1dsp.sprite_v_single(dst, src_h[0][0], src_h[0][1], ysub[0], width);
  5044. } else {
  5045. memcpy(dst, src_h[0][0], width);
  5046. }
  5047. } else {
  5048. if (ysub[0] && ysub[1]) {
  5049. v->vc1dsp.sprite_v_double_twoscale(dst, src_h[0][0], src_h[0][1], ysub[0],
  5050. src_h[1][0], src_h[1][1], ysub[1], alpha, width);
  5051. } else if (ysub[0]) {
  5052. v->vc1dsp.sprite_v_double_onescale(dst, src_h[0][0], src_h[0][1], ysub[0],
  5053. src_h[1][0], alpha, width);
  5054. } else if (ysub[1]) {
  5055. v->vc1dsp.sprite_v_double_onescale(dst, src_h[1][0], src_h[1][1], ysub[1],
  5056. src_h[0][0], (1<<16)-1-alpha, width);
  5057. } else {
  5058. v->vc1dsp.sprite_v_double_noscale(dst, src_h[0][0], src_h[1][0], alpha, width);
  5059. }
  5060. }
  5061. }
  5062. if (!plane) {
  5063. for (i = 0; i < 2; i++) {
  5064. xoff[i] >>= 1;
  5065. yoff[i] >>= 1;
  5066. }
  5067. }
  5068. }
  5069. }
  5070. static int vc1_decode_sprites(VC1Context *v, GetBitContext* gb)
  5071. {
  5072. MpegEncContext *s = &v->s;
  5073. AVCodecContext *avctx = s->avctx;
  5074. SpriteData sd;
  5075. vc1_parse_sprites(v, gb, &sd);
  5076. if (!s->current_picture.f->data[0]) {
  5077. av_log(avctx, AV_LOG_ERROR, "Got no sprites\n");
  5078. return -1;
  5079. }
  5080. if (v->two_sprites && (!s->last_picture_ptr || !s->last_picture.f->data[0])) {
  5081. av_log(avctx, AV_LOG_WARNING, "Need two sprites, only got one\n");
  5082. v->two_sprites = 0;
  5083. }
  5084. av_frame_unref(v->sprite_output_frame);
  5085. if (ff_get_buffer(avctx, v->sprite_output_frame, 0) < 0) {
  5086. av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n");
  5087. return -1;
  5088. }
  5089. vc1_draw_sprites(v, &sd);
  5090. return 0;
  5091. }
  5092. static void vc1_sprite_flush(AVCodecContext *avctx)
  5093. {
  5094. VC1Context *v = avctx->priv_data;
  5095. MpegEncContext *s = &v->s;
  5096. AVFrame *f = s->current_picture.f;
  5097. int plane, i;
  5098. /* Windows Media Image codecs have a convergence interval of two keyframes.
  5099. Since we can't enforce it, clear to black the missing sprite. This is
  5100. wrong but it looks better than doing nothing. */
  5101. if (f->data[0])
  5102. for (plane = 0; plane < (s->flags&CODEC_FLAG_GRAY ? 1 : 3); plane++)
  5103. for (i = 0; i < v->sprite_height>>!!plane; i++)
  5104. memset(f->data[plane] + i * f->linesize[plane],
  5105. plane ? 128 : 0, f->linesize[plane]);
  5106. }
  5107. #endif
  5108. av_cold int ff_vc1_decode_init_alloc_tables(VC1Context *v)
  5109. {
  5110. MpegEncContext *s = &v->s;
  5111. int i;
  5112. int mb_height = FFALIGN(s->mb_height, 2);
  5113. /* Allocate mb bitplanes */
  5114. v->mv_type_mb_plane = av_malloc (s->mb_stride * mb_height);
  5115. v->direct_mb_plane = av_malloc (s->mb_stride * mb_height);
  5116. v->forward_mb_plane = av_malloc (s->mb_stride * mb_height);
  5117. v->fieldtx_plane = av_mallocz(s->mb_stride * mb_height);
  5118. v->acpred_plane = av_malloc (s->mb_stride * mb_height);
  5119. v->over_flags_plane = av_malloc (s->mb_stride * mb_height);
  5120. v->n_allocated_blks = s->mb_width + 2;
  5121. v->block = av_malloc(sizeof(*v->block) * v->n_allocated_blks);
  5122. v->cbp_base = av_malloc(sizeof(v->cbp_base[0]) * 2 * s->mb_stride);
  5123. v->cbp = v->cbp_base + s->mb_stride;
  5124. v->ttblk_base = av_malloc(sizeof(v->ttblk_base[0]) * 2 * s->mb_stride);
  5125. v->ttblk = v->ttblk_base + s->mb_stride;
  5126. v->is_intra_base = av_mallocz(sizeof(v->is_intra_base[0]) * 2 * s->mb_stride);
  5127. v->is_intra = v->is_intra_base + s->mb_stride;
  5128. v->luma_mv_base = av_malloc(sizeof(v->luma_mv_base[0]) * 2 * s->mb_stride);
  5129. v->luma_mv = v->luma_mv_base + s->mb_stride;
  5130. /* allocate block type info in that way so it could be used with s->block_index[] */
  5131. v->mb_type_base = av_malloc(s->b8_stride * (mb_height * 2 + 1) + s->mb_stride * (mb_height + 1) * 2);
  5132. v->mb_type[0] = v->mb_type_base + s->b8_stride + 1;
  5133. v->mb_type[1] = v->mb_type_base + s->b8_stride * (mb_height * 2 + 1) + s->mb_stride + 1;
  5134. v->mb_type[2] = v->mb_type[1] + s->mb_stride * (mb_height + 1);
  5135. /* allocate memory to store block level MV info */
  5136. v->blk_mv_type_base = av_mallocz( s->b8_stride * (mb_height * 2 + 1) + s->mb_stride * (mb_height + 1) * 2);
  5137. v->blk_mv_type = v->blk_mv_type_base + s->b8_stride + 1;
  5138. v->mv_f_base = av_mallocz(2 * (s->b8_stride * (mb_height * 2 + 1) + s->mb_stride * (mb_height + 1) * 2));
  5139. v->mv_f[0] = v->mv_f_base + s->b8_stride + 1;
  5140. v->mv_f[1] = v->mv_f[0] + (s->b8_stride * (mb_height * 2 + 1) + s->mb_stride * (mb_height + 1) * 2);
  5141. v->mv_f_next_base = av_mallocz(2 * (s->b8_stride * (mb_height * 2 + 1) + s->mb_stride * (mb_height + 1) * 2));
  5142. v->mv_f_next[0] = v->mv_f_next_base + s->b8_stride + 1;
  5143. v->mv_f_next[1] = v->mv_f_next[0] + (s->b8_stride * (mb_height * 2 + 1) + s->mb_stride * (mb_height + 1) * 2);
  5144. /* Init coded blocks info */
  5145. if (v->profile == PROFILE_ADVANCED) {
  5146. // if (alloc_bitplane(&v->over_flags_plane, s->mb_width, s->mb_height) < 0)
  5147. // return -1;
  5148. // if (alloc_bitplane(&v->ac_pred_plane, s->mb_width, s->mb_height) < 0)
  5149. // return -1;
  5150. }
  5151. ff_intrax8_common_init(&v->x8,s);
  5152. if (s->avctx->codec_id == AV_CODEC_ID_WMV3IMAGE || s->avctx->codec_id == AV_CODEC_ID_VC1IMAGE) {
  5153. for (i = 0; i < 4; i++)
  5154. if (!(v->sr_rows[i >> 1][i & 1] = av_malloc(v->output_width))) return -1;
  5155. }
  5156. if (!v->mv_type_mb_plane || !v->direct_mb_plane || !v->acpred_plane || !v->over_flags_plane ||
  5157. !v->block || !v->cbp_base || !v->ttblk_base || !v->is_intra_base || !v->luma_mv_base ||
  5158. !v->mb_type_base) {
  5159. av_freep(&v->mv_type_mb_plane);
  5160. av_freep(&v->direct_mb_plane);
  5161. av_freep(&v->acpred_plane);
  5162. av_freep(&v->over_flags_plane);
  5163. av_freep(&v->block);
  5164. av_freep(&v->cbp_base);
  5165. av_freep(&v->ttblk_base);
  5166. av_freep(&v->is_intra_base);
  5167. av_freep(&v->luma_mv_base);
  5168. av_freep(&v->mb_type_base);
  5169. return AVERROR(ENOMEM);
  5170. }
  5171. return 0;
  5172. }
  5173. av_cold void ff_vc1_init_transposed_scantables(VC1Context *v)
  5174. {
  5175. int i;
  5176. for (i = 0; i < 64; i++) {
  5177. #define transpose(x) ((x >> 3) | ((x & 7) << 3))
  5178. v->zz_8x8[0][i] = transpose(ff_wmv1_scantable[0][i]);
  5179. v->zz_8x8[1][i] = transpose(ff_wmv1_scantable[1][i]);
  5180. v->zz_8x8[2][i] = transpose(ff_wmv1_scantable[2][i]);
  5181. v->zz_8x8[3][i] = transpose(ff_wmv1_scantable[3][i]);
  5182. v->zzi_8x8[i] = transpose(ff_vc1_adv_interlaced_8x8_zz[i]);
  5183. }
  5184. v->left_blk_sh = 0;
  5185. v->top_blk_sh = 3;
  5186. }
  5187. /** Initialize a VC1/WMV3 decoder
  5188. * @todo TODO: Handle VC-1 IDUs (Transport level?)
  5189. * @todo TODO: Decypher remaining bits in extra_data
  5190. */
  5191. static av_cold int vc1_decode_init(AVCodecContext *avctx)
  5192. {
  5193. VC1Context *v = avctx->priv_data;
  5194. MpegEncContext *s = &v->s;
  5195. GetBitContext gb;
  5196. /* save the container output size for WMImage */
  5197. v->output_width = avctx->width;
  5198. v->output_height = avctx->height;
  5199. if (!avctx->extradata_size || !avctx->extradata)
  5200. return -1;
  5201. if (!(avctx->flags & CODEC_FLAG_GRAY))
  5202. avctx->pix_fmt = ff_get_format(avctx, avctx->codec->pix_fmts);
  5203. else
  5204. avctx->pix_fmt = AV_PIX_FMT_GRAY8;
  5205. v->s.avctx = avctx;
  5206. if (ff_vc1_init_common(v) < 0)
  5207. return -1;
  5208. ff_blockdsp_init(&s->bdsp, avctx);
  5209. ff_h264chroma_init(&v->h264chroma, 8);
  5210. ff_qpeldsp_init(&s->qdsp);
  5211. ff_vc1dsp_init(&v->vc1dsp);
  5212. if (avctx->codec_id == AV_CODEC_ID_WMV3 || avctx->codec_id == AV_CODEC_ID_WMV3IMAGE) {
  5213. int count = 0;
  5214. // looks like WMV3 has a sequence header stored in the extradata
  5215. // advanced sequence header may be before the first frame
  5216. // the last byte of the extradata is a version number, 1 for the
  5217. // samples we can decode
  5218. init_get_bits(&gb, avctx->extradata, avctx->extradata_size*8);
  5219. if (ff_vc1_decode_sequence_header(avctx, v, &gb) < 0)
  5220. return -1;
  5221. count = avctx->extradata_size*8 - get_bits_count(&gb);
  5222. if (count > 0) {
  5223. av_log(avctx, AV_LOG_INFO, "Extra data: %i bits left, value: %X\n",
  5224. count, get_bits(&gb, count));
  5225. } else if (count < 0) {
  5226. av_log(avctx, AV_LOG_INFO, "Read %i bits in overflow\n", -count);
  5227. }
  5228. } else { // VC1/WVC1/WVP2
  5229. const uint8_t *start = avctx->extradata;
  5230. uint8_t *end = avctx->extradata + avctx->extradata_size;
  5231. const uint8_t *next;
  5232. int size, buf2_size;
  5233. uint8_t *buf2 = NULL;
  5234. int seq_initialized = 0, ep_initialized = 0;
  5235. if (avctx->extradata_size < 16) {
  5236. av_log(avctx, AV_LOG_ERROR, "Extradata size too small: %i\n", avctx->extradata_size);
  5237. return -1;
  5238. }
  5239. buf2 = av_mallocz(avctx->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE);
  5240. start = find_next_marker(start, end); // in WVC1 extradata first byte is its size, but can be 0 in mkv
  5241. next = start;
  5242. for (; next < end; start = next) {
  5243. next = find_next_marker(start + 4, end);
  5244. size = next - start - 4;
  5245. if (size <= 0)
  5246. continue;
  5247. buf2_size = vc1_unescape_buffer(start + 4, size, buf2);
  5248. init_get_bits(&gb, buf2, buf2_size * 8);
  5249. switch (AV_RB32(start)) {
  5250. case VC1_CODE_SEQHDR:
  5251. if (ff_vc1_decode_sequence_header(avctx, v, &gb) < 0) {
  5252. av_free(buf2);
  5253. return -1;
  5254. }
  5255. seq_initialized = 1;
  5256. break;
  5257. case VC1_CODE_ENTRYPOINT:
  5258. if (ff_vc1_decode_entry_point(avctx, v, &gb) < 0) {
  5259. av_free(buf2);
  5260. return -1;
  5261. }
  5262. ep_initialized = 1;
  5263. break;
  5264. }
  5265. }
  5266. av_free(buf2);
  5267. if (!seq_initialized || !ep_initialized) {
  5268. av_log(avctx, AV_LOG_ERROR, "Incomplete extradata\n");
  5269. return -1;
  5270. }
  5271. v->res_sprite = (avctx->codec_id == AV_CODEC_ID_VC1IMAGE);
  5272. }
  5273. v->sprite_output_frame = av_frame_alloc();
  5274. if (!v->sprite_output_frame)
  5275. return AVERROR(ENOMEM);
  5276. avctx->profile = v->profile;
  5277. if (v->profile == PROFILE_ADVANCED)
  5278. avctx->level = v->level;
  5279. avctx->has_b_frames = !!avctx->max_b_frames;
  5280. s->mb_width = (avctx->coded_width + 15) >> 4;
  5281. s->mb_height = (avctx->coded_height + 15) >> 4;
  5282. if (v->profile == PROFILE_ADVANCED || v->res_fasttx) {
  5283. ff_vc1_init_transposed_scantables(v);
  5284. } else {
  5285. memcpy(v->zz_8x8, ff_wmv1_scantable, 4*64);
  5286. v->left_blk_sh = 3;
  5287. v->top_blk_sh = 0;
  5288. }
  5289. if (avctx->codec_id == AV_CODEC_ID_WMV3IMAGE || avctx->codec_id == AV_CODEC_ID_VC1IMAGE) {
  5290. v->sprite_width = avctx->coded_width;
  5291. v->sprite_height = avctx->coded_height;
  5292. avctx->coded_width = avctx->width = v->output_width;
  5293. avctx->coded_height = avctx->height = v->output_height;
  5294. // prevent 16.16 overflows
  5295. if (v->sprite_width > 1 << 14 ||
  5296. v->sprite_height > 1 << 14 ||
  5297. v->output_width > 1 << 14 ||
  5298. v->output_height > 1 << 14) return -1;
  5299. }
  5300. return 0;
  5301. }
  5302. /** Close a VC1/WMV3 decoder
  5303. * @warning Initial try at using MpegEncContext stuff
  5304. */
  5305. av_cold int ff_vc1_decode_end(AVCodecContext *avctx)
  5306. {
  5307. VC1Context *v = avctx->priv_data;
  5308. int i;
  5309. av_frame_free(&v->sprite_output_frame);
  5310. for (i = 0; i < 4; i++)
  5311. av_freep(&v->sr_rows[i >> 1][i & 1]);
  5312. av_freep(&v->hrd_rate);
  5313. av_freep(&v->hrd_buffer);
  5314. ff_MPV_common_end(&v->s);
  5315. av_freep(&v->mv_type_mb_plane);
  5316. av_freep(&v->direct_mb_plane);
  5317. av_freep(&v->forward_mb_plane);
  5318. av_freep(&v->fieldtx_plane);
  5319. av_freep(&v->acpred_plane);
  5320. av_freep(&v->over_flags_plane);
  5321. av_freep(&v->mb_type_base);
  5322. av_freep(&v->blk_mv_type_base);
  5323. av_freep(&v->mv_f_base);
  5324. av_freep(&v->mv_f_next_base);
  5325. av_freep(&v->block);
  5326. av_freep(&v->cbp_base);
  5327. av_freep(&v->ttblk_base);
  5328. av_freep(&v->is_intra_base); // FIXME use v->mb_type[]
  5329. av_freep(&v->luma_mv_base);
  5330. ff_intrax8_common_end(&v->x8);
  5331. return 0;
  5332. }
  5333. /** Decode a VC1/WMV3 frame
  5334. * @todo TODO: Handle VC-1 IDUs (Transport level?)
  5335. */
  5336. static int vc1_decode_frame(AVCodecContext *avctx, void *data,
  5337. int *got_frame, AVPacket *avpkt)
  5338. {
  5339. const uint8_t *buf = avpkt->data;
  5340. int buf_size = avpkt->size, n_slices = 0, i, ret;
  5341. VC1Context *v = avctx->priv_data;
  5342. MpegEncContext *s = &v->s;
  5343. AVFrame *pict = data;
  5344. uint8_t *buf2 = NULL;
  5345. const uint8_t *buf_start = buf;
  5346. int mb_height, n_slices1;
  5347. struct {
  5348. uint8_t *buf;
  5349. GetBitContext gb;
  5350. int mby_start;
  5351. } *slices = NULL, *tmp;
  5352. /* no supplementary picture */
  5353. if (buf_size == 0 || (buf_size == 4 && AV_RB32(buf) == VC1_CODE_ENDOFSEQ)) {
  5354. /* special case for last picture */
  5355. if (s->low_delay == 0 && s->next_picture_ptr) {
  5356. if ((ret = av_frame_ref(pict, s->next_picture_ptr->f)) < 0)
  5357. return ret;
  5358. s->next_picture_ptr = NULL;
  5359. *got_frame = 1;
  5360. }
  5361. return 0;
  5362. }
  5363. //for advanced profile we may need to parse and unescape data
  5364. if (avctx->codec_id == AV_CODEC_ID_VC1 || avctx->codec_id == AV_CODEC_ID_VC1IMAGE) {
  5365. int buf_size2 = 0;
  5366. buf2 = av_mallocz(buf_size + FF_INPUT_BUFFER_PADDING_SIZE);
  5367. if (IS_MARKER(AV_RB32(buf))) { /* frame starts with marker and needs to be parsed */
  5368. const uint8_t *start, *end, *next;
  5369. int size;
  5370. next = buf;
  5371. for (start = buf, end = buf + buf_size; next < end; start = next) {
  5372. next = find_next_marker(start + 4, end);
  5373. size = next - start - 4;
  5374. if (size <= 0) continue;
  5375. switch (AV_RB32(start)) {
  5376. case VC1_CODE_FRAME:
  5377. if (avctx->hwaccel)
  5378. buf_start = start;
  5379. buf_size2 = vc1_unescape_buffer(start + 4, size, buf2);
  5380. break;
  5381. case VC1_CODE_FIELD: {
  5382. int buf_size3;
  5383. tmp = av_realloc(slices, sizeof(*slices) * (n_slices+1));
  5384. if (!tmp)
  5385. goto err;
  5386. slices = tmp;
  5387. slices[n_slices].buf = av_mallocz(buf_size + FF_INPUT_BUFFER_PADDING_SIZE);
  5388. if (!slices[n_slices].buf)
  5389. goto err;
  5390. buf_size3 = vc1_unescape_buffer(start + 4, size,
  5391. slices[n_slices].buf);
  5392. init_get_bits(&slices[n_slices].gb, slices[n_slices].buf,
  5393. buf_size3 << 3);
  5394. /* assuming that the field marker is at the exact middle,
  5395. hope it's correct */
  5396. slices[n_slices].mby_start = s->mb_height >> 1;
  5397. n_slices1 = n_slices - 1; // index of the last slice of the first field
  5398. n_slices++;
  5399. break;
  5400. }
  5401. case VC1_CODE_ENTRYPOINT: /* it should be before frame data */
  5402. buf_size2 = vc1_unescape_buffer(start + 4, size, buf2);
  5403. init_get_bits(&s->gb, buf2, buf_size2 * 8);
  5404. ff_vc1_decode_entry_point(avctx, v, &s->gb);
  5405. break;
  5406. case VC1_CODE_SLICE: {
  5407. int buf_size3;
  5408. tmp = av_realloc(slices, sizeof(*slices) * (n_slices+1));
  5409. if (!tmp)
  5410. goto err;
  5411. slices = tmp;
  5412. slices[n_slices].buf = av_mallocz(buf_size + FF_INPUT_BUFFER_PADDING_SIZE);
  5413. if (!slices[n_slices].buf)
  5414. goto err;
  5415. buf_size3 = vc1_unescape_buffer(start + 4, size,
  5416. slices[n_slices].buf);
  5417. init_get_bits(&slices[n_slices].gb, slices[n_slices].buf,
  5418. buf_size3 << 3);
  5419. slices[n_slices].mby_start = get_bits(&slices[n_slices].gb, 9);
  5420. n_slices++;
  5421. break;
  5422. }
  5423. }
  5424. }
  5425. } else if (v->interlace && ((buf[0] & 0xC0) == 0xC0)) { /* WVC1 interlaced stores both fields divided by marker */
  5426. const uint8_t *divider;
  5427. int buf_size3;
  5428. divider = find_next_marker(buf, buf + buf_size);
  5429. if ((divider == (buf + buf_size)) || AV_RB32(divider) != VC1_CODE_FIELD) {
  5430. av_log(avctx, AV_LOG_ERROR, "Error in WVC1 interlaced frame\n");
  5431. goto err;
  5432. } else { // found field marker, unescape second field
  5433. tmp = av_realloc(slices, sizeof(*slices) * (n_slices+1));
  5434. if (!tmp)
  5435. goto err;
  5436. slices = tmp;
  5437. slices[n_slices].buf = av_mallocz(buf_size + FF_INPUT_BUFFER_PADDING_SIZE);
  5438. if (!slices[n_slices].buf)
  5439. goto err;
  5440. buf_size3 = vc1_unescape_buffer(divider + 4, buf + buf_size - divider - 4, slices[n_slices].buf);
  5441. init_get_bits(&slices[n_slices].gb, slices[n_slices].buf,
  5442. buf_size3 << 3);
  5443. slices[n_slices].mby_start = s->mb_height >> 1;
  5444. n_slices1 = n_slices - 1;
  5445. n_slices++;
  5446. }
  5447. buf_size2 = vc1_unescape_buffer(buf, divider - buf, buf2);
  5448. } else {
  5449. buf_size2 = vc1_unescape_buffer(buf, buf_size, buf2);
  5450. }
  5451. init_get_bits(&s->gb, buf2, buf_size2*8);
  5452. } else
  5453. init_get_bits(&s->gb, buf, buf_size*8);
  5454. if (v->res_sprite) {
  5455. v->new_sprite = !get_bits1(&s->gb);
  5456. v->two_sprites = get_bits1(&s->gb);
  5457. /* res_sprite means a Windows Media Image stream, AV_CODEC_ID_*IMAGE means
  5458. we're using the sprite compositor. These are intentionally kept separate
  5459. so you can get the raw sprites by using the wmv3 decoder for WMVP or
  5460. the vc1 one for WVP2 */
  5461. if (avctx->codec_id == AV_CODEC_ID_WMV3IMAGE || avctx->codec_id == AV_CODEC_ID_VC1IMAGE) {
  5462. if (v->new_sprite) {
  5463. // switch AVCodecContext parameters to those of the sprites
  5464. avctx->width = avctx->coded_width = v->sprite_width;
  5465. avctx->height = avctx->coded_height = v->sprite_height;
  5466. } else {
  5467. goto image;
  5468. }
  5469. }
  5470. }
  5471. if (s->context_initialized &&
  5472. (s->width != avctx->coded_width ||
  5473. s->height != avctx->coded_height)) {
  5474. ff_vc1_decode_end(avctx);
  5475. }
  5476. if (!s->context_initialized) {
  5477. if (ff_msmpeg4_decode_init(avctx) < 0)
  5478. goto err;
  5479. if (ff_vc1_decode_init_alloc_tables(v) < 0) {
  5480. ff_MPV_common_end(s);
  5481. goto err;
  5482. }
  5483. s->low_delay = !avctx->has_b_frames || v->res_sprite;
  5484. if (v->profile == PROFILE_ADVANCED) {
  5485. s->h_edge_pos = avctx->coded_width;
  5486. s->v_edge_pos = avctx->coded_height;
  5487. }
  5488. }
  5489. // do parse frame header
  5490. v->pic_header_flag = 0;
  5491. v->first_pic_header_flag = 1;
  5492. if (v->profile < PROFILE_ADVANCED) {
  5493. if (ff_vc1_parse_frame_header(v, &s->gb) < 0) {
  5494. goto err;
  5495. }
  5496. } else {
  5497. if (ff_vc1_parse_frame_header_adv(v, &s->gb) < 0) {
  5498. goto err;
  5499. }
  5500. }
  5501. v->first_pic_header_flag = 0;
  5502. if ((avctx->codec_id == AV_CODEC_ID_WMV3IMAGE || avctx->codec_id == AV_CODEC_ID_VC1IMAGE)
  5503. && s->pict_type != AV_PICTURE_TYPE_I) {
  5504. av_log(v->s.avctx, AV_LOG_ERROR, "Sprite decoder: expected I-frame\n");
  5505. goto err;
  5506. }
  5507. // for skipping the frame
  5508. s->current_picture.f->pict_type = s->pict_type;
  5509. s->current_picture.f->key_frame = s->pict_type == AV_PICTURE_TYPE_I;
  5510. /* skip B-frames if we don't have reference frames */
  5511. if (s->last_picture_ptr == NULL && (s->pict_type == AV_PICTURE_TYPE_B || s->droppable)) {
  5512. goto end;
  5513. }
  5514. if ((avctx->skip_frame >= AVDISCARD_NONREF && s->pict_type == AV_PICTURE_TYPE_B) ||
  5515. (avctx->skip_frame >= AVDISCARD_NONKEY && s->pict_type != AV_PICTURE_TYPE_I) ||
  5516. avctx->skip_frame >= AVDISCARD_ALL) {
  5517. goto end;
  5518. }
  5519. if (s->next_p_frame_damaged) {
  5520. if (s->pict_type == AV_PICTURE_TYPE_B)
  5521. goto end;
  5522. else
  5523. s->next_p_frame_damaged = 0;
  5524. }
  5525. if (ff_MPV_frame_start(s, avctx) < 0) {
  5526. goto err;
  5527. }
  5528. // process pulldown flags
  5529. s->current_picture_ptr->f->repeat_pict = 0;
  5530. // Pulldown flags are only valid when 'broadcast' has been set.
  5531. // So ticks_per_frame will be 2
  5532. if (v->rff) {
  5533. // repeat field
  5534. s->current_picture_ptr->f->repeat_pict = 1;
  5535. } else if (v->rptfrm) {
  5536. // repeat frames
  5537. s->current_picture_ptr->f->repeat_pict = v->rptfrm * 2;
  5538. }
  5539. s->me.qpel_put = s->qdsp.put_qpel_pixels_tab;
  5540. s->me.qpel_avg = s->qdsp.avg_qpel_pixels_tab;
  5541. if (avctx->hwaccel) {
  5542. if (avctx->hwaccel->start_frame(avctx, buf, buf_size) < 0)
  5543. goto err;
  5544. if (avctx->hwaccel->decode_slice(avctx, buf_start, (buf + buf_size) - buf_start) < 0)
  5545. goto err;
  5546. if (avctx->hwaccel->end_frame(avctx) < 0)
  5547. goto err;
  5548. } else {
  5549. int header_ret = 0;
  5550. ff_mpeg_er_frame_start(s);
  5551. v->bits = buf_size * 8;
  5552. v->end_mb_x = s->mb_width;
  5553. if (v->field_mode) {
  5554. s->current_picture.f->linesize[0] <<= 1;
  5555. s->current_picture.f->linesize[1] <<= 1;
  5556. s->current_picture.f->linesize[2] <<= 1;
  5557. s->linesize <<= 1;
  5558. s->uvlinesize <<= 1;
  5559. }
  5560. mb_height = s->mb_height >> v->field_mode;
  5561. if (!mb_height) {
  5562. av_log(v->s.avctx, AV_LOG_ERROR, "Invalid mb_height.\n");
  5563. goto err;
  5564. }
  5565. for (i = 0; i <= n_slices; i++) {
  5566. if (i > 0 && slices[i - 1].mby_start >= mb_height) {
  5567. if (v->field_mode <= 0) {
  5568. av_log(v->s.avctx, AV_LOG_ERROR, "Slice %d starts beyond "
  5569. "picture boundary (%d >= %d)\n", i,
  5570. slices[i - 1].mby_start, mb_height);
  5571. continue;
  5572. }
  5573. v->second_field = 1;
  5574. v->blocks_off = s->mb_width * s->mb_height << 1;
  5575. v->mb_off = s->mb_stride * s->mb_height >> 1;
  5576. } else {
  5577. v->second_field = 0;
  5578. v->blocks_off = 0;
  5579. v->mb_off = 0;
  5580. }
  5581. if (i) {
  5582. v->pic_header_flag = 0;
  5583. if (v->field_mode && i == n_slices1 + 2) {
  5584. if ((header_ret = ff_vc1_parse_frame_header_adv(v, &s->gb)) < 0) {
  5585. av_log(v->s.avctx, AV_LOG_ERROR, "Field header damaged\n");
  5586. if (avctx->err_recognition & AV_EF_EXPLODE)
  5587. goto err;
  5588. continue;
  5589. }
  5590. } else if (get_bits1(&s->gb)) {
  5591. v->pic_header_flag = 1;
  5592. if ((header_ret = ff_vc1_parse_frame_header_adv(v, &s->gb)) < 0) {
  5593. av_log(v->s.avctx, AV_LOG_ERROR, "Slice header damaged\n");
  5594. if (avctx->err_recognition & AV_EF_EXPLODE)
  5595. goto err;
  5596. continue;
  5597. }
  5598. }
  5599. }
  5600. if (header_ret < 0)
  5601. continue;
  5602. s->start_mb_y = (i == 0) ? 0 : FFMAX(0, slices[i-1].mby_start % mb_height);
  5603. if (!v->field_mode || v->second_field)
  5604. s->end_mb_y = (i == n_slices ) ? mb_height : FFMIN(mb_height, slices[i].mby_start % mb_height);
  5605. else
  5606. s->end_mb_y = (i <= n_slices1 + 1) ? mb_height : FFMIN(mb_height, slices[i].mby_start % mb_height);
  5607. ff_vc1_decode_blocks(v);
  5608. if (i != n_slices)
  5609. s->gb = slices[i].gb;
  5610. }
  5611. if (v->field_mode) {
  5612. v->second_field = 0;
  5613. s->current_picture.f->linesize[0] >>= 1;
  5614. s->current_picture.f->linesize[1] >>= 1;
  5615. s->current_picture.f->linesize[2] >>= 1;
  5616. s->linesize >>= 1;
  5617. s->uvlinesize >>= 1;
  5618. if (v->s.pict_type != AV_PICTURE_TYPE_BI && v->s.pict_type != AV_PICTURE_TYPE_B) {
  5619. FFSWAP(uint8_t *, v->mv_f_next[0], v->mv_f[0]);
  5620. FFSWAP(uint8_t *, v->mv_f_next[1], v->mv_f[1]);
  5621. }
  5622. }
  5623. av_dlog(s->avctx, "Consumed %i/%i bits\n",
  5624. get_bits_count(&s->gb), s->gb.size_in_bits);
  5625. // if (get_bits_count(&s->gb) > buf_size * 8)
  5626. // return -1;
  5627. if (!v->field_mode)
  5628. ff_er_frame_end(&s->er);
  5629. }
  5630. ff_MPV_frame_end(s);
  5631. if (avctx->codec_id == AV_CODEC_ID_WMV3IMAGE || avctx->codec_id == AV_CODEC_ID_VC1IMAGE) {
  5632. image:
  5633. avctx->width = avctx->coded_width = v->output_width;
  5634. avctx->height = avctx->coded_height = v->output_height;
  5635. if (avctx->skip_frame >= AVDISCARD_NONREF)
  5636. goto end;
  5637. #if CONFIG_WMV3IMAGE_DECODER || CONFIG_VC1IMAGE_DECODER
  5638. if (vc1_decode_sprites(v, &s->gb))
  5639. goto err;
  5640. #endif
  5641. if ((ret = av_frame_ref(pict, v->sprite_output_frame)) < 0)
  5642. goto err;
  5643. *got_frame = 1;
  5644. } else {
  5645. if (s->pict_type == AV_PICTURE_TYPE_B || s->low_delay) {
  5646. if ((ret = av_frame_ref(pict, s->current_picture_ptr->f)) < 0)
  5647. goto err;
  5648. ff_print_debug_info(s, s->current_picture_ptr);
  5649. *got_frame = 1;
  5650. } else if (s->last_picture_ptr != NULL) {
  5651. if ((ret = av_frame_ref(pict, s->last_picture_ptr->f)) < 0)
  5652. goto err;
  5653. ff_print_debug_info(s, s->last_picture_ptr);
  5654. *got_frame = 1;
  5655. }
  5656. }
  5657. end:
  5658. av_free(buf2);
  5659. for (i = 0; i < n_slices; i++)
  5660. av_free(slices[i].buf);
  5661. av_free(slices);
  5662. return buf_size;
  5663. err:
  5664. av_free(buf2);
  5665. for (i = 0; i < n_slices; i++)
  5666. av_free(slices[i].buf);
  5667. av_free(slices);
  5668. return -1;
  5669. }
  5670. static const AVProfile profiles[] = {
  5671. { FF_PROFILE_VC1_SIMPLE, "Simple" },
  5672. { FF_PROFILE_VC1_MAIN, "Main" },
  5673. { FF_PROFILE_VC1_COMPLEX, "Complex" },
  5674. { FF_PROFILE_VC1_ADVANCED, "Advanced" },
  5675. { FF_PROFILE_UNKNOWN },
  5676. };
  5677. static const enum AVPixelFormat vc1_hwaccel_pixfmt_list_420[] = {
  5678. #if CONFIG_VC1_DXVA2_HWACCEL
  5679. AV_PIX_FMT_DXVA2_VLD,
  5680. #endif
  5681. #if CONFIG_VC1_VAAPI_HWACCEL
  5682. AV_PIX_FMT_VAAPI_VLD,
  5683. #endif
  5684. #if CONFIG_VC1_VDPAU_HWACCEL
  5685. AV_PIX_FMT_VDPAU,
  5686. #endif
  5687. AV_PIX_FMT_YUV420P,
  5688. AV_PIX_FMT_NONE
  5689. };
  5690. AVCodec ff_vc1_decoder = {
  5691. .name = "vc1",
  5692. .long_name = NULL_IF_CONFIG_SMALL("SMPTE VC-1"),
  5693. .type = AVMEDIA_TYPE_VIDEO,
  5694. .id = AV_CODEC_ID_VC1,
  5695. .priv_data_size = sizeof(VC1Context),
  5696. .init = vc1_decode_init,
  5697. .close = ff_vc1_decode_end,
  5698. .decode = vc1_decode_frame,
  5699. .flush = ff_mpeg_flush,
  5700. .capabilities = CODEC_CAP_DR1 | CODEC_CAP_DELAY,
  5701. .pix_fmts = vc1_hwaccel_pixfmt_list_420,
  5702. .profiles = NULL_IF_CONFIG_SMALL(profiles)
  5703. };
  5704. #if CONFIG_WMV3_DECODER
  5705. AVCodec ff_wmv3_decoder = {
  5706. .name = "wmv3",
  5707. .long_name = NULL_IF_CONFIG_SMALL("Windows Media Video 9"),
  5708. .type = AVMEDIA_TYPE_VIDEO,
  5709. .id = AV_CODEC_ID_WMV3,
  5710. .priv_data_size = sizeof(VC1Context),
  5711. .init = vc1_decode_init,
  5712. .close = ff_vc1_decode_end,
  5713. .decode = vc1_decode_frame,
  5714. .flush = ff_mpeg_flush,
  5715. .capabilities = CODEC_CAP_DR1 | CODEC_CAP_DELAY,
  5716. .pix_fmts = vc1_hwaccel_pixfmt_list_420,
  5717. .profiles = NULL_IF_CONFIG_SMALL(profiles)
  5718. };
  5719. #endif
  5720. #if CONFIG_WMV3IMAGE_DECODER
  5721. AVCodec ff_wmv3image_decoder = {
  5722. .name = "wmv3image",
  5723. .long_name = NULL_IF_CONFIG_SMALL("Windows Media Video 9 Image"),
  5724. .type = AVMEDIA_TYPE_VIDEO,
  5725. .id = AV_CODEC_ID_WMV3IMAGE,
  5726. .priv_data_size = sizeof(VC1Context),
  5727. .init = vc1_decode_init,
  5728. .close = ff_vc1_decode_end,
  5729. .decode = vc1_decode_frame,
  5730. .capabilities = CODEC_CAP_DR1,
  5731. .flush = vc1_sprite_flush,
  5732. .pix_fmts = (const enum AVPixelFormat[]) {
  5733. AV_PIX_FMT_YUV420P,
  5734. AV_PIX_FMT_NONE
  5735. },
  5736. };
  5737. #endif
  5738. #if CONFIG_VC1IMAGE_DECODER
  5739. AVCodec ff_vc1image_decoder = {
  5740. .name = "vc1image",
  5741. .long_name = NULL_IF_CONFIG_SMALL("Windows Media Video 9 Image v2"),
  5742. .type = AVMEDIA_TYPE_VIDEO,
  5743. .id = AV_CODEC_ID_VC1IMAGE,
  5744. .priv_data_size = sizeof(VC1Context),
  5745. .init = vc1_decode_init,
  5746. .close = ff_vc1_decode_end,
  5747. .decode = vc1_decode_frame,
  5748. .capabilities = CODEC_CAP_DR1,
  5749. .flush = vc1_sprite_flush,
  5750. .pix_fmts = (const enum AVPixelFormat[]) {
  5751. AV_PIX_FMT_YUV420P,
  5752. AV_PIX_FMT_NONE
  5753. },
  5754. };
  5755. #endif