You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

465 lines
15KB

  1. /*
  2. * VC-1 and WMV3 decoder
  3. * Copyright (c) 2006-2007 Konstantin Shishkov
  4. * Partly based on vc9.c (c) 2005 Anonymous, Alex Beregszaszi, Michael Niedermayer
  5. *
  6. * This file is part of Libav.
  7. *
  8. * Libav is free software; you can redistribute it and/or
  9. * modify it under the terms of the GNU Lesser General Public
  10. * License as published by the Free Software Foundation; either
  11. * version 2.1 of the License, or (at your option) any later version.
  12. *
  13. * Libav is distributed in the hope that it will be useful,
  14. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  16. * Lesser General Public License for more details.
  17. *
  18. * You should have received a copy of the GNU Lesser General Public
  19. * License along with Libav; if not, write to the Free Software
  20. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21. */
  22. #ifndef AVCODEC_VC1_H
  23. #define AVCODEC_VC1_H
  24. #include "avcodec.h"
  25. #include "h264chroma.h"
  26. #include "mpegvideo.h"
  27. #include "intrax8.h"
  28. #include "vc1dsp.h"
  29. #define AC_VLC_BITS 9
  /**
   * @name Start codes
   * Markers used in VC-1 Advanced Profile frame data. Every code shares the
   * 00 00 01 prefix and differs only in its lowest byte.
   */
  //@{
  enum VC1Code {
      VC1_CODE_RES0       = 0x00000100, ///< base value; also the pattern IS_MARKER() compares against
      VC1_CODE_ENDOFSEQ   = 0x0000010A,
      VC1_CODE_SLICE      = 0x0000010B,
      VC1_CODE_FIELD      = 0x0000010C,
      VC1_CODE_FRAME      = 0x0000010D,
      VC1_CODE_ENTRYPOINT = 0x0000010E,
      VC1_CODE_SEQHDR     = 0x0000010F
  };
  //@}

  /** Non-zero when x, with its lowest byte masked off, equals VC1_CODE_RES0. */
  #define IS_MARKER(x) (VC1_CODE_RES0 == ((x) & ~0xFF))
  /** Profiles known to the decoder */
  //@{
  enum Profile {
      PROFILE_SIMPLE   = 0,
      PROFILE_MAIN     = 1,
      PROFILE_COMPLEX  = 2, ///< TODO: WMV9 specific
      PROFILE_ADVANCED = 3
  };
  //@}
  /** Quantizer mode signalled for the whole sequence */
  //@{
  enum QuantMode {
      QUANT_FRAME_IMPLICIT = 0, ///< Implicitly specified at frame level
      QUANT_FRAME_EXPLICIT = 1, ///< Explicitly specified at frame level
      QUANT_NON_UNIFORM    = 2, ///< Non-uniform quant used for all frames
      QUANT_UNIFORM        = 3  ///< Uniform quant used for all frames
  };
  //@}
  /** Parts of the picture in which the quantizer may change */
  //@{
  enum DQProfile {
      DQPROFILE_FOUR_EDGES   = 0,
      DQPROFILE_DOUBLE_EDGES = 1,
      DQPROFILE_SINGLE_EDGE  = 2,
      DQPROFILE_ALL_MBS      = 3
  };
  //@}
  /** @name Single-edge selector
   * Names one picture edge; the single-edge counterpart of DQDoubleEdge.
   * NOTE(review): presumably the edge quantized with ALTPQUANT when
   * DQPROFILE_SINGLE_EDGE is in use -- confirm against the decoder.
   */
  //@{
  enum DQSingleEdge {
      DQSINGLE_BEDGE_LEFT   = 0,
      DQSINGLE_BEDGE_TOP    = 1,
      DQSINGLE_BEDGE_RIGHT  = 2,
      DQSINGLE_BEDGE_BOTTOM = 3
  };
  //@}
  /** Pair of adjacent edges that is quantized with ALTPQUANT */
  //@{
  enum DQDoubleEdge {
      DQDOUBLE_BEDGE_TOPLEFT     = 0,
      DQDOUBLE_BEDGE_TOPRIGHT    = 1,
      DQDOUBLE_BEDGE_BOTTOMRIGHT = 2,
      DQDOUBLE_BEDGE_BOTTOMLEFT  = 3
  };
  //@}
  /** Motion vector modes for P frames */
  //@{
  enum MVModes {
      MV_PMODE_1MV_HPEL_BILIN = 0,
      MV_PMODE_1MV            = 1,
      MV_PMODE_1MV_HPEL       = 2,
      MV_PMODE_MIXED_MV       = 3,
      MV_PMODE_INTENSITY_COMP = 4
  };
  //@}
  /** MBMODE values for P-pictures coded as interlaced frames */
  //@{
  enum MBModesIntfr {
      MV_PMODE_INTFR_1MV       = 0,
      MV_PMODE_INTFR_2MV_FIELD = 1,
      MV_PMODE_INTFR_2MV       = 2,
      MV_PMODE_INTFR_4MV_FIELD = 3,
      MV_PMODE_INTFR_4MV       = 4,
      MV_PMODE_INTFR_INTRA     = 5
  };
  //@}
  /** @name Motion vector types for B frames */
  //@{
  enum BMVTypes {
      BMV_TYPE_BACKWARD     = 0,
      BMV_TYPE_FORWARD      = 1,
      BMV_TYPE_INTERPOLATED = 2,
      BMV_TYPE_DIRECT       = 3
  };
  //@}
  /** @name Block (transform) types for P/B frames */
  //@{
  enum TransformTypes {
      TT_8X8        = 0,
      TT_8X4_BOTTOM = 1,
      TT_8X4_TOP    = 2,
      TT_8X4        = 3, ///< both 8x4 halves
      TT_4X8_RIGHT  = 4,
      TT_4X8_LEFT   = 5,
      TT_4X8        = 6, ///< both 4x8 halves
      TT_4X4        = 7
  };
  //@}
  /**
   * Coding table sets, in intra/inter pairs.
   * The VC1Context members codingset and codingset2 are documented as
   * indexes of such a table set.
   */
  enum CodingSet {
      CS_HIGH_MOT_INTRA  = 0,
      CS_HIGH_MOT_INTER  = 1,
      CS_LOW_MOT_INTRA   = 2,
      CS_LOW_MOT_INTER   = 3,
      CS_MID_RATE_INTRA  = 4,
      CS_MID_RATE_INTER  = 5,
      CS_HIGH_RATE_INTRA = 6,
      CS_HIGH_RATE_INTER = 7
  };
  /** @name Conditional overlap settings for Advanced Profile */
  //@{
  enum COTypes {
      CONDOVER_NONE   = 0,
      CONDOVER_ALL    = 1,
      CONDOVER_SELECT = 2
  };
  //@}
  /**
   * Frame Coding Mode (FCM).
   * @note Content may be flagged as interlaced and still carry fcm == 0
   *       (e.g. HD-DVD).
   */
  enum FrameCodingMode {
      PROGRESSIVE = 0, ///< reported in the bitstream as 00b
      ILACE_FRAME = 1, ///< reported in the bitstream as 10b
      ILACE_FIELD = 2  ///< reported in the bitstream as 11b
  };
  160. /** The VC1 Context
  161. * @todo Change size wherever another size is more efficient
  162. * Many members are only used for Advanced Profile
  163. */
  164. typedef struct VC1Context{
  165. MpegEncContext s;
  166. IntraX8Context x8;
  167. H264ChromaContext h264chroma;
  168. VC1DSPContext vc1dsp;
  169. int bits;
  170. /** Simple/Main Profile sequence header */
  171. //@{
  172. int res_sprite; ///< reserved, sprite mode
  173. int res_y411; ///< reserved, old interlaced mode
  174. int res_x8; ///< reserved
  175. int multires; ///< frame-level RESPIC syntax element present
  176. int res_fasttx; ///< reserved, always 1
  177. int res_transtab; ///< reserved, always 0
  178. int rangered; ///< RANGEREDFRM (range reduction) syntax element present
  179. ///< at frame level
  180. int res_rtm_flag; ///< reserved, set to 1
  181. int reserved; ///< reserved
  182. //@}
  183. /** Advanced Profile */
  184. //@{
  185. int level; ///< 3bits, for Advanced/Simple Profile, provided by TS layer
  186. int chromaformat; ///< 2bits, 2=4:2:0, only defined
  187. int postprocflag; ///< Per-frame processing suggestion flag present
  188. int broadcast; ///< TFF/RFF present
  189. int interlace; ///< Progressive/interlaced (RPTFTM syntax element)
  190. int tfcntrflag; ///< TFCNTR present
  191. int panscanflag; ///< NUMPANSCANWIN, TOPLEFT{X,Y}, BOTRIGHT{X,Y} present
  192. int refdist_flag; ///< REFDIST syntax element present in II, IP, PI or PP field picture headers
  193. int extended_dmv; ///< Additional extended dmv range at P/B frame-level
  194. int color_prim; ///< 8bits, chroma coordinates of the color primaries
  195. int transfer_char; ///< 8bits, Opto-electronic transfer characteristics
  196. int matrix_coef; ///< 8bits, Color primaries->YCbCr transform matrix
  197. int hrd_param_flag; ///< Presence of Hypothetical Reference
  198. ///< Decoder parameters
  199. int psf; ///< Progressive Segmented Frame
  200. //@}
  201. /** Sequence header data for all Profiles
  202. * TODO: choose between ints, uint8_ts and monobit flags
  203. */
  204. //@{
  205. int profile; ///< 2bits, Profile
  206. int frmrtq_postproc; ///< 3bits,
  207. int bitrtq_postproc; ///< 5bits, quantized framerate-based postprocessing strength
  208. int fastuvmc; ///< Rounding of qpel vector to hpel ? (not in Simple)
  209. int extended_mv; ///< Ext MV in P/B (not in Simple)
  210. int dquant; ///< How qscale varies with MBs, 2bits (not in Simple)
  211. int vstransform; ///< variable-size [48]x[48] transform type + info
  212. int overlap; ///< overlapped transforms in use
  213. int quantizer_mode; ///< 2bits, quantizer mode used for sequence, see QUANT_*
  214. int finterpflag; ///< INTERPFRM present
  215. //@}
  216. /** Frame decoding info for all profiles */
  217. //@{
  218. uint8_t mv_mode; ///< MV coding monde
  219. uint8_t mv_mode2; ///< Secondary MV coding mode (B frames)
  220. int k_x; ///< Number of bits for MVs (depends on MV range)
  221. int k_y; ///< Number of bits for MVs (depends on MV range)
  222. int range_x, range_y; ///< MV range
  223. uint8_t pq, altpq; ///< Current/alternate frame quantizer scale
  224. uint8_t zz_8x8[4][64]; ///< Zigzag table for TT_8x8, permuted for IDCT
  225. int left_blk_sh, top_blk_sh; ///< Either 3 or 0, positions of l/t in blk[]
  226. const uint8_t* zz_8x4; ///< Zigzag scan table for TT_8x4 coding mode
  227. const uint8_t* zz_4x8; ///< Zigzag scan table for TT_4x8 coding mode
  228. /** pquant parameters */
  229. //@{
  230. uint8_t dquantfrm;
  231. uint8_t dqprofile;
  232. uint8_t dqsbedge;
  233. uint8_t dqbilevel;
  234. //@}
  235. /** AC coding set indexes
  236. * @see 8.1.1.10, p(1)10
  237. */
  238. //@{
  239. int c_ac_table_index; ///< Chroma index from ACFRM element
  240. int y_ac_table_index; ///< Luma index from AC2FRM element
  241. //@}
  242. int ttfrm; ///< Transform type info present at frame level
  243. uint8_t ttmbf; ///< Transform type flag
  244. int *ttblk_base, *ttblk; ///< Transform type at the block level
  245. int codingset; ///< index of current table set from 11.8 to use for luma block decoding
  246. int codingset2; ///< index of current table set from 11.8 to use for chroma block decoding
  247. int pqindex; ///< raw pqindex used in coding set selection
  248. int a_avail, c_avail;
  249. uint8_t *mb_type_base, *mb_type[3];
  250. /** Luma compensation parameters */
  251. //@{
  252. uint8_t lumscale;
  253. uint8_t lumshift;
  254. //@}
  255. int16_t bfraction; ///< Relative position % anchors=> how to scale MVs
  256. uint8_t halfpq; ///< Uniform quant over image and qp+.5
  257. uint8_t respic; ///< Frame-level flag for resized images
  258. int buffer_fullness; ///< HRD info
  259. /** Ranges:
  260. * -# 0 -> [-64n 63.f] x [-32, 31.f]
  261. * -# 1 -> [-128, 127.f] x [-64, 63.f]
  262. * -# 2 -> [-512, 511.f] x [-128, 127.f]
  263. * -# 3 -> [-1024, 1023.f] x [-256, 255.f]
  264. */
  265. uint8_t mvrange; ///< Extended MV range flag
  266. uint8_t pquantizer; ///< Uniform (over sequence) quantizer in use
  267. VLC *cbpcy_vlc; ///< CBPCY VLC table
  268. int tt_index; ///< Index for Transform Type tables (to decode TTMB)
  269. uint8_t* mv_type_mb_plane; ///< bitplane for mv_type == (4MV)
  270. uint8_t* direct_mb_plane; ///< bitplane for "direct" MBs
  271. uint8_t* forward_mb_plane; ///< bitplane for "forward" MBs
  272. int mv_type_is_raw; ///< mv type mb plane is not coded
  273. int dmb_is_raw; ///< direct mb plane is raw
  274. int fmb_is_raw; ///< forward mb plane is raw
  275. int skip_is_raw; ///< skip mb plane is not coded
  276. uint8_t last_luty[2][256], last_lutuv[2][256]; ///< lookup tables used for intensity compensation
  277. uint8_t aux_luty[2][256], aux_lutuv[2][256]; ///< lookup tables used for intensity compensation
  278. uint8_t next_luty[2][256], next_lutuv[2][256]; ///< lookup tables used for intensity compensation
  279. uint8_t (*curr_luty)[256] ,(*curr_lutuv)[256];
  280. int last_use_ic, curr_use_ic, next_use_ic, aux_use_ic;
  281. int rnd; ///< rounding control
  282. /** Frame decoding info for S/M profiles only */
  283. //@{
  284. uint8_t rangeredfrm; ///< out_sample = CLIP((in_sample-128)*2+128)
  285. uint8_t interpfrm;
  286. //@}
  287. /** Frame decoding info for Advanced profile */
  288. //@{
  289. enum FrameCodingMode fcm;
  290. uint8_t numpanscanwin;
  291. uint8_t tfcntr;
  292. uint8_t rptfrm, tff, rff;
  293. uint16_t topleftx;
  294. uint16_t toplefty;
  295. uint16_t bottomrightx;
  296. uint16_t bottomrighty;
  297. uint8_t uvsamp;
  298. uint8_t postproc;
  299. int hrd_num_leaky_buckets;
  300. uint8_t bit_rate_exponent;
  301. uint8_t buffer_size_exponent;
  302. uint8_t* acpred_plane; ///< AC prediction flags bitplane
  303. int acpred_is_raw;
  304. uint8_t* over_flags_plane; ///< Overflags bitplane
  305. int overflg_is_raw;
  306. uint8_t condover;
  307. uint16_t *hrd_rate, *hrd_buffer;
  308. uint8_t *hrd_fullness;
  309. uint8_t range_mapy_flag;
  310. uint8_t range_mapuv_flag;
  311. uint8_t range_mapy;
  312. uint8_t range_mapuv;
  313. //@}
  314. /** Frame decoding info for interlaced picture */
  315. uint8_t dmvrange; ///< Extended differential MV range flag
  316. int fourmvswitch;
  317. int intcomp;
  318. uint8_t lumscale2; ///< for interlaced field P picture
  319. uint8_t lumshift2;
  320. VLC* mbmode_vlc;
  321. VLC* imv_vlc;
  322. VLC* twomvbp_vlc;
  323. VLC* fourmvbp_vlc;
  324. uint8_t twomvbp;
  325. uint8_t fourmvbp;
  326. uint8_t* fieldtx_plane;
  327. int fieldtx_is_raw;
  328. int8_t zzi_8x8[64];
  329. uint8_t *blk_mv_type_base, *blk_mv_type; ///< 0: frame MV, 1: field MV (interlaced frame)
  330. uint8_t *mv_f_base, *mv_f[2]; ///< 0: MV obtained from same field, 1: opposite field
  331. uint8_t *mv_f_next_base, *mv_f_next[2];
  332. int field_mode; ///< 1 for interlaced field pictures
  333. int fptype;
  334. int second_field;
  335. int refdist; ///< distance of the current picture from reference
  336. int numref; ///< number of past field pictures used as reference
  337. // 0 corresponds to 1 and 1 corresponds to 2 references
  338. int reffield; ///< if numref = 0 (1 reference) then reffield decides which
  339. // field to use among the two fields from previous frame
  340. int intcompfield; ///< which of the two fields to be intensity compensated
  341. // 0: both fields, 1: bottom field, 2: top field
  342. int cur_field_type; ///< 0: top, 1: bottom
  343. int ref_field_type[2]; ///< forward and backward reference field type (top or bottom)
  344. int blocks_off, mb_off;
  345. int qs_last; ///< if qpel has been used in the previous (tr.) picture
  346. int bmvtype;
  347. int frfd, brfd; ///< reference frame distance (forward or backward)
  348. int first_pic_header_flag;
  349. int pic_header_flag;
  350. /** Frame decoding info for sprite modes */
  351. //@{
  352. int new_sprite;
  353. int two_sprites;
  354. AVFrame *sprite_output_frame;
  355. int output_width, output_height, sprite_width, sprite_height;
  356. uint8_t* sr_rows[2][2]; ///< Sprite resizer line cache
  357. //@}
  358. int p_frame_skipped;
  359. int bi_type;
  360. int x8_type;
  361. int16_t (*block)[6][64];
  362. int n_allocated_blks, cur_blk_idx, left_blk_idx, topleft_blk_idx, top_blk_idx;
  363. uint32_t *cbp_base, *cbp;
  364. uint8_t *is_intra_base, *is_intra;
  365. int16_t (*luma_mv_base)[2], (*luma_mv)[2];
  366. uint8_t bfraction_lut_index; ///< Index for BFRACTION value (see Table 40, reproduced into ff_vc1_bfraction_lut[])
  367. uint8_t broken_link; ///< Broken link flag (BROKEN_LINK syntax element)
  368. uint8_t closed_entry; ///< Closed entry point flag (CLOSED_ENTRY syntax element)
  369. int end_mb_x; ///< Horizontal macroblock limit (used only by mss2)
  370. int parse_only; ///< Context is used within parser
  371. int resync_marker; ///< could this stream contain resync markers
  372. } VC1Context;
  373. /** Find VC-1 marker in buffer
  374. * @return position where next marker starts or end of buffer if no marker found
  375. */
  376. static av_always_inline const uint8_t* find_next_marker(const uint8_t *src, const uint8_t *end)
  377. {
  378. uint32_t mrk = 0xFFFFFFFF;
  379. if (end-src < 4)
  380. return end;
  381. while (src < end) {
  382. mrk = (mrk << 8) | *src++;
  383. if (IS_MARKER(mrk))
  384. return src - 4;
  385. }
  386. return end;
  387. }
  388. static av_always_inline int vc1_unescape_buffer(const uint8_t *src, int size, uint8_t *dst)
  389. {
  390. int dsize = 0, i;
  391. if (size < 4) {
  392. for (dsize = 0; dsize < size; dsize++)
  393. *dst++ = *src++;
  394. return size;
  395. }
  396. for (i = 0; i < size; i++, src++) {
  397. if (src[0] == 3 && i >= 2 && !src[-1] && !src[-2] && i < size-1 && src[1] < 4) {
  398. dst[dsize++] = src[1];
  399. src++;
  400. i++;
  401. } else
  402. dst[dsize++] = *src;
  403. }
  404. return dsize;
  405. }
  406. /**
  407. * Decode Simple/Main Profiles sequence header
  408. * @see Figure 7-8, p16-17
  409. * @param avctx Codec context
  410. * @param gb GetBit context initialized from Codec context extra_data
  411. * @return Status
  412. */
  413. int ff_vc1_decode_sequence_header(AVCodecContext *avctx, VC1Context *v, GetBitContext *gb);
  414. int ff_vc1_decode_entry_point(AVCodecContext *avctx, VC1Context *v, GetBitContext *gb);
  415. int ff_vc1_parse_frame_header (VC1Context *v, GetBitContext *gb);
  416. int ff_vc1_parse_frame_header_adv(VC1Context *v, GetBitContext *gb);
  417. int ff_vc1_init_common(VC1Context *v);
  418. int ff_vc1_decode_init_alloc_tables(VC1Context *v);
  419. void ff_vc1_init_transposed_scantables(VC1Context *v);
  420. int ff_vc1_decode_end(AVCodecContext *avctx);
  421. void ff_vc1_decode_blocks(VC1Context *v);
  422. #endif /* AVCODEC_VC1_H */