You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

276 lines
8.2KB

  1. /*
  2. * MPEG-4 encoder/decoder internal header.
  3. * Copyright (c) 2000,2001 Fabrice Bellard
  4. * Copyright (c) 2002-2010 Michael Niedermayer <michaelni@gmx.at>
  5. *
  6. * This file is part of FFmpeg.
  7. *
  8. * FFmpeg is free software; you can redistribute it and/or
  9. * modify it under the terms of the GNU Lesser General Public
  10. * License as published by the Free Software Foundation; either
  11. * version 2.1 of the License, or (at your option) any later version.
  12. *
  13. * FFmpeg is distributed in the hope that it will be useful,
  14. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  16. * Lesser General Public License for more details.
  17. *
  18. * You should have received a copy of the GNU Lesser General Public
  19. * License along with FFmpeg; if not, write to the Free Software
  20. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21. */
  22. #ifndef AVCODEC_MPEG4VIDEO_H
  23. #define AVCODEC_MPEG4VIDEO_H
  24. #include <stdint.h>
  25. #include "get_bits.h"
  26. #include "mpegvideo.h"
  27. #include "rl.h"
  28. // shapes
  29. #define RECT_SHAPE 0
  30. #define BIN_SHAPE 1
  31. #define BIN_ONLY_SHAPE 2
  32. #define GRAY_SHAPE 3
  33. #define SIMPLE_VO_TYPE 1
  34. #define CORE_VO_TYPE 3
  35. #define MAIN_VO_TYPE 4
  36. #define NBIT_VO_TYPE 5
  37. #define ARTS_VO_TYPE 10
  38. #define ACE_VO_TYPE 12
  39. #define SIMPLE_STUDIO_VO_TYPE 14
  40. #define CORE_STUDIO_VO_TYPE 15
  41. #define ADV_SIMPLE_VO_TYPE 17
  42. #define VOT_VIDEO_ID 1
  43. #define VOT_STILL_TEXTURE_ID 2
  44. // aspect_ratio_info
  45. #define EXTENDED_PAR 15
  46. //vol_sprite_usage / sprite_enable
  47. #define STATIC_SPRITE 1
  48. #define GMC_SPRITE 2
  49. #define MOTION_MARKER 0x1F001
  50. #define DC_MARKER 0x6B001
  51. #define VOS_STARTCODE 0x1B0
  52. #define USER_DATA_STARTCODE 0x1B2
  53. #define GOP_STARTCODE 0x1B3
  54. #define VISUAL_OBJ_STARTCODE 0x1B5
  55. #define VOP_STARTCODE 0x1B6
  56. #define SLICE_STARTCODE 0x1B7
  57. #define EXT_STARTCODE 0x1B8
  58. #define QUANT_MATRIX_EXT_ID 0x3
  59. /* smaller packets likely don't contain a real frame */
  60. #define MAX_NVOP_SIZE 19
  61. typedef struct Mpeg4DecContext {
  62. MpegEncContext m;
  63. /// number of bits to represent the fractional part of time
  64. int time_increment_bits;
  65. int shape;
  66. int vol_sprite_usage;
  67. int sprite_brightness_change;
  68. int num_sprite_warping_points;
  69. /// sprite trajectory points
  70. uint16_t sprite_traj[4][2];
  71. /// sprite shift [isChroma]
  72. int sprite_shift[2];
  73. // reversible vlc
  74. int rvlc;
  75. /// could this stream contain resync markers
  76. int resync_marker;
  77. /// time distance of first I -> B, used for interlaced B-frames
  78. int t_frame;
  79. int new_pred;
  80. int enhancement_type;
  81. int scalability;
  82. int use_intra_dc_vlc;
  83. /// QP above which the ac VLC should be used for intra dc
  84. int intra_dc_threshold;
  85. /* bug workarounds */
  86. int divx_version;
  87. int divx_build;
  88. int xvid_build;
  89. int lavc_build;
  90. /// flag for having shown the warning about invalid Divx B-frames
  91. int showed_packed_warning;
  92. /** does the stream contain the low_delay flag,
  93. * used to work around buggy encoders. */
  94. int vol_control_parameters;
  95. int cplx_estimation_trash_i;
  96. int cplx_estimation_trash_p;
  97. int cplx_estimation_trash_b;
  98. int rgb;
  99. } Mpeg4DecContext;
  100. static const uint8_t mpeg4_block_count[4] = {0, 6, 8, 12};
  101. /* dc encoding for MPEG-4 */
  102. extern const uint8_t ff_mpeg4_DCtab_lum[13][2];
  103. extern const uint8_t ff_mpeg4_DCtab_chrom[13][2];
  104. extern const uint16_t ff_mpeg4_intra_vlc[103][2];
  105. extern const int8_t ff_mpeg4_intra_level[102];
  106. extern const int8_t ff_mpeg4_intra_run[102];
  107. extern RLTable ff_mpeg4_rl_intra;
  108. /* Note this is identical to the intra rvlc except that it is reordered. */
  109. extern RLTable ff_rvlc_rl_inter;
  110. extern RLTable ff_rvlc_rl_intra;
  111. extern const uint8_t ff_sprite_trajectory_lens[15];
  112. extern const uint8_t ff_mb_type_b_tab[4][2];
  113. /* these matrixes will be permuted for the idct */
  114. extern const int16_t ff_mpeg4_default_intra_matrix[64];
  115. extern const int16_t ff_mpeg4_default_non_intra_matrix[64];
  116. extern const uint8_t ff_mpeg4_y_dc_scale_table[32];
  117. extern const uint8_t ff_mpeg4_c_dc_scale_table[32];
  118. extern const uint16_t ff_mpeg4_resync_prefix[8];
  119. extern const uint8_t ff_mpeg4_dc_threshold[8];
  120. extern const uint8_t ff_mpeg4_studio_dc_luma[19][2];
  121. extern const uint8_t ff_mpeg4_studio_dc_chroma[19][2];
  122. extern const uint8_t ff_mpeg4_studio_intra[12][24][2];
  123. void ff_mpeg4_encode_mb(MpegEncContext *s,
  124. int16_t block[6][64],
  125. int motion_x, int motion_y);
  126. void ff_mpeg4_pred_ac(MpegEncContext *s, int16_t *block, int n,
  127. int dir);
  128. void ff_set_mpeg4_time(MpegEncContext *s);
  129. int ff_mpeg4_encode_picture_header(MpegEncContext *s, int picture_number);
  130. int ff_mpeg4_decode_picture_header(Mpeg4DecContext *ctx, GetBitContext *gb, int header);
  131. void ff_mpeg4_encode_video_packet_header(MpegEncContext *s);
  132. void ff_mpeg4_clean_buffers(MpegEncContext *s);
  133. void ff_mpeg4_stuffing(PutBitContext *pbc);
  134. void ff_mpeg4_init_partitions(MpegEncContext *s);
  135. void ff_mpeg4_merge_partitions(MpegEncContext *s);
  136. void ff_clean_mpeg4_qscales(MpegEncContext *s);
  137. int ff_mpeg4_decode_partitions(Mpeg4DecContext *ctx);
  138. int ff_mpeg4_get_video_packet_prefix_length(MpegEncContext *s);
  139. int ff_mpeg4_decode_video_packet_header(Mpeg4DecContext *ctx);
  140. int ff_mpeg4_decode_studio_slice_header(Mpeg4DecContext *ctx);
  141. void ff_mpeg4_init_direct_mv(MpegEncContext *s);
  142. void ff_mpeg4videodec_static_init(void);
  143. int ff_mpeg4_workaround_bugs(AVCodecContext *avctx);
  144. int ff_mpeg4_frame_end(AVCodecContext *avctx, const uint8_t *buf, int buf_size);
  145. /**
  146. * @return the mb_type
  147. */
  148. int ff_mpeg4_set_direct_mv(MpegEncContext *s, int mx, int my);
  149. extern uint8_t ff_mpeg4_static_rl_table_store[3][2][2 * MAX_RUN + MAX_LEVEL + 3];
  150. #if 0 //3IV1 is quite rare and it slows things down a tiny bit
  151. #define IS_3IV1 s->codec_tag == AV_RL32("3IV1")
  152. #else
  153. #define IS_3IV1 0
  154. #endif
  155. /**
  156. * Predict the dc.
  157. * encoding quantized level -> quantized diff
  158. * decoding quantized diff -> quantized level
  159. * @param n block index (0-3 are luma, 4-5 are chroma)
  160. * @param dir_ptr pointer to an integer where the prediction direction will be stored
  161. */
  162. static inline int ff_mpeg4_pred_dc(MpegEncContext *s, int n, int level,
  163. int *dir_ptr, int encoding)
  164. {
  165. int a, b, c, wrap, pred, scale, ret;
  166. int16_t *dc_val;
  167. /* find prediction */
  168. if (n < 4)
  169. scale = s->y_dc_scale;
  170. else
  171. scale = s->c_dc_scale;
  172. if (IS_3IV1)
  173. scale = 8;
  174. wrap = s->block_wrap[n];
  175. dc_val = s->dc_val[0] + s->block_index[n];
  176. /* B C
  177. * A X
  178. */
  179. a = dc_val[-1];
  180. b = dc_val[-1 - wrap];
  181. c = dc_val[-wrap];
  182. /* outside slice handling (we can't do that by memset as we need the
  183. * dc for error resilience) */
  184. if (s->first_slice_line && n != 3) {
  185. if (n != 2)
  186. b = c = 1024;
  187. if (n != 1 && s->mb_x == s->resync_mb_x)
  188. b = a = 1024;
  189. }
  190. if (s->mb_x == s->resync_mb_x && s->mb_y == s->resync_mb_y + 1) {
  191. if (n == 0 || n == 4 || n == 5)
  192. b = 1024;
  193. }
  194. if (abs(a - b) < abs(b - c)) {
  195. pred = c;
  196. *dir_ptr = 1; /* top */
  197. } else {
  198. pred = a;
  199. *dir_ptr = 0; /* left */
  200. }
  201. /* we assume pred is positive */
  202. pred = FASTDIV((pred + (scale >> 1)), scale);
  203. if (encoding) {
  204. ret = level - pred;
  205. } else {
  206. level += pred;
  207. ret = level;
  208. }
  209. level *= scale;
  210. if (level & (~2047)) {
  211. if (!s->encoding && (s->avctx->err_recognition & (AV_EF_BITSTREAM | AV_EF_AGGRESSIVE))) {
  212. if (level < 0) {
  213. av_log(s->avctx, AV_LOG_ERROR,
  214. "dc<0 at %dx%d\n", s->mb_x, s->mb_y);
  215. return AVERROR_INVALIDDATA;
  216. }
  217. if (level > 2048 + scale) {
  218. av_log(s->avctx, AV_LOG_ERROR,
  219. "dc overflow at %dx%d\n", s->mb_x, s->mb_y);
  220. return AVERROR_INVALIDDATA;
  221. }
  222. }
  223. if (level < 0)
  224. level = 0;
  225. else if (!(s->workaround_bugs & FF_BUG_DC_CLIP))
  226. level = 2047;
  227. }
  228. dc_val[0] = level;
  229. return ret;
  230. }
  231. #endif /* AVCODEC_MPEG4VIDEO_H */