You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

3441 lines
109KB

  /*
   * copyright (c) 2001 Fabrice Bellard
   *
   * This file is part of FFmpeg.
   *
   * FFmpeg is free software; you can redistribute it and/or
   * modify it under the terms of the GNU Lesser General Public
   * License as published by the Free Software Foundation; either
   * version 2.1 of the License, or (at your option) any later version.
   *
   * FFmpeg is distributed in the hope that it will be useful,
   * but WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
   * Lesser General Public License for more details.
   *
   * You should have received a copy of the GNU Lesser General Public
   * License along with FFmpeg; if not, write to the Free Software
   * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
   */
  20. #ifndef AVCODEC_AVCODEC_H
  21. #define AVCODEC_AVCODEC_H
  /**
   * @file libavcodec/avcodec.h
   * external API header
   */
  #include <errno.h>
  #include <stdint.h>
  #include "libavutil/avutil.h"
  /*
   * Library version components. LIBAVCODEC_VERSION_INT and LIBAVCODEC_VERSION
   * combine them through AV_VERSION_INT() / AV_VERSION(), which are not defined
   * in this header.
   */
  #define LIBAVCODEC_VERSION_MAJOR 52
  #define LIBAVCODEC_VERSION_MINOR 22
  #define LIBAVCODEC_VERSION_MICRO  0

  #define LIBAVCODEC_VERSION_INT  AV_VERSION_INT(LIBAVCODEC_VERSION_MAJOR, \
                                                 LIBAVCODEC_VERSION_MINOR, \
                                                 LIBAVCODEC_VERSION_MICRO)
  #define LIBAVCODEC_VERSION      AV_VERSION(LIBAVCODEC_VERSION_MAJOR,   \
                                             LIBAVCODEC_VERSION_MINOR,   \
                                             LIBAVCODEC_VERSION_MICRO)
  #define LIBAVCODEC_BUILD        LIBAVCODEC_VERSION_INT

  /* Identification string: "Lavc" followed by the stringified version. */
  #define LIBAVCODEC_IDENT        "Lavc" AV_STRINGIFY(LIBAVCODEC_VERSION)

  /*
   * 64-bit value with only the sign bit set.
   *
   * The hexadecimal constant 0x8000000000000000 does not fit in a signed 64-bit
   * type, so a signed-suffixed spelling (INT64_C) ends up with an unsigned type
   * and tests such as "x < AV_NOPTS_VALUE" or "AV_NOPTS_VALUE < 0" misbehave.
   * Build the bit pattern as unsigned and convert it explicitly so the macro
   * has type int64_t (value INT64_MIN on two's-complement targets).
   */
  #define AV_NOPTS_VALUE          ((int64_t)UINT64_C(0x8000000000000000))

  /* AV_TIME_BASE as an integer, and its reciprocal as an AVRational. */
  #define AV_TIME_BASE            1000000
  #define AV_TIME_BASE_Q          (AVRational){1, AV_TIME_BASE}
  /**
   * Identifies the syntax and semantics of the bitstream.
   * The principle is roughly:
   * Two decoders with the same ID can decode the same streams.
   * Two encoders with the same ID can encode compatible streams.
   * There may be slight deviations from the principle due to implementation
   * details.
   *
   * If you add a codec ID to this list, add it so that
   * 1. no value of an existing codec ID changes (that would break ABI),
   * 2. it is as close as possible to similar codecs.
   *
   * Video IDs count up from CODEC_ID_NONE (0); every later family restarts
   * at the explicit base value given on its first enumerator.
   */
  enum CodecID {
      CODEC_ID_NONE,

      /* video codecs */
      CODEC_ID_MPEG1VIDEO,
      CODEC_ID_MPEG2VIDEO, ///< preferred ID for MPEG-1/2 video decoding
      CODEC_ID_MPEG2VIDEO_XVMC,
      CODEC_ID_H261,
      CODEC_ID_H263,
      CODEC_ID_RV10,
      CODEC_ID_RV20,
      CODEC_ID_MJPEG,
      CODEC_ID_MJPEGB,
      CODEC_ID_LJPEG,
      CODEC_ID_SP5X,
      CODEC_ID_JPEGLS,
      CODEC_ID_MPEG4,
      CODEC_ID_RAWVIDEO,
      CODEC_ID_MSMPEG4V1,
      CODEC_ID_MSMPEG4V2,
      CODEC_ID_MSMPEG4V3,
      CODEC_ID_WMV1,
      CODEC_ID_WMV2,
      CODEC_ID_H263P,
      CODEC_ID_H263I,
      CODEC_ID_FLV1,
      CODEC_ID_SVQ1,
      CODEC_ID_SVQ3,
      CODEC_ID_DVVIDEO,
      CODEC_ID_HUFFYUV,
      CODEC_ID_CYUV,
      CODEC_ID_H264,
      CODEC_ID_INDEO3,
      CODEC_ID_VP3,
      CODEC_ID_THEORA,
      CODEC_ID_ASV1,
      CODEC_ID_ASV2,
      CODEC_ID_FFV1,
      CODEC_ID_4XM,
      CODEC_ID_VCR1,
      CODEC_ID_CLJR,
      CODEC_ID_MDEC,
      CODEC_ID_ROQ,
      CODEC_ID_INTERPLAY_VIDEO,
      CODEC_ID_XAN_WC3,
      CODEC_ID_XAN_WC4,
      CODEC_ID_RPZA,
      CODEC_ID_CINEPAK,
      CODEC_ID_WS_VQA,
      CODEC_ID_MSRLE,
      CODEC_ID_MSVIDEO1,
      CODEC_ID_IDCIN,
      CODEC_ID_8BPS,
      CODEC_ID_SMC,
      CODEC_ID_FLIC,
      CODEC_ID_TRUEMOTION1,
      CODEC_ID_VMDVIDEO,
      CODEC_ID_MSZH,
      CODEC_ID_ZLIB,
      CODEC_ID_QTRLE,
      CODEC_ID_SNOW,
      CODEC_ID_TSCC,
      CODEC_ID_ULTI,
      CODEC_ID_QDRAW,
      CODEC_ID_VIXL,
      CODEC_ID_QPEG,
      CODEC_ID_XVID,
      CODEC_ID_PNG,
      CODEC_ID_PPM,
      CODEC_ID_PBM,
      CODEC_ID_PGM,
      CODEC_ID_PGMYUV,
      CODEC_ID_PAM,
      CODEC_ID_FFVHUFF,
      CODEC_ID_RV30,
      CODEC_ID_RV40,
      CODEC_ID_VC1,
      CODEC_ID_WMV3,
      CODEC_ID_LOCO,
      CODEC_ID_WNV1,
      CODEC_ID_AASC,
      CODEC_ID_INDEO2,
      CODEC_ID_FRAPS,
      CODEC_ID_TRUEMOTION2,
      CODEC_ID_BMP,
      CODEC_ID_CSCD,
      CODEC_ID_MMVIDEO,
      CODEC_ID_ZMBV,
      CODEC_ID_AVS,
      CODEC_ID_SMACKVIDEO,
      CODEC_ID_NUV,
      CODEC_ID_KMVC,
      CODEC_ID_FLASHSV,
      CODEC_ID_CAVS,
      CODEC_ID_JPEG2000,
      CODEC_ID_VMNC,
      CODEC_ID_VP5,
      CODEC_ID_VP6,
      CODEC_ID_VP6F,
      CODEC_ID_TARGA,
      CODEC_ID_DSICINVIDEO,
      CODEC_ID_TIERTEXSEQVIDEO,
      CODEC_ID_TIFF,
      CODEC_ID_GIF,
      CODEC_ID_FFH264,
      CODEC_ID_DXA,
      CODEC_ID_DNXHD,
      CODEC_ID_THP,
      CODEC_ID_SGI,
      CODEC_ID_C93,
      CODEC_ID_BETHSOFTVID,
      CODEC_ID_PTX,
      CODEC_ID_TXD,
      CODEC_ID_VP6A,
      CODEC_ID_AMV,
      CODEC_ID_VB,
      CODEC_ID_PCX,
      CODEC_ID_SUNRAST,
      CODEC_ID_INDEO4,
      CODEC_ID_INDEO5,
      CODEC_ID_MIMIC,
      CODEC_ID_RL2,
      CODEC_ID_8SVX_EXP,
      CODEC_ID_8SVX_FIB,
      CODEC_ID_ESCAPE124,
      CODEC_ID_DIRAC,
      CODEC_ID_BFI,
      CODEC_ID_CMV,
      CODEC_ID_MOTIONPIXELS,
      CODEC_ID_TGV,
      CODEC_ID_TGQ,
      CODEC_ID_TQI,

      /* various PCM "codecs" */
      CODEC_ID_PCM_S16LE= 0x10000,
      CODEC_ID_PCM_S16BE,
      CODEC_ID_PCM_U16LE,
      CODEC_ID_PCM_U16BE,
      CODEC_ID_PCM_S8,
      CODEC_ID_PCM_U8,
      CODEC_ID_PCM_MULAW,
      CODEC_ID_PCM_ALAW,
      CODEC_ID_PCM_S32LE,
      CODEC_ID_PCM_S32BE,
      CODEC_ID_PCM_U32LE,
      CODEC_ID_PCM_U32BE,
      CODEC_ID_PCM_S24LE,
      CODEC_ID_PCM_S24BE,
      CODEC_ID_PCM_U24LE,
      CODEC_ID_PCM_U24BE,
      CODEC_ID_PCM_S24DAUD,
      CODEC_ID_PCM_ZORK,
      CODEC_ID_PCM_S16LE_PLANAR,
      CODEC_ID_PCM_DVD,
      CODEC_ID_PCM_F32BE,
      CODEC_ID_PCM_F32LE,
      CODEC_ID_PCM_F64BE,
      CODEC_ID_PCM_F64LE,

      /* various ADPCM codecs */
      CODEC_ID_ADPCM_IMA_QT= 0x11000,
      CODEC_ID_ADPCM_IMA_WAV,
      CODEC_ID_ADPCM_IMA_DK3,
      CODEC_ID_ADPCM_IMA_DK4,
      CODEC_ID_ADPCM_IMA_WS,
      CODEC_ID_ADPCM_IMA_SMJPEG,
      CODEC_ID_ADPCM_MS,
      CODEC_ID_ADPCM_4XM,
      CODEC_ID_ADPCM_XA,
      CODEC_ID_ADPCM_ADX,
      CODEC_ID_ADPCM_EA,
      CODEC_ID_ADPCM_G726,
      CODEC_ID_ADPCM_CT,
      CODEC_ID_ADPCM_SWF,
      CODEC_ID_ADPCM_YAMAHA,
      CODEC_ID_ADPCM_SBPRO_4,
      CODEC_ID_ADPCM_SBPRO_3,
      CODEC_ID_ADPCM_SBPRO_2,
      CODEC_ID_ADPCM_THP,
      CODEC_ID_ADPCM_IMA_AMV,
      CODEC_ID_ADPCM_EA_R1,
      CODEC_ID_ADPCM_EA_R3,
      CODEC_ID_ADPCM_EA_R2,
      CODEC_ID_ADPCM_IMA_EA_SEAD,
      CODEC_ID_ADPCM_IMA_EA_EACS,
      CODEC_ID_ADPCM_EA_XAS,
      CODEC_ID_ADPCM_EA_MAXIS_XA,
      CODEC_ID_ADPCM_IMA_ISS,

      /* AMR */
      CODEC_ID_AMR_NB= 0x12000,
      CODEC_ID_AMR_WB,

      /* RealAudio codecs*/
      CODEC_ID_RA_144= 0x13000,
      CODEC_ID_RA_288,

      /* various DPCM codecs */
      CODEC_ID_ROQ_DPCM= 0x14000,
      CODEC_ID_INTERPLAY_DPCM,
      CODEC_ID_XAN_DPCM,
      CODEC_ID_SOL_DPCM,

      /* audio codecs */
      CODEC_ID_MP2= 0x15000,
      CODEC_ID_MP3, ///< preferred ID for decoding MPEG audio layer 1, 2 or 3
      CODEC_ID_AAC,
      CODEC_ID_AC3,
      CODEC_ID_DTS,
      CODEC_ID_VORBIS,
      CODEC_ID_DVAUDIO,
      CODEC_ID_WMAV1,
      CODEC_ID_WMAV2,
      CODEC_ID_MACE3,
      CODEC_ID_MACE6,
      CODEC_ID_VMDAUDIO,
      CODEC_ID_SONIC,
      CODEC_ID_SONIC_LS,
      CODEC_ID_FLAC,
      CODEC_ID_MP3ADU,
      CODEC_ID_MP3ON4,
      CODEC_ID_SHORTEN,
      CODEC_ID_ALAC,
      CODEC_ID_WESTWOOD_SND1,
      CODEC_ID_GSM, ///< as in Berlin toast format
      CODEC_ID_QDM2,
      CODEC_ID_COOK,
      CODEC_ID_TRUESPEECH,
      CODEC_ID_TTA,
      CODEC_ID_SMACKAUDIO,
      CODEC_ID_QCELP,
      CODEC_ID_WAVPACK,
      CODEC_ID_DSICINAUDIO,
      CODEC_ID_IMC,
      CODEC_ID_MUSEPACK7,
      CODEC_ID_MLP,
      CODEC_ID_GSM_MS, /* as found in WAV */
      CODEC_ID_ATRAC3,
      CODEC_ID_VOXWARE,
      CODEC_ID_APE,
      CODEC_ID_NELLYMOSER,
      CODEC_ID_MUSEPACK8,
      CODEC_ID_SPEEX,
      CODEC_ID_WMAVOICE,
      CODEC_ID_WMAPRO,
      CODEC_ID_WMALOSSLESS,
      CODEC_ID_ATRAC3P,
      CODEC_ID_EAC3,
      CODEC_ID_SIPR,
      CODEC_ID_MP1,
      CODEC_ID_TWINVQ,
      CODEC_ID_TRUEHD,

      /* subtitle codecs */
      CODEC_ID_DVD_SUBTITLE= 0x17000,
      CODEC_ID_DVB_SUBTITLE,
      CODEC_ID_TEXT, ///< raw UTF-8 text
      CODEC_ID_XSUB,
      CODEC_ID_SSA,
      CODEC_ID_MOV_TEXT,

      /* other specific kind of codecs (generally used for attachments) */
      CODEC_ID_TTF= 0x18000,

      CODEC_ID_PROBE= 0x19000, ///< codec_id is not known (like CODEC_ID_NONE) but lavf should attempt to identify it

      CODEC_ID_MPEG2TS= 0x20000, /**< _FAKE_ codec to indicate a raw MPEG-2 TS
                                  * stream (only used by libavformat) */
  };
  /**
   * Kind of data a stream carries.
   * CODEC_TYPE_UNKNOWN is -1; the remaining values count up from 0, and
   * CODEC_TYPE_NB, being last, equals the number of non-negative entries.
   */
  enum CodecType {
      CODEC_TYPE_UNKNOWN = -1,
      CODEC_TYPE_VIDEO,
      CODEC_TYPE_AUDIO,
      CODEC_TYPE_DATA,
      CODEC_TYPE_SUBTITLE,
      CODEC_TYPE_ATTACHMENT,
      CODEC_TYPE_NB
  };
  /**
   * Audio sample formats.
   * all in native-endian format
   */
  enum SampleFormat {
      SAMPLE_FMT_NONE = -1,
      SAMPLE_FMT_U8,              ///< unsigned 8 bits
      SAMPLE_FMT_S16,             ///< signed 16 bits
      SAMPLE_FMT_S32,             ///< signed 32 bits
      SAMPLE_FMT_FLT,             ///< float
      SAMPLE_FMT_DBL,             ///< double
      SAMPLE_FMT_NB               ///< Number of sample formats. DO NOT USE if dynamically linking to libavcodec
  };
  /* Audio channel masks: every CH_* constant below is a distinct single bit. */
  #define CH_FRONT_LEFT             0x00000001
  #define CH_FRONT_RIGHT            0x00000002
  #define CH_FRONT_CENTER           0x00000004
  #define CH_LOW_FREQUENCY          0x00000008
  #define CH_BACK_LEFT              0x00000010
  #define CH_BACK_RIGHT             0x00000020
  #define CH_FRONT_LEFT_OF_CENTER   0x00000040
  #define CH_FRONT_RIGHT_OF_CENTER  0x00000080
  #define CH_BACK_CENTER            0x00000100
  #define CH_SIDE_LEFT              0x00000200
  #define CH_SIDE_RIGHT             0x00000400
  #define CH_TOP_CENTER             0x00000800
  #define CH_TOP_FRONT_LEFT         0x00001000
  #define CH_TOP_FRONT_CENTER       0x00002000
  #define CH_TOP_FRONT_RIGHT        0x00004000
  #define CH_TOP_BACK_LEFT          0x00008000
  #define CH_TOP_BACK_CENTER        0x00010000
  #define CH_TOP_BACK_RIGHT         0x00020000
  #define CH_STEREO_LEFT            0x20000000  ///< Stereo downmix.
  #define CH_STEREO_RIGHT           0x40000000  ///< See CH_STEREO_LEFT.

  /* Audio channel convenience macros: bitwise ORs of the masks above. */
  #define CH_LAYOUT_MONO              (CH_FRONT_CENTER)
  #define CH_LAYOUT_STEREO            (CH_FRONT_LEFT|CH_FRONT_RIGHT)
  #define CH_LAYOUT_SURROUND          (CH_LAYOUT_STEREO|CH_FRONT_CENTER)
  #define CH_LAYOUT_QUAD              (CH_LAYOUT_STEREO|CH_BACK_LEFT|CH_BACK_RIGHT)
  #define CH_LAYOUT_5POINT0           (CH_LAYOUT_SURROUND|CH_SIDE_LEFT|CH_SIDE_RIGHT)
  #define CH_LAYOUT_5POINT1           (CH_LAYOUT_5POINT0|CH_LOW_FREQUENCY)
  #define CH_LAYOUT_7POINT1           (CH_LAYOUT_5POINT1|CH_BACK_LEFT|CH_BACK_RIGHT)
  #define CH_LAYOUT_7POINT1_WIDE      (CH_LAYOUT_SURROUND|CH_LOW_FREQUENCY|\
                                       CH_BACK_LEFT|CH_BACK_RIGHT|\
                                       CH_FRONT_LEFT_OF_CENTER|CH_FRONT_RIGHT_OF_CENTER)
  #define CH_LAYOUT_STEREO_DOWNMIX    (CH_STEREO_LEFT|CH_STEREO_RIGHT)
  /* in bytes */
  #define AVCODEC_MAX_AUDIO_FRAME_SIZE 192000 // 1 second of 48khz 32bit audio

  /**
   * Required number of additionally allocated bytes at the end of the input bitstream for decoding.
   * This is mainly needed because some optimized bitstream readers read
   * 32 or 64 bit at once and could read over the end.<br>
   * Note: If the first 23 bits of the additional bytes are not 0, then damaged
   * MPEG bitstreams could cause overread and segfault.
   */
  #define FF_INPUT_BUFFER_PADDING_SIZE 8

  /**
   * minimum encoding buffer size
   * Used to avoid some checks during header writing.
   */
  #define FF_MIN_BUFFER_SIZE 16384
  /**
   * motion estimation type.
   * Values start at 1 (ME_ZERO) and increase by one per entry.
   */
  enum Motion_Est_ID {
      ME_ZERO = 1,    ///< no search, that is use 0,0 vector whenever one is needed
      ME_FULL,
      ME_LOG,
      ME_PHODS,
      ME_EPZS,        ///< enhanced predictive zonal search
      ME_X1,          ///< reserved for experiments
      ME_HEX,         ///< hexagon based search
      ME_UMH,         ///< uneven multi-hexagon search
      ME_ITER,        ///< iterative search
      ME_TESA,        ///< transformed exhaustive search algorithm
  };
  /**
   * Discard levels, ordered from "discard nothing" to "discard all".
   */
  enum AVDiscard{
      /* We leave some space between them for extensions (drop some
       * keyframes for intra-only or drop just some bidir frames). */
      AVDISCARD_NONE   =-16, ///< discard nothing
      AVDISCARD_DEFAULT=  0, ///< discard useless packets like 0 size packets in avi
      AVDISCARD_NONREF =  8, ///< discard all non reference
      AVDISCARD_BIDIR  = 16, ///< discard all bidirectional frames
      AVDISCARD_NONKEY = 32, ///< discard all frames except keyframes
      AVDISCARD_ALL    = 48, ///< discard all
  };
  /**
   * Override record covering the frame range start_frame..end_frame.
   * Either qscale or, when qscale is 0, quality_factor applies.
   */
  typedef struct RcOverride{
      int start_frame;
      int end_frame;
      int qscale; // If this is 0 then quality_factor will be used instead.
      float quality_factor;
  } RcOverride;
  #define FF_MAX_B_FRAMES 16

  /* encoding support
     These flags can be passed in AVCodecContext.flags before initialization.
     Note: Not everything is supported yet.
  */

  #define CODEC_FLAG_QSCALE 0x0002  ///< Use fixed qscale.
  #define CODEC_FLAG_4MV    0x0004  ///< 4 MV per MB allowed / advanced prediction for H.263.
  #define CODEC_FLAG_QPEL   0x0010  ///< Use qpel MC.
  #define CODEC_FLAG_GMC    0x0020  ///< Use GMC.
  #define CODEC_FLAG_MV0    0x0040  ///< Always try a MB with MV=<0,0>.
  #define CODEC_FLAG_PART   0x0080  ///< Use data partitioning.
  /**
   * The parent program guarantees that the input for B-frames containing
   * streams is not written to for at least s->max_b_frames+1 frames, if
   * this is not set the input will be copied.
   */
  #define CODEC_FLAG_INPUT_PRESERVED 0x0100
  #define CODEC_FLAG_PASS1           0x0200   ///< Use internal 2pass ratecontrol in first pass mode.
  #define CODEC_FLAG_PASS2           0x0400   ///< Use internal 2pass ratecontrol in second pass mode.
  #define CODEC_FLAG_EXTERN_HUFF     0x1000   ///< Use external Huffman table (for MJPEG).
  #define CODEC_FLAG_GRAY            0x2000   ///< Only decode/encode grayscale.
  #define CODEC_FLAG_EMU_EDGE        0x4000   ///< Don't draw edges.
  #define CODEC_FLAG_PSNR            0x8000   ///< error[?] variables will be set during encoding.
  /**
   * Input bitstream might be truncated at a random
   * location instead of only at frame boundaries.
   */
  #define CODEC_FLAG_TRUNCATED       0x00010000
  #define CODEC_FLAG_NORMALIZE_AQP   0x00020000 ///< Normalize adaptive quantization.
  #define CODEC_FLAG_INTERLACED_DCT  0x00040000 ///< Use interlaced DCT.
  #define CODEC_FLAG_LOW_DELAY       0x00080000 ///< Force low delay.
  #define CODEC_FLAG_ALT_SCAN        0x00100000 ///< Use alternate scan.
  #define CODEC_FLAG_GLOBAL_HEADER   0x00400000 ///< Place global headers in extradata instead of every keyframe.
  #define CODEC_FLAG_BITEXACT        0x00800000 ///< Use only bitexact stuff (except (I)DCT).
  /* Fx : Flag for h263+ extra options */
  #define CODEC_FLAG_AC_PRED         0x01000000 ///< H.263 advanced intra coding / MPEG-4 AC prediction
  #define CODEC_FLAG_H263P_UMV       0x02000000 ///< unlimited motion vector
  #define CODEC_FLAG_CBP_RD          0x04000000 ///< Use rate distortion optimization for cbp.
  #define CODEC_FLAG_QP_RD           0x08000000 ///< Use rate distortion optimization for qp selection.
  #define CODEC_FLAG_H263P_AIV       0x00000008 ///< H.263 alternative inter VLC
  #define CODEC_FLAG_OBMC            0x00000001 ///< OBMC
  #define CODEC_FLAG_LOOP_FILTER     0x00000800 ///< loop filter
  #define CODEC_FLAG_H263P_SLICE_STRUCT 0x10000000
  #define CODEC_FLAG_INTERLACED_ME   0x20000000 ///< interlaced motion estimation
  #define CODEC_FLAG_SVCD_SCAN_OFFSET 0x40000000 ///< Will reserve space for SVCD scan offset user data.
  #define CODEC_FLAG_CLOSED_GOP      0x80000000

  /* Second flag set; its bit values overlap those of CODEC_FLAG_* above. */
  #define CODEC_FLAG2_FAST          0x00000001 ///< Allow non spec compliant speedup tricks.
  #define CODEC_FLAG2_STRICT_GOP    0x00000002 ///< Strictly enforce GOP size.
  #define CODEC_FLAG2_NO_OUTPUT     0x00000004 ///< Skip bitstream encoding.
  #define CODEC_FLAG2_LOCAL_HEADER  0x00000008 ///< Place global headers at every keyframe instead of in extradata.
  #define CODEC_FLAG2_BPYRAMID      0x00000010 ///< H.264 allow B-frames to be used as references.
  #define CODEC_FLAG2_WPRED         0x00000020 ///< H.264 weighted biprediction for B-frames
  #define CODEC_FLAG2_MIXED_REFS    0x00000040 ///< H.264 one reference per partition, as opposed to one reference per macroblock
  #define CODEC_FLAG2_8X8DCT        0x00000080 ///< H.264 high profile 8x8 transform
  #define CODEC_FLAG2_FASTPSKIP     0x00000100 ///< H.264 fast pskip
  #define CODEC_FLAG2_AUD           0x00000200 ///< H.264 access unit delimiters
  #define CODEC_FLAG2_BRDO          0x00000400 ///< B-frame rate-distortion optimization
  #define CODEC_FLAG2_INTRA_VLC     0x00000800 ///< Use MPEG-2 intra VLC table.
  #define CODEC_FLAG2_MEMC_ONLY     0x00001000 ///< Only do ME/MC (I frames -> ref, P frame -> ME+MC).
  #define CODEC_FLAG2_DROP_FRAME_TIMECODE 0x00002000 ///< timecode is in drop frame format.
  #define CODEC_FLAG2_SKIP_RD       0x00004000 ///< RD optimal MB level residual skipping
  #define CODEC_FLAG2_CHUNKS        0x00008000 ///< Input bitstream might be truncated at packet boundaries instead of only at frame boundaries.
  #define CODEC_FLAG2_NON_LINEAR_QUANT 0x00010000 ///< Use MPEG-2 nonlinear quantizer.
  #define CODEC_FLAG2_BIT_RESERVOIR 0x00020000 ///< Use a bit reservoir when encoding if possible

  /* Unsupported options :
   *              Syntax Arithmetic coding (SAC)
   *              Reference Picture Selection
   *              Independent Segment Decoding */
  /* /Fx */
  /* codec capabilities: one bit per capability */

  #define CODEC_CAP_DRAW_HORIZ_BAND 0x0001 ///< Decoder can use draw_horiz_band callback.
  /**
   * Codec uses get_buffer() for allocating buffers.
   * direct rendering method 1
   */
  #define CODEC_CAP_DR1             0x0002
  /* If 'parse_only' field is true, then avcodec_parse_frame() can be used. */
  #define CODEC_CAP_PARSE_ONLY      0x0004
  #define CODEC_CAP_TRUNCATED       0x0008
  /* Codec can export data for HW decoding (XvMC). */
  #define CODEC_CAP_HWACCEL         0x0010
  /**
   * Codec has a nonzero delay and needs to be fed with NULL at the end to get the delayed data.
   * If this is not set, the codec is guaranteed to never be fed with NULL data.
   */
  #define CODEC_CAP_DELAY           0x0020
  /**
   * Codec can be fed a final frame with a smaller size.
   * This can be used to prevent truncation of the last audio samples.
   */
  #define CODEC_CAP_SMALL_LAST_FRAME 0x0040
  /**
   * Codec can export data for HW decoding (VDPAU).
   */
  #define CODEC_CAP_HWACCEL_VDPAU    0x0080
  /* Macroblock type bits; MB_TYPE_L0, MB_TYPE_L1 and MB_TYPE_L0L1 are ORs of
   * the four MB_TYPE_PxLy bits. */
  //The following defines may change, don't expect compatibility if you use them.
  #define MB_TYPE_INTRA4x4   0x0001
  #define MB_TYPE_INTRA16x16 0x0002 //FIXME H.264-specific
  #define MB_TYPE_INTRA_PCM  0x0004 //FIXME H.264-specific
  #define MB_TYPE_16x16      0x0008
  #define MB_TYPE_16x8       0x0010
  #define MB_TYPE_8x16       0x0020
  #define MB_TYPE_8x8        0x0040
  #define MB_TYPE_INTERLACED 0x0080
  #define MB_TYPE_DIRECT2    0x0100 //FIXME
  #define MB_TYPE_ACPRED     0x0200
  #define MB_TYPE_GMC        0x0400
  #define MB_TYPE_SKIP       0x0800
  #define MB_TYPE_P0L0       0x1000
  #define MB_TYPE_P1L0       0x2000
  #define MB_TYPE_P0L1       0x4000
  #define MB_TYPE_P1L1       0x8000
  #define MB_TYPE_L0         (MB_TYPE_P0L0 | MB_TYPE_P1L0)
  #define MB_TYPE_L1         (MB_TYPE_P0L1 | MB_TYPE_P1L1)
  #define MB_TYPE_L0L1       (MB_TYPE_L0   | MB_TYPE_L1)
  #define MB_TYPE_QUANT      0x00010000
  #define MB_TYPE_CBP        0x00020000
  //Note bits 24-31 are reserved for codec specific use (h264 ref0, mpeg1 0mv, ...)
  /**
   * Pan Scan area.
   * This specifies the area which should be displayed.
   * Note there may be multiple such areas for one frame.
   */
  typedef struct AVPanScan{
      /**
       * id
       * - encoding: Set by user.
       * - decoding: Set by libavcodec.
       */
      int id;

      /**
       * width and height in 1/16 pel
       * - encoding: Set by user.
       * - decoding: Set by libavcodec.
       */
      int width;
      int height;

      /**
       * position of the top left corner in 1/16 pel for up to 3 fields/frames
       * (3 entries of 2 values each)
       * - encoding: Set by user.
       * - decoding: Set by libavcodec.
       */
      int16_t position[3][2];
  }AVPanScan;
  /*
   * Member list expanded inside AVFrame. Every line of the macro except the
   * last must end in a backslash; the last line must NOT, otherwise the
   * directive that follows would be spliced into the macro body.
   */
  #define FF_COMMON_FRAME \
      /**\
       * pointer to the picture planes.\
       * This might be different from the first allocated byte\
       * - encoding: \
       * - decoding: \
       */\
      uint8_t *data[4];\
      int linesize[4];\
      /**\
       * pointer to the first allocated byte of the picture. Can be used in get_buffer/release_buffer.\
       * This isn't used by libavcodec unless the default get/release_buffer() is used.\
       * - encoding: \
       * - decoding: \
       */\
      uint8_t *base[4];\
      /**\
       * 1 -> keyframe, 0-> not\
       * - encoding: Set by libavcodec.\
       * - decoding: Set by libavcodec.\
       */\
      int key_frame;\
  \
      /**\
       * Picture type of the frame, see ?_TYPE below.\
       * - encoding: Set by libavcodec. for coded_picture (and set by user for input).\
       * - decoding: Set by libavcodec.\
       */\
      int pict_type;\
  \
      /**\
       * presentation timestamp in time_base units (time when frame should be shown to user)\
       * If AV_NOPTS_VALUE then frame_rate = 1/time_base will be assumed.\
       * - encoding: MUST be set by user.\
       * - decoding: Set by libavcodec.\
       */\
      int64_t pts;\
  \
      /**\
       * picture number in bitstream order\
       * - encoding: set by\
       * - decoding: Set by libavcodec.\
       */\
      int coded_picture_number;\
      /**\
       * picture number in display order\
       * - encoding: set by\
       * - decoding: Set by libavcodec.\
       */\
      int display_picture_number;\
  \
      /**\
       * quality (between 1 (good) and FF_LAMBDA_MAX (bad)) \
       * - encoding: Set by libavcodec. for coded_picture (and set by user for input).\
       * - decoding: Set by libavcodec.\
       */\
      int quality; \
  \
      /**\
       * buffer age (1->was last buffer and didn't change, 2->..., ...).\
       * Set to INT_MAX if the buffer has not been used yet.\
       * - encoding: unused\
       * - decoding: MUST be set by get_buffer().\
       */\
      int age;\
  \
      /**\
       * is this picture used as reference\
       * The values for this are the same as the MpegEncContext.picture_structure\
       * variable, that is 1->top field, 2->bottom field, 3->frame/both fields.\
       * Set to 4 for delayed, non-reference frames.\
       * - encoding: unused\
       * - decoding: Set by libavcodec. (before get_buffer() call)).\
       */\
      int reference;\
  \
      /**\
       * QP table\
       * - encoding: unused\
       * - decoding: Set by libavcodec.\
       */\
      int8_t *qscale_table;\
      /**\
       * QP store stride\
       * - encoding: unused\
       * - decoding: Set by libavcodec.\
       */\
      int qstride;\
  \
      /**\
       * mbskip_table[mb]>=1 if MB didn't change\
       * stride= mb_width = (width+15)>>4\
       * - encoding: unused\
       * - decoding: Set by libavcodec.\
       */\
      uint8_t *mbskip_table;\
  \
      /**\
       * motion vector table\
       * @code\
       * example:\
       * int mv_sample_log2= 4 - motion_subsample_log2;\
       * int mb_width= (width+15)>>4;\
       * int mv_stride= (mb_width << mv_sample_log2) + 1;\
       * motion_val[direction][x + y*mv_stride][0->mv_x, 1->mv_y];\
       * @endcode\
       * - encoding: Set by user.\
       * - decoding: Set by libavcodec.\
       */\
      int16_t (*motion_val[2])[2];\
  \
      /**\
       * macroblock type table\
       * mb_type_base + mb_width + 2\
       * - encoding: Set by user.\
       * - decoding: Set by libavcodec.\
       */\
      uint32_t *mb_type;\
  \
      /**\
       * log2 of the size of the block which a single vector in motion_val represents: \
       * (4->16x16, 3->8x8, 2-> 4x4, 1-> 2x2)\
       * - encoding: unused\
       * - decoding: Set by libavcodec.\
       */\
      uint8_t motion_subsample_log2;\
  \
      /**\
       * for some private data of the user\
       * - encoding: unused\
       * - decoding: Set by user.\
       */\
      void *opaque;\
  \
      /**\
       * error\
       * - encoding: Set by libavcodec. if flags&CODEC_FLAG_PSNR.\
       * - decoding: unused\
       */\
      uint64_t error[4];\
  \
      /**\
       * type of the buffer (to keep track of who has to deallocate data[*])\
       * - encoding: Set by the one who allocates it.\
       * - decoding: Set by the one who allocates it.\
       * Note: User allocated (direct rendering) & internal buffers cannot coexist currently.\
       */\
      int type;\
  \
      /**\
       * When decoding, this signals how much the picture must be delayed.\
       * extra_delay = repeat_pict / (2*fps)\
       * - encoding: unused\
       * - decoding: Set by libavcodec.\
       */\
      int repeat_pict;\
  \
      /**\
       * \
       */\
      int qscale_type;\
  \
      /**\
       * The content of the picture is interlaced.\
       * - encoding: Set by user.\
       * - decoding: Set by libavcodec. (default 0)\
       */\
      int interlaced_frame;\
  \
      /**\
       * If the content is interlaced, is top field displayed first.\
       * - encoding: Set by user.\
       * - decoding: Set by libavcodec.\
       */\
      int top_field_first;\
  \
      /**\
       * Pan scan.\
       * - encoding: Set by user.\
       * - decoding: Set by libavcodec.\
       */\
      AVPanScan *pan_scan;\
  \
      /**\
       * Tell user application that palette has changed from previous frame.\
       * - encoding: ??? (no palette-enabled encoder yet)\
       * - decoding: Set by libavcodec. (default 0).\
       */\
      int palette_has_changed;\
  \
      /**\
       * codec suggestion on buffer type if != 0\
       * - encoding: unused\
       * - decoding: Set by libavcodec. (before get_buffer() call)).\
       */\
      int buffer_hints;\
  \
      /**\
       * DCT coefficients\
       * - encoding: unused\
       * - decoding: Set by libavcodec.\
       */\
      short *dct_coeff;\
  \
      /**\
       * motion reference frame index\
       * - encoding: Set by user.\
       * - decoding: Set by libavcodec.\
       */\
      int8_t *ref_index[2];\
  \
      /**\
       * reordered opaque 64bit number (generally a PTS) from AVCodecContext.reordered_opaque\
       * output in AVFrame.reordered_opaque\
       * - encoding: unused\
       * - decoding: Read by user.\
       */\
      int64_t reordered_opaque;\
  \
      /**\
       * hardware accelerator private data (FFmpeg allocated)\
       * - encoding: unused\
       * - decoding: Set by libavcodec\
       */\
      void *hwaccel_picture_private;
  /* FF_QSCALE_TYPE_* constants. */
  #define FF_QSCALE_TYPE_MPEG1 0
  #define FF_QSCALE_TYPE_MPEG2 1
  #define FF_QSCALE_TYPE_H264  2

  /* FF_BUFFER_TYPE_* constants: distinct single bits. */
  #define FF_BUFFER_TYPE_INTERNAL 1
  #define FF_BUFFER_TYPE_USER     2 ///< direct rendering buffers (image is (de)allocated by user)
  #define FF_BUFFER_TYPE_SHARED   4 ///< Buffer from somewhere else; don't deallocate image (data/base), all other tables are not shared.
  #define FF_BUFFER_TYPE_COPY     8 ///< Just a (modified) copy of some other buffer, don't deallocate anything.

  /* Picture types. */
  #define FF_I_TYPE  1 ///< Intra
  #define FF_P_TYPE  2 ///< Predicted
  #define FF_B_TYPE  3 ///< Bi-dir predicted
  #define FF_S_TYPE  4 ///< S(GMC)-VOP MPEG4
  #define FF_SI_TYPE 5 ///< Switching Intra
  #define FF_SP_TYPE 6 ///< Switching Predicted
  #define FF_BI_TYPE 7

  /* FF_BUFFER_HINTS_* constants: distinct single bits. */
  #define FF_BUFFER_HINTS_VALID    0x01 // Buffer hints value is meaningful (if 0 ignore).
  #define FF_BUFFER_HINTS_READABLE 0x02 // Codec will read from buffer.
  #define FF_BUFFER_HINTS_PRESERVE 0x04 // User must not alter buffer content.
  #define FF_BUFFER_HINTS_REUSABLE 0x08 // Codec will reuse the buffer (update).
  796. /**
  797. * Audio Video Frame.
  798. * New fields can be added to the end of FF_COMMON_FRAME with minor version
  799. * bumps.
  800. * Removal, reordering and changes to existing fields require a major
  801. * version bump. No fields should be added into AVFrame before or after
  802. * FF_COMMON_FRAME!
  803. * sizeof(AVFrame) must not be used outside libav*.
  804. */
  805. typedef struct AVFrame {
  806. FF_COMMON_FRAME
  807. } AVFrame;
  808. /**
  809. * main external API structure.
  810. * New fields can be added to the end with minor version bumps.
  811. * Removal, reordering and changes to existing fields require a major
  812. * version bump.
  813. * sizeof(AVCodecContext) must not be used outside libav*.
  814. */
  815. typedef struct AVCodecContext {
  816. /**
  817. * information on struct for av_log
  818. * - set by avcodec_alloc_context
  819. */
  820. const AVClass *av_class;
  821. /**
  822. * the average bitrate
  823. * - encoding: Set by user; unused for constant quantizer encoding.
  824. * - decoding: Set by libavcodec. 0 or some bitrate if this info is available in the stream.
  825. */
  826. int bit_rate;
  827. /**
  828. * number of bits the bitstream is allowed to diverge from the reference.
  829. * the reference can be CBR (for CBR pass1) or VBR (for pass2)
  830. * - encoding: Set by user; unused for constant quantizer encoding.
  831. * - decoding: unused
  832. */
  833. int bit_rate_tolerance;
  834. /**
  835. * CODEC_FLAG_*.
  836. * - encoding: Set by user.
  837. * - decoding: Set by user.
  838. */
  839. int flags;
  840. /**
  841. * Some codecs need additional format info. It is stored here.
  842. * If any muxer uses this then ALL demuxers/parsers AND encoders for the
  843. * specific codec MUST set it correctly otherwise stream copy breaks.
  844. * In general use of this field by muxers is not recommended.
  845. * - encoding: Set by libavcodec.
  846. * - decoding: Set by libavcodec. (FIXME: Is this OK?)
  847. */
  848. int sub_id;
  849. /**
  850. * Motion estimation algorithm used for video coding.
  851. * 1 (zero), 2 (full), 3 (log), 4 (phods), 5 (epzs), 6 (x1), 7 (hex),
  852. * 8 (umh), 9 (iter), 10 (tesa) [7, 8, 10 are x264 specific, 9 is snow specific]
  853. * - encoding: MUST be set by user.
  854. * - decoding: unused
  855. */
  856. int me_method;
  857. /**
  858. * some codecs need / can use extradata like Huffman tables.
  859. * mjpeg: Huffman tables
  860. * rv10: additional flags
  861. * mpeg4: global headers (they can be in the bitstream or here)
  862. * The allocated memory should be FF_INPUT_BUFFER_PADDING_SIZE bytes larger
  863. * than extradata_size to avoid problems if it is read with the bitstream reader.
  864. * The bytewise contents of extradata must not depend on the architecture or CPU endianness.
  865. * - encoding: Set/allocated/freed by libavcodec.
  866. * - decoding: Set/allocated/freed by user.
  867. */
  868. uint8_t *extradata;
  869. int extradata_size;
  870. /**
  871. * This is the fundamental unit of time (in seconds) in terms
  872. * of which frame timestamps are represented. For fixed-fps content,
  873. * timebase should be 1/framerate and timestamp increments should be
  874. * identically 1.
  875. * - encoding: MUST be set by user.
  876. * - decoding: Set by libavcodec.
  877. */
  878. AVRational time_base;
  879. /* video only */
  880. /**
  881. * picture width / height.
  882. * - encoding: MUST be set by user.
  883. * - decoding: Set by libavcodec.
  884. * Note: For compatibility it is possible to set this instead of
  885. * coded_width/height before decoding.
  886. */
  887. int width, height;
  888. #define FF_ASPECT_EXTENDED 15
  889. /**
  890. * the number of pictures in a group of pictures, or 0 for intra_only
  891. * - encoding: Set by user.
  892. * - decoding: unused
  893. */
  894. int gop_size;
  895. /**
  896. * Pixel format, see PIX_FMT_xxx.
  897. * - encoding: Set by user.
  898. * - decoding: Set by libavcodec.
  899. */
  900. enum PixelFormat pix_fmt;
  901. /**
  902. * Frame rate emulation. If not zero, the lower layer (i.e. format handler)
  903. * has to read frames at native frame rate.
  904. * - encoding: Set by user.
  905. * - decoding: unused
  906. */
  907. int rate_emu;
  908. /**
  909. * If non NULL, 'draw_horiz_band' is called by the libavcodec
  910. * decoder to draw a horizontal band. It improves cache usage. Not
  911. * all codecs can do that. You must check the codec capabilities
  912. * beforehand.
  913. * The function is also used by hardware acceleration APIs.
  914. * It is called at least once during frame decoding to pass
  915. * the data needed for hardware render.
  916. * In that mode instead of pixel data, AVFrame points to
  917. * a structure specific to the acceleration API. The application
  918. * reads the structure and can change some fields to indicate progress
  919. * or mark state.
  920. * - encoding: unused
  921. * - decoding: Set by user.
  922. * @param height the height of the slice
  923. * @param y the y position of the slice
  924. * @param type 1->top field, 2->bottom field, 3->frame
  925. * @param offset offset into the AVFrame.data from which the slice should be read
  926. */
  927. void (*draw_horiz_band)(struct AVCodecContext *s,
  928. const AVFrame *src, int offset[4],
  929. int y, int type, int height);
  930. /* audio only */
  931. int sample_rate; ///< samples per second
  932. int channels; ///< number of audio channels
  933. /**
  934. * audio sample format
  935. * - encoding: Set by user.
  936. * - decoding: Set by libavcodec.
  937. */
  938. enum SampleFormat sample_fmt; ///< sample format, currently unused
  939. /* The following data should not be initialized. */
  940. /**
  941. * Samples per packet, initialized when calling 'init'.
  942. */
  943. int frame_size;
  944. int frame_number; ///< audio or video frame number
  945. int real_pict_num; ///< Returns the real picture number of previous encoded frame.
  946. /**
  947. * Number of frames the decoded output will be delayed relative to
  948. * the encoded input.
  949. * - encoding: Set by libavcodec.
  950. * - decoding: unused
  951. */
  952. int delay;
  953. /* - encoding parameters */
  954. float qcompress; ///< amount of qscale change between easy & hard scenes (0.0-1.0)
  955. float qblur; ///< amount of qscale smoothing over time (0.0-1.0)
  956. /**
  957. * minimum quantizer
  958. * - encoding: Set by user.
  959. * - decoding: unused
  960. */
  961. int qmin;
  962. /**
  963. * maximum quantizer
  964. * - encoding: Set by user.
  965. * - decoding: unused
  966. */
  967. int qmax;
  968. /**
  969. * maximum quantizer difference between frames
  970. * - encoding: Set by user.
  971. * - decoding: unused
  972. */
  973. int max_qdiff;
  974. /**
  975. * maximum number of B-frames between non-B-frames
  976. * Note: The output will be delayed by max_b_frames+1 relative to the input.
  977. * - encoding: Set by user.
  978. * - decoding: unused
  979. */
  980. int max_b_frames;
  981. /**
  982. * qscale factor between IP and B-frames
  983. * If > 0 then the last P-frame quantizer will be used (q= lastp_q*factor+offset).
  984. * If < 0 then normal ratecontrol will be done (q= -normal_q*factor+offset).
  985. * - encoding: Set by user.
  986. * - decoding: unused
  987. */
  988. float b_quant_factor;
  989. /** obsolete FIXME remove */
  990. int rc_strategy;
  991. #define FF_RC_STRATEGY_XVID 1
  992. int b_frame_strategy;
  993. /**
  994. * hurry up amount
  995. * - encoding: unused
  996. * - decoding: Set by user. 1-> Skip B-frames, 2-> Skip IDCT/dequant too, 5-> Skip everything except header
  997. * @deprecated Deprecated in favor of skip_idct and skip_frame.
  998. */
  999. int hurry_up;
  1000. struct AVCodec *codec;
  1001. void *priv_data;
  1002. int rtp_payload_size; /* The size of the RTP payload: the coder will */
  1003. /* do its best to deliver a chunk with size */
  1004. /* below rtp_payload_size, the chunk will start */
  1005. /* with a start code on some codecs like H.263. */
  1006. /* This doesn't take account of any particular */
  1007. /* headers inside the transmitted RTP payload. */
  1008. /* The RTP callback: This function is called */
  1009. /* every time the encoder has a packet to send. */
  1010. /* It depends on the encoder if the data starts */
  1011. /* with a Start Code (it should). H.263 does. */
  1012. /* mb_nb contains the number of macroblocks */
  1013. /* encoded in the RTP payload. */
  1014. void (*rtp_callback)(struct AVCodecContext *avctx, void *data, int size, int mb_nb);
  1015. /* statistics, used for 2-pass encoding */
  1016. int mv_bits;
  1017. int header_bits;
  1018. int i_tex_bits;
  1019. int p_tex_bits;
  1020. int i_count;
  1021. int p_count;
  1022. int skip_count;
  1023. int misc_bits;
  1024. /**
  1025. * number of bits used for the previously encoded frame
  1026. * - encoding: Set by libavcodec.
  1027. * - decoding: unused
  1028. */
  1029. int frame_bits;
  1030. /**
  1031. * Private data of the user, can be used to carry app specific stuff.
  1032. * - encoding: Set by user.
  1033. * - decoding: Set by user.
  1034. */
  1035. void *opaque;
  1036. char codec_name[32];
  1037. enum CodecType codec_type; /* see CODEC_TYPE_xxx */
  1038. enum CodecID codec_id; /* see CODEC_ID_xxx */
  1039. /**
  1040. * fourcc (LSB first, so "ABCD" -> ('D'<<24) + ('C'<<16) + ('B'<<8) + 'A').
  1041. * This is used to work around some encoder bugs.
  1042. * A demuxer should set this to what is stored in the field used to identify the codec.
  1043. * If there are multiple such fields in a container then the demuxer should choose the one
  1044. * which maximizes the information about the used codec.
  1045. * If the codec tag field in a container is larger than 32 bits then the demuxer should
  1046. * remap the longer ID to 32 bits with a table or other structure. Alternatively a new
  1047. * extra_codec_tag + size could be added but for this a clear advantage must be demonstrated
  1048. * first.
  1049. * - encoding: Set by user, if not then the default based on codec_id will be used.
  1050. * - decoding: Set by user, will be converted to uppercase by libavcodec during init.
  1051. */
  1052. unsigned int codec_tag;
  1053. /**
  1054. * Work around bugs in encoders which sometimes cannot be detected automatically.
  1055. * - encoding: Set by user
  1056. * - decoding: Set by user
  1057. */
  1058. int workaround_bugs;
  1059. #define FF_BUG_AUTODETECT 1 ///< autodetection
  1060. #define FF_BUG_OLD_MSMPEG4 2
  1061. #define FF_BUG_XVID_ILACE 4
  1062. #define FF_BUG_UMP4 8
  1063. #define FF_BUG_NO_PADDING 16
  1064. #define FF_BUG_AMV 32
  1065. #define FF_BUG_AC_VLC 0 ///< Will be removed, libavcodec can now handle these non-compliant files by default.
  1066. #define FF_BUG_QPEL_CHROMA 64
  1067. #define FF_BUG_STD_QPEL 128
  1068. #define FF_BUG_QPEL_CHROMA2 256
  1069. #define FF_BUG_DIRECT_BLOCKSIZE 512
  1070. #define FF_BUG_EDGE 1024
  1071. #define FF_BUG_HPEL_CHROMA 2048
  1072. #define FF_BUG_DC_CLIP 4096
  1073. #define FF_BUG_MS 8192 ///< Work around various bugs in Microsoft's broken decoders.
  1074. //#define FF_BUG_FAKE_SCALABILITY 16 //Autodetection should work 100%.
  1075. /**
  1076. * luma single coefficient elimination threshold
  1077. * - encoding: Set by user.
  1078. * - decoding: unused
  1079. */
  1080. int luma_elim_threshold;
  1081. /**
  1082. * chroma single coeff elimination threshold
  1083. * - encoding: Set by user.
  1084. * - decoding: unused
  1085. */
  1086. int chroma_elim_threshold;
  1087. /**
  1088. * strictly follow the standard (MPEG4, ...).
  1089. * - encoding: Set by user.
  1090. * - decoding: Set by user.
  1091. * Setting this to STRICT or higher means the encoder and decoder will
  1092. * generally do stupid things. While setting it to inofficial or lower
  1093. * will mean the encoder might use things that are not supported by all
  1094. * spec compliant decoders. Decoders make no difference between normal,
  1095. * inofficial and experimental, that is they always try to decode things
  1096. * when they can unless they are explicitly asked to behave stupid
  1097. * (=strictly conform to the specs)
  1098. */
  1099. int strict_std_compliance;
  1100. #define FF_COMPLIANCE_VERY_STRICT 2 ///< Strictly conform to a older more strict version of the spec or reference software.
  1101. #define FF_COMPLIANCE_STRICT 1 ///< Strictly conform to all the things in the spec no matter what consequences.
  1102. #define FF_COMPLIANCE_NORMAL 0
  1103. #define FF_COMPLIANCE_INOFFICIAL -1 ///< Allow inofficial extensions.
  1104. #define FF_COMPLIANCE_EXPERIMENTAL -2 ///< Allow nonstandardized experimental things.
  1105. /**
  1106. * qscale offset between IP and B-frames
  1107. * - encoding: Set by user.
  1108. * - decoding: unused
  1109. */
  1110. float b_quant_offset;
  1111. /**
  1112. * Error recognition; higher values will detect more errors but may
  1113. * misdetect some more or less valid parts as errors.
  1114. * - encoding: unused
  1115. * - decoding: Set by user.
  1116. */
  1117. int error_recognition;
  1118. #define FF_ER_CAREFUL 1
  1119. #define FF_ER_COMPLIANT 2
  1120. #define FF_ER_AGGRESSIVE 3
  1121. #define FF_ER_VERY_AGGRESSIVE 4
  1122. /**
  1123. * Called at the beginning of each frame to get a buffer for it.
  1124. * If pic.reference is set then the frame will be read later by libavcodec.
  1125. * avcodec_align_dimensions() should be used to find the required width and
  1126. * height, as they normally need to be rounded up to the next multiple of 16.
  1127. * - encoding: unused
  1128. * - decoding: Set by libavcodec., user can override.
  1129. */
  1130. int (*get_buffer)(struct AVCodecContext *c, AVFrame *pic);
  1131. /**
  1132. * Called to release buffers which were allocated with get_buffer.
  1133. * A released buffer can be reused in get_buffer().
  1134. * pic.data[*] must be set to NULL.
  1135. * - encoding: unused
  1136. * - decoding: Set by libavcodec., user can override.
  1137. */
  1138. void (*release_buffer)(struct AVCodecContext *c, AVFrame *pic);
  1139. /**
  1140. * Size of the frame reordering buffer in the decoder.
  1141. * For MPEG-2 it is 1 IPB or 0 low delay IP.
  1142. * - encoding: Set by libavcodec.
  1143. * - decoding: Set by libavcodec.
  1144. */
  1145. int has_b_frames;
  1146. /**
  1147. * number of bytes per packet if constant and known or 0
  1148. * Used by some WAV based audio codecs.
  1149. */
  1150. int block_align;
  1151. int parse_only; /* - decoding only: If true, only parsing is done
  1152. (function avcodec_parse_frame()). The frame
  1153. data is returned. Only MPEG codecs support this now. */
  1154. /**
  1155. * 0-> h263 quant 1-> mpeg quant
  1156. * - encoding: Set by user.
  1157. * - decoding: unused
  1158. */
  1159. int mpeg_quant;
  1160. /**
  1161. * pass1 encoding statistics output buffer
  1162. * - encoding: Set by libavcodec.
  1163. * - decoding: unused
  1164. */
  1165. char *stats_out;
  1166. /**
  1167. * pass2 encoding statistics input buffer
  1168. * Concatenated stuff from stats_out of pass1 should be placed here.
  1169. * - encoding: Allocated/set/freed by user.
  1170. * - decoding: unused
  1171. */
  1172. char *stats_in;
  1173. /**
  1174. * ratecontrol qmin qmax limiting method
  1175. * 0-> clipping, 1-> use a nice continuous function to limit qscale within qmin/qmax.
  1176. * - encoding: Set by user.
  1177. * - decoding: unused
  1178. */
  1179. float rc_qsquish;
  1180. float rc_qmod_amp;
  1181. int rc_qmod_freq;
  1182. /**
  1183. * ratecontrol override, see RcOverride
  1184. * - encoding: Allocated/set/freed by user.
  1185. * - decoding: unused
  1186. */
  1187. RcOverride *rc_override;
  1188. int rc_override_count;
  1189. /**
  1190. * rate control equation
  1191. * - encoding: Set by user
  1192. * - decoding: unused
  1193. */
  1194. const char *rc_eq;
  1195. /**
  1196. * maximum bitrate
  1197. * - encoding: Set by user.
  1198. * - decoding: unused
  1199. */
  1200. int rc_max_rate;
  1201. /**
  1202. * minimum bitrate
  1203. * - encoding: Set by user.
  1204. * - decoding: unused
  1205. */
  1206. int rc_min_rate;
  1207. /**
  1208. * decoder bitstream buffer size
  1209. * - encoding: Set by user.
  1210. * - decoding: unused
  1211. */
  1212. int rc_buffer_size;
  1213. float rc_buffer_aggressivity;
  1214. /**
  1215. * qscale factor between P and I-frames
  1216. * If > 0 then the last p frame quantizer will be used (q= lastp_q*factor+offset).
  1217. * If < 0 then normal ratecontrol will be done (q= -normal_q*factor+offset).
  1218. * - encoding: Set by user.
  1219. * - decoding: unused
  1220. */
  1221. float i_quant_factor;
  1222. /**
  1223. * qscale offset between P and I-frames
  1224. * - encoding: Set by user.
  1225. * - decoding: unused
  1226. */
  1227. float i_quant_offset;
  1228. /**
  1229. * initial complexity for pass1 ratecontrol
  1230. * - encoding: Set by user.
  1231. * - decoding: unused
  1232. */
  1233. float rc_initial_cplx;
  1234. /**
  1235. * DCT algorithm, see FF_DCT_* below
  1236. * - encoding: Set by user.
  1237. * - decoding: unused
  1238. */
  1239. int dct_algo;
  1240. #define FF_DCT_AUTO 0
  1241. #define FF_DCT_FASTINT 1
  1242. #define FF_DCT_INT 2
  1243. #define FF_DCT_MMX 3
  1244. #define FF_DCT_MLIB 4
  1245. #define FF_DCT_ALTIVEC 5
  1246. #define FF_DCT_FAAN 6
  1247. /**
  1248. * luminance masking (0-> disabled)
  1249. * - encoding: Set by user.
  1250. * - decoding: unused
  1251. */
  1252. float lumi_masking;
  1253. /**
  1254. * temporal complexity masking (0-> disabled)
  1255. * - encoding: Set by user.
  1256. * - decoding: unused
  1257. */
  1258. float temporal_cplx_masking;
  1259. /**
  1260. * spatial complexity masking (0-> disabled)
  1261. * - encoding: Set by user.
  1262. * - decoding: unused
  1263. */
  1264. float spatial_cplx_masking;
  1265. /**
  1266. * p block masking (0-> disabled)
  1267. * - encoding: Set by user.
  1268. * - decoding: unused
  1269. */
  1270. float p_masking;
  1271. /**
  1272. * darkness masking (0-> disabled)
  1273. * - encoding: Set by user.
  1274. * - decoding: unused
  1275. */
  1276. float dark_masking;
  1277. /**
  1278. * IDCT algorithm, see FF_IDCT_* below.
  1279. * - encoding: Set by user.
  1280. * - decoding: Set by user.
  1281. */
  1282. int idct_algo;
  1283. #define FF_IDCT_AUTO 0
  1284. #define FF_IDCT_INT 1
  1285. #define FF_IDCT_SIMPLE 2
  1286. #define FF_IDCT_SIMPLEMMX 3
  1287. #define FF_IDCT_LIBMPEG2MMX 4
  1288. #define FF_IDCT_PS2 5
  1289. #define FF_IDCT_MLIB 6
  1290. #define FF_IDCT_ARM 7
  1291. #define FF_IDCT_ALTIVEC 8
  1292. #define FF_IDCT_SH4 9
  1293. #define FF_IDCT_SIMPLEARM 10
  1294. #define FF_IDCT_H264 11
  1295. #define FF_IDCT_VP3 12
  1296. #define FF_IDCT_IPP 13
  1297. #define FF_IDCT_XVIDMMX 14
  1298. #define FF_IDCT_CAVS 15
  1299. #define FF_IDCT_SIMPLEARMV5TE 16
  1300. #define FF_IDCT_SIMPLEARMV6 17
  1301. #define FF_IDCT_SIMPLEVIS 18
  1302. #define FF_IDCT_WMV2 19
  1303. #define FF_IDCT_FAAN 20
  1304. #define FF_IDCT_EA 21
  1305. #define FF_IDCT_SIMPLENEON 22
  1306. #define FF_IDCT_SIMPLEALPHA 23
  1307. /**
  1308. * slice count
  1309. * - encoding: Set by libavcodec.
  1310. * - decoding: Set by user (or 0).
  1311. */
  1312. int slice_count;
  1313. /**
  1314. * slice offsets in the frame in bytes
  1315. * - encoding: Set/allocated by libavcodec.
  1316. * - decoding: Set/allocated by user (or NULL).
  1317. */
  1318. int *slice_offset;
  1319. /**
  1320. * error concealment flags
  1321. * - encoding: unused
  1322. * - decoding: Set by user.
  1323. */
  1324. int error_concealment;
  1325. #define FF_EC_GUESS_MVS 1
  1326. #define FF_EC_DEBLOCK 2
  1327. /**
  1328. * dsp_mask can be used to disable unwanted
  1329. * CPU features (i.e. MMX, SSE. ...)
  1330. *
  1331. * With the FORCE flag you may instead enable given CPU features.
  1332. * (Dangerous: Usable in case of misdetection, improper usage however will
  1333. * result into program crash.)
  1334. */
  1335. unsigned dsp_mask;
  1336. #define FF_MM_FORCE 0x80000000 /* Force usage of selected flags (OR) */
  1337. /* lower 16 bits - CPU features */
  1338. #define FF_MM_MMX 0x0001 ///< standard MMX
  1339. #define FF_MM_3DNOW 0x0004 ///< AMD 3DNOW
  1340. #define FF_MM_MMXEXT 0x0002 ///< SSE integer functions or AMD MMX ext
  1341. #define FF_MM_SSE 0x0008 ///< SSE functions
  1342. #define FF_MM_SSE2 0x0010 ///< PIV SSE2 functions
  1343. #define FF_MM_3DNOWEXT 0x0020 ///< AMD 3DNowExt
  1344. #define FF_MM_SSE3 0x0040 ///< Prescott SSE3 functions
  1345. #define FF_MM_SSSE3 0x0080 ///< Conroe SSSE3 functions
  1346. #define FF_MM_IWMMXT 0x0100 ///< XScale IWMMXT
  1347. #define FF_MM_ALTIVEC 0x0001 ///< standard AltiVec
  1348. /**
  1349. * bits per sample/pixel from the demuxer (needed for huffyuv).
  1350. * - encoding: Set by libavcodec.
  1351. * - decoding: Set by user.
  1352. */
  1353. int bits_per_coded_sample;
  1354. /**
  1355. * prediction method (needed for huffyuv)
  1356. * - encoding: Set by user.
  1357. * - decoding: unused
  1358. */
  1359. int prediction_method;
  1360. #define FF_PRED_LEFT 0
  1361. #define FF_PRED_PLANE 1
  1362. #define FF_PRED_MEDIAN 2
  1363. /**
  1364. * sample aspect ratio (0 if unknown)
  1365. * That is the width of a pixel divided by the height of the pixel.
  1366. * Numerator and denominator must be relatively prime and smaller than 256 for some video standards.
  1367. * - encoding: Set by user.
  1368. * - decoding: Set by libavcodec.
  1369. */
  1370. AVRational sample_aspect_ratio;
  1371. /**
  1372. * the picture in the bitstream
  1373. * - encoding: Set by libavcodec.
  1374. * - decoding: Set by libavcodec.
  1375. */
  1376. AVFrame *coded_frame;
  1377. /**
  1378. * debug
  1379. * - encoding: Set by user.
  1380. * - decoding: Set by user.
  1381. */
  1382. int debug;
  1383. #define FF_DEBUG_PICT_INFO 1
  1384. #define FF_DEBUG_RC 2
  1385. #define FF_DEBUG_BITSTREAM 4
  1386. #define FF_DEBUG_MB_TYPE 8
  1387. #define FF_DEBUG_QP 16
  1388. #define FF_DEBUG_MV 32
  1389. #define FF_DEBUG_DCT_COEFF 0x00000040
  1390. #define FF_DEBUG_SKIP 0x00000080
  1391. #define FF_DEBUG_STARTCODE 0x00000100
  1392. #define FF_DEBUG_PTS 0x00000200
  1393. #define FF_DEBUG_ER 0x00000400
  1394. #define FF_DEBUG_MMCO 0x00000800
  1395. #define FF_DEBUG_BUGS 0x00001000
  1396. #define FF_DEBUG_VIS_QP 0x00002000
  1397. #define FF_DEBUG_VIS_MB_TYPE 0x00004000
  1398. #define FF_DEBUG_BUFFERS 0x00008000
  1399. /**
  1400. * debug
  1401. * - encoding: Set by user.
  1402. * - decoding: Set by user.
  1403. */
  1404. int debug_mv;
  1405. #define FF_DEBUG_VIS_MV_P_FOR 0x00000001 //visualize forward predicted MVs of P frames
  1406. #define FF_DEBUG_VIS_MV_B_FOR 0x00000002 //visualize forward predicted MVs of B frames
  1407. #define FF_DEBUG_VIS_MV_B_BACK 0x00000004 //visualize backward predicted MVs of B frames
  1408. /**
  1409. * error
  1410. * - encoding: Set by libavcodec if flags&CODEC_FLAG_PSNR.
  1411. * - decoding: unused
  1412. */
  1413. uint64_t error[4];
  1414. /**
  1415. * minimum MB quantizer
  1416. * - encoding: unused
  1417. * - decoding: unused
  1418. */
  1419. int mb_qmin;
  1420. /**
  1421. * maximum MB quantizer
  1422. * - encoding: unused
  1423. * - decoding: unused
  1424. */
  1425. int mb_qmax;
  1426. /**
  1427. * motion estimation comparison function
  1428. * - encoding: Set by user.
  1429. * - decoding: unused
  1430. */
  1431. int me_cmp;
  1432. /**
  1433. * subpixel motion estimation comparison function
  1434. * - encoding: Set by user.
  1435. * - decoding: unused
  1436. */
  1437. int me_sub_cmp;
  1438. /**
  1439. * macroblock comparison function (not supported yet)
  1440. * - encoding: Set by user.
  1441. * - decoding: unused
  1442. */
  1443. int mb_cmp;
  1444. /**
  1445. * interlaced DCT comparison function
  1446. * - encoding: Set by user.
  1447. * - decoding: unused
  1448. */
  1449. int ildct_cmp;
  1450. #define FF_CMP_SAD 0
  1451. #define FF_CMP_SSE 1
  1452. #define FF_CMP_SATD 2
  1453. #define FF_CMP_DCT 3
  1454. #define FF_CMP_PSNR 4
  1455. #define FF_CMP_BIT 5
  1456. #define FF_CMP_RD 6
  1457. #define FF_CMP_ZERO 7
  1458. #define FF_CMP_VSAD 8
  1459. #define FF_CMP_VSSE 9
  1460. #define FF_CMP_NSSE 10
  1461. #define FF_CMP_W53 11
  1462. #define FF_CMP_W97 12
  1463. #define FF_CMP_DCTMAX 13
  1464. #define FF_CMP_DCT264 14
  1465. #define FF_CMP_CHROMA 256
  1466. /**
  1467. * ME diamond size & shape
  1468. * - encoding: Set by user.
  1469. * - decoding: unused
  1470. */
  1471. int dia_size;
  1472. /**
  1473. * amount of previous MV predictors (2a+1 x 2a+1 square)
  1474. * - encoding: Set by user.
  1475. * - decoding: unused
  1476. */
  1477. int last_predictor_count;
  1478. /**
  1479. * prepass for motion estimation
  1480. * - encoding: Set by user.
  1481. * - decoding: unused
  1482. */
  1483. int pre_me;
  1484. /**
  1485. * motion estimation prepass comparison function
  1486. * - encoding: Set by user.
  1487. * - decoding: unused
  1488. */
  1489. int me_pre_cmp;
  1490. /**
  1491. * ME prepass diamond size & shape
  1492. * - encoding: Set by user.
  1493. * - decoding: unused
  1494. */
  1495. int pre_dia_size;
  1496. /**
  1497. * subpel ME quality
  1498. * - encoding: Set by user.
  1499. * - decoding: unused
  1500. */
  1501. int me_subpel_quality;
  1502. /**
  1503. * callback to negotiate the pixelFormat
  1504. * @param fmt is the list of formats which are supported by the codec,
  1505. * it is terminated by -1 as 0 is a valid format, the formats are ordered by quality.
  1506. * The first is always the native one.
  1507. * @return the chosen format
  1508. * - encoding: unused
  1509. * - decoding: Set by user, if not set the native format will be chosen.
  1510. */
  1511. enum PixelFormat (*get_format)(struct AVCodecContext *s, const enum PixelFormat * fmt);
  1512. /**
  1513. * DTG active format information (additional aspect ratio
  1514. * information only used in DVB MPEG-2 transport streams)
  1515. * 0 if not set.
  1516. *
  1517. * - encoding: unused
  1518. * - decoding: Set by decoder.
  1519. */
  1520. int dtg_active_format;
  1521. #define FF_DTG_AFD_SAME 8
  1522. #define FF_DTG_AFD_4_3 9
  1523. #define FF_DTG_AFD_16_9 10
  1524. #define FF_DTG_AFD_14_9 11
  1525. #define FF_DTG_AFD_4_3_SP_14_9 13
  1526. #define FF_DTG_AFD_16_9_SP_14_9 14
  1527. #define FF_DTG_AFD_SP_4_3 15
  1528. /**
  1529. * maximum motion estimation search range in subpel units
  1530. * If 0 then no limit.
  1531. *
  1532. * - encoding: Set by user.
  1533. * - decoding: unused
  1534. */
  1535. int me_range;
  1536. /**
  1537. * intra quantizer bias
  1538. * - encoding: Set by user.
  1539. * - decoding: unused
  1540. */
  1541. int intra_quant_bias;
  1542. #define FF_DEFAULT_QUANT_BIAS 999999
  1543. /**
  1544. * inter quantizer bias
  1545. * - encoding: Set by user.
  1546. * - decoding: unused
  1547. */
  1548. int inter_quant_bias;
  1549. /**
  1550. * color table ID
  1551. * - encoding: unused
  1552. * - decoding: Which clrtable should be used for 8bit RGB images.
  1553. * Tables have to be stored somewhere. FIXME
  1554. */
  1555. int color_table_id;
  1556. /**
  1557. * internal_buffer count
  1558. * Don't touch, used by libavcodec default_get_buffer().
  1559. */
  1560. int internal_buffer_count;
  1561. /**
  1562. * internal_buffers
  1563. * Don't touch, used by libavcodec default_get_buffer().
  1564. */
  1565. void *internal_buffer;
  1566. #define FF_LAMBDA_SHIFT 7
  1567. #define FF_LAMBDA_SCALE (1<<FF_LAMBDA_SHIFT)
  1568. #define FF_QP2LAMBDA 118 ///< factor to convert from H.263 QP to lambda
  1569. #define FF_LAMBDA_MAX (256*128-1)
  1570. #define FF_QUALITY_SCALE FF_LAMBDA_SCALE //FIXME maybe remove
  1571. /**
  1572. * Global quality for codecs which cannot change it per frame.
  1573. * This should be proportional to MPEG-1/2/4 qscale.
  1574. * - encoding: Set by user.
  1575. * - decoding: unused
  1576. */
  1577. int global_quality;
  1578. #define FF_CODER_TYPE_VLC 0
  1579. #define FF_CODER_TYPE_AC 1
  1580. #define FF_CODER_TYPE_RAW 2
  1581. #define FF_CODER_TYPE_RLE 3
  1582. #define FF_CODER_TYPE_DEFLATE 4
  1583. /**
  1584. * coder type
  1585. * - encoding: Set by user.
  1586. * - decoding: unused
  1587. */
  1588. int coder_type;
  1589. /**
  1590. * context model
  1591. * - encoding: Set by user.
  1592. * - decoding: unused
  1593. */
  1594. int context_model;
  1595. #if 0
  1596. /**
  1597. *
  1598. * - encoding: unused
  1599. * - decoding: Set by user.
  1600. */
  1601. uint8_t * (*realloc)(struct AVCodecContext *s, uint8_t *buf, int buf_size);
  1602. #endif
  1603. /**
  1604. * slice flags
  1605. * - encoding: unused
  1606. * - decoding: Set by user.
  1607. */
  1608. int slice_flags;
  1609. #define SLICE_FLAG_CODED_ORDER 0x0001 ///< draw_horiz_band() is called in coded order instead of display
  1610. #define SLICE_FLAG_ALLOW_FIELD 0x0002 ///< allow draw_horiz_band() with field slices (MPEG2 field pics)
  1611. #define SLICE_FLAG_ALLOW_PLANE 0x0004 ///< allow draw_horiz_band() with 1 component at a time (SVQ1)
  1612. /**
  1613. * XVideo Motion Acceleration
  1614. * - encoding: forbidden
  1615. * - decoding: set by decoder
  1616. */
  1617. int xvmc_acceleration;
  1618. /**
  1619. * macroblock decision mode
  1620. * - encoding: Set by user.
  1621. * - decoding: unused
  1622. */
  1623. int mb_decision;
  1624. #define FF_MB_DECISION_SIMPLE 0 ///< uses mb_cmp
  1625. #define FF_MB_DECISION_BITS 1 ///< chooses the one which needs the fewest bits
  1626. #define FF_MB_DECISION_RD 2 ///< rate distortion
  1627. /**
  1628. * custom intra quantization matrix
  1629. * - encoding: Set by user, can be NULL.
  1630. * - decoding: Set by libavcodec.
  1631. */
  1632. uint16_t *intra_matrix;
  1633. /**
  1634. * custom inter quantization matrix
  1635. * - encoding: Set by user, can be NULL.
  1636. * - decoding: Set by libavcodec.
  1637. */
  1638. uint16_t *inter_matrix;
  1639. /**
  1640. * fourcc from the AVI stream header (LSB first, so "ABCD" -> ('D'<<24) + ('C'<<16) + ('B'<<8) + 'A').
  1641. * This is used to work around some encoder bugs.
  1642. * - encoding: unused
  1643. * - decoding: Set by user, will be converted to uppercase by libavcodec during init.
  1644. */
  1645. unsigned int stream_codec_tag;
  1646. /**
  1647. * scene change detection threshold
  1648. * 0 is default, larger means fewer detected scene changes.
  1649. * - encoding: Set by user.
  1650. * - decoding: unused
  1651. */
  1652. int scenechange_threshold;
  1653. /**
  1654. * minimum Lagrange multiplier
  1655. * - encoding: Set by user.
  1656. * - decoding: unused
  1657. */
  1658. int lmin;
  1659. /**
  1660. * maximum Lagrange multiplier
  1661. * - encoding: Set by user.
  1662. * - decoding: unused
  1663. */
  1664. int lmax;
  1665. /**
  1666. * palette control structure
  1667. * - encoding: ??? (no palette-enabled encoder yet)
  1668. * - decoding: Set by user.
  1669. */
  1670. struct AVPaletteControl *palctrl;
  1671. /**
  1672. * noise reduction strength
  1673. * - encoding: Set by user.
  1674. * - decoding: unused
  1675. */
  1676. int noise_reduction;
  1677. /**
  1678. * Called at the beginning of a frame to get cr buffer for it.
  1679. * Buffer type (size, hints) must be the same. libavcodec won't check it.
  1680. * libavcodec will pass previous buffer in pic, function should return
  1681. * same buffer or new buffer with old frame "painted" into it.
  1682. * If pic.data[0] == NULL must behave like get_buffer().
  1683. * - encoding: unused
  1684. * - decoding: Set by libavcodec., user can override
  1685. */
  1686. int (*reget_buffer)(struct AVCodecContext *c, AVFrame *pic);
  1687. /**
  1688. * Number of bits which should be loaded into the rc buffer before decoding starts.
  1689. * - encoding: Set by user.
  1690. * - decoding: unused
  1691. */
  1692. int rc_initial_buffer_occupancy;
  1693. /**
  1694. *
  1695. * - encoding: Set by user.
  1696. * - decoding: unused
  1697. */
  1698. int inter_threshold;
  1699. /**
  1700. * CODEC_FLAG2_*
  1701. * - encoding: Set by user.
  1702. * - decoding: Set by user.
  1703. */
  1704. int flags2;
  1705. /**
  1706. * Simulates errors in the bitstream to test error concealment.
  1707. * - encoding: Set by user.
  1708. * - decoding: unused
  1709. */
  1710. int error_rate;
  1711. /**
  1712. * MP3 antialias algorithm, see FF_AA_* below.
  1713. * - encoding: unused
  1714. * - decoding: Set by user.
  1715. */
  1716. int antialias_algo;
  1717. #define FF_AA_AUTO 0
  1718. #define FF_AA_FASTINT 1 //not implemented yet
  1719. #define FF_AA_INT 2
  1720. #define FF_AA_FLOAT 3
  1721. /**
  1722. * quantizer noise shaping
  1723. * - encoding: Set by user.
  1724. * - decoding: unused
  1725. */
  1726. int quantizer_noise_shaping;
  1727. /**
  1728. * thread count
  1729. * is used to decide how many independent tasks should be passed to execute()
  1730. * - encoding: Set by user.
  1731. * - decoding: Set by user.
  1732. */
  1733. int thread_count;
  1734. /**
  1735. * The codec may call this to execute several independent things.
  1736. * It will return only after finishing all tasks.
  1737. * The user may replace this with some multithreaded implementation,
  1738. * the default implementation will execute the parts serially.
  1739. * @param count the number of things to execute
  1740. * - encoding: Set by libavcodec, user can override.
  1741. * - decoding: Set by libavcodec, user can override.
  1742. */
  1743. int (*execute)(struct AVCodecContext *c, int (*func)(struct AVCodecContext *c2, void *arg), void *arg2, int *ret, int count, int size);
  1744. /**
  1745. * thread opaque
  1746. * Can be used by execute() to store some per AVCodecContext stuff.
  1747. * - encoding: set by execute()
  1748. * - decoding: set by execute()
  1749. */
  1750. void *thread_opaque;
  1751. /**
  1752. * Motion estimation threshold below which no motion estimation is
  1753. * performed, but instead the user specified motion vectors are used.
  1754. *
  1755. * - encoding: Set by user.
  1756. * - decoding: unused
  1757. */
  1758. int me_threshold;
  1759. /**
  1760. * Macroblock threshold below which the user specified macroblock types will be used.
  1761. * - encoding: Set by user.
  1762. * - decoding: unused
  1763. */
  1764. int mb_threshold;
  1765. /**
  1766. * precision of the intra DC coefficient - 8
  1767. * - encoding: Set by user.
  1768. * - decoding: unused
  1769. */
  1770. int intra_dc_precision;
  1771. /**
  1772. * noise vs. sse weight for the nsse comparison function
  1773. * - encoding: Set by user.
  1774. * - decoding: unused
  1775. */
  1776. int nsse_weight;
  1777. /**
  1778. * Number of macroblock rows at the top which are skipped.
  1779. * - encoding: unused
  1780. * - decoding: Set by user.
  1781. */
  1782. int skip_top;
  1783. /**
  1784. * Number of macroblock rows at the bottom which are skipped.
  1785. * - encoding: unused
  1786. * - decoding: Set by user.
  1787. */
  1788. int skip_bottom;
  1789. /**
  1790. * profile
  1791. * - encoding: Set by user.
  1792. * - decoding: Set by libavcodec.
  1793. */
  1794. int profile;
  1795. #define FF_PROFILE_UNKNOWN -99
  1796. #define FF_PROFILE_AAC_MAIN 0
  1797. #define FF_PROFILE_AAC_LOW 1
  1798. #define FF_PROFILE_AAC_SSR 2
  1799. #define FF_PROFILE_AAC_LTP 3
  1800. /**
  1801. * level
  1802. * - encoding: Set by user.
  1803. * - decoding: Set by libavcodec.
  1804. */
  1805. int level;
  1806. #define FF_LEVEL_UNKNOWN -99
  1807. /**
  1808. * low resolution decoding, 1-> 1/2 size, 2->1/4 size
  1809. * - encoding: unused
  1810. * - decoding: Set by user.
  1811. */
  1812. int lowres;
  1813. /**
  1814. * Bitstream width / height, may be different from width/height if lowres
  1815. * or other things are used.
  1816. * - encoding: unused
  1817. * - decoding: Set by user before init if known. Codec should override / dynamically change if needed.
  1818. */
  1819. int coded_width, coded_height;
  1820. /**
  1821. * frame skip threshold
  1822. * - encoding: Set by user.
  1823. * - decoding: unused
  1824. */
  1825. int frame_skip_threshold;
  1826. /**
  1827. * frame skip factor
  1828. * - encoding: Set by user.
  1829. * - decoding: unused
  1830. */
  1831. int frame_skip_factor;
  1832. /**
  1833. * frame skip exponent
  1834. * - encoding: Set by user.
  1835. * - decoding: unused
  1836. */
  1837. int frame_skip_exp;
  1838. /**
  1839. * frame skip comparison function
  1840. * - encoding: Set by user.
  1841. * - decoding: unused
  1842. */
  1843. int frame_skip_cmp;
  1844. /**
  1845. * Border processing masking, raises the quantizer for mbs on the borders
  1846. * of the picture.
  1847. * - encoding: Set by user.
  1848. * - decoding: unused
  1849. */
  1850. float border_masking;
  1851. /**
  1852. * minimum MB Lagrange multiplier
  1853. * - encoding: Set by user.
  1854. * - decoding: unused
  1855. */
  1856. int mb_lmin;
  1857. /**
  1858. * maximum MB Lagrange multiplier
  1859. * - encoding: Set by user.
  1860. * - decoding: unused
  1861. */
  1862. int mb_lmax;
  1863. /**
  1864. *
  1865. * - encoding: Set by user.
  1866. * - decoding: unused
  1867. */
  1868. int me_penalty_compensation;
  1869. /**
  1870. *
  1871. * - encoding: unused
  1872. * - decoding: Set by user.
  1873. */
  1874. enum AVDiscard skip_loop_filter;
  1875. /**
  1876. *
  1877. * - encoding: unused
  1878. * - decoding: Set by user.
  1879. */
  1880. enum AVDiscard skip_idct;
  1881. /**
  1882. *
  1883. * - encoding: unused
  1884. * - decoding: Set by user.
  1885. */
  1886. enum AVDiscard skip_frame;
  1887. /**
  1888. *
  1889. * - encoding: Set by user.
  1890. * - decoding: unused
  1891. */
  1892. int bidir_refine;
  1893. /**
  1894. *
  1895. * - encoding: Set by user.
  1896. * - decoding: unused
  1897. */
  1898. int brd_scale;
  1899. /**
  1900. * constant rate factor - quality-based VBR - values ~correspond to qps
  1901. * - encoding: Set by user.
  1902. * - decoding: unused
  1903. */
  1904. float crf;
  1905. /**
  1906. * constant quantization parameter rate control method
  1907. * - encoding: Set by user.
  1908. * - decoding: unused
  1909. */
  1910. int cqp;
  1911. /**
  1912. * minimum GOP size
  1913. * - encoding: Set by user.
  1914. * - decoding: unused
  1915. */
  1916. int keyint_min;
  1917. /**
  1918. * number of reference frames
  1919. * - encoding: Set by user.
  1920. * - decoding: Set by lavc.
  1921. */
  1922. int refs;
  1923. /**
  1924. * chroma qp offset from luma
  1925. * - encoding: Set by user.
  1926. * - decoding: unused
  1927. */
  1928. int chromaoffset;
  1929. /**
  1930. * Influences how often B-frames are used.
  1931. * - encoding: Set by user.
  1932. * - decoding: unused
  1933. */
  1934. int bframebias;
  1935. /**
  1936. * trellis RD quantization
  1937. * - encoding: Set by user.
  1938. * - decoding: unused
  1939. */
  1940. int trellis;
  1941. /**
  1942. * Reduce fluctuations in qp (before curve compression).
  1943. * - encoding: Set by user.
  1944. * - decoding: unused
  1945. */
  1946. float complexityblur;
  1947. /**
  1948. * in-loop deblocking filter alphac0 parameter
  1949. * alpha is in the range -6...6
  1950. * - encoding: Set by user.
  1951. * - decoding: unused
  1952. */
  1953. int deblockalpha;
  1954. /**
  1955. * in-loop deblocking filter beta parameter
  1956. * beta is in the range -6...6
  1957. * - encoding: Set by user.
  1958. * - decoding: unused
  1959. */
  1960. int deblockbeta;
  1961. /**
  1962. * macroblock subpartition sizes to consider - p8x8, p4x4, b8x8, i8x8, i4x4
  1963. * - encoding: Set by user.
  1964. * - decoding: unused
  1965. */
  1966. int partitions;
  1967. #define X264_PART_I4X4 0x001 /* Analyze i4x4 */
  1968. #define X264_PART_I8X8 0x002 /* Analyze i8x8 (requires 8x8 transform) */
  1969. #define X264_PART_P8X8 0x010 /* Analyze p16x8, p8x16 and p8x8 */
  1970. #define X264_PART_P4X4 0x020 /* Analyze p8x4, p4x8, p4x4 */
  1971. #define X264_PART_B8X8 0x100 /* Analyze b16x8, b8x16 and b8x8 */
  1972. /**
  1973. * direct MV prediction mode - 0 (none), 1 (spatial), 2 (temporal), 3 (auto)
  1974. * - encoding: Set by user.
  1975. * - decoding: unused
  1976. */
  1977. int directpred;
  1978. /**
  1979. * Audio cutoff bandwidth (0 means "automatic")
  1980. * - encoding: Set by user.
  1981. * - decoding: unused
  1982. */
  1983. int cutoff;
  1984. /**
  1985. * Multiplied by qscale for each frame and added to scene_change_score.
  1986. * - encoding: Set by user.
  1987. * - decoding: unused
  1988. */
  1989. int scenechange_factor;
  1990. /**
  1991. *
  1992. * Note: Value depends upon the compare function used for fullpel ME.
  1993. * - encoding: Set by user.
  1994. * - decoding: unused
  1995. */
  1996. int mv0_threshold;
  1997. /**
  1998. * Adjusts sensitivity of b_frame_strategy 1.
  1999. * - encoding: Set by user.
  2000. * - decoding: unused
  2001. */
  2002. int b_sensitivity;
  2003. /**
  2004. * - encoding: Set by user.
  2005. * - decoding: unused
  2006. */
  2007. int compression_level;
  2008. #define FF_COMPRESSION_DEFAULT -1
  2009. /**
  2010. * Sets whether to use LPC mode - used by FLAC encoder.
  2011. * - encoding: Set by user.
  2012. * - decoding: unused
  2013. */
  2014. int use_lpc;
  2015. /**
  2016. * LPC coefficient precision - used by FLAC encoder
  2017. * - encoding: Set by user.
  2018. * - decoding: unused
  2019. */
  2020. int lpc_coeff_precision;
  2021. /**
  2022. * - encoding: Set by user.
  2023. * - decoding: unused
  2024. */
  2025. int min_prediction_order;
  2026. /**
  2027. * - encoding: Set by user.
  2028. * - decoding: unused
  2029. */
  2030. int max_prediction_order;
  2031. /**
  2032. * search method for selecting prediction order
  2033. * - encoding: Set by user.
  2034. * - decoding: unused
  2035. */
  2036. int prediction_order_method;
  2037. /**
  2038. * - encoding: Set by user.
  2039. * - decoding: unused
  2040. */
  2041. int min_partition_order;
  2042. /**
  2043. * - encoding: Set by user.
  2044. * - decoding: unused
  2045. */
  2046. int max_partition_order;
  2047. /**
  2048. * GOP timecode frame start number, in non drop frame format
  2049. * - encoding: Set by user.
  2050. * - decoding: unused
  2051. */
  2052. int64_t timecode_frame_start;
  2053. #if LIBAVCODEC_VERSION_MAJOR < 53
  2054. /**
  2055. * Decoder should decode to this many channels if it can (0 for default)
  2056. * - encoding: unused
  2057. * - decoding: Set by user.
  2058. * @deprecated Deprecated in favor of request_channel_layout.
  2059. */
  2060. int request_channels;
  2061. #endif
  2062. /**
  2063. * Percentage of dynamic range compression to be applied by the decoder.
  2064. * The default value is 1.0, corresponding to full compression.
  2065. * - encoding: unused
  2066. * - decoding: Set by user.
  2067. */
  2068. float drc_scale;
  2069. /**
  2070. * opaque 64bit number (generally a PTS) that will be reordered and
  2071. * output in AVFrame.reordered_opaque
  2072. * - encoding: unused
  2073. * - decoding: Set by user.
  2074. */
  2075. int64_t reordered_opaque;
  2076. /**
  2077. * Bits per sample/pixel of internal libavcodec pixel/sample format.
  2078. * This field is applicable only when sample_fmt is SAMPLE_FMT_S32.
  2079. * - encoding: set by user.
  2080. * - decoding: set by libavcodec.
  2081. */
  2082. int bits_per_raw_sample;
  2083. /**
  2084. * Audio channel layout.
  2085. * - encoding: set by user.
  2086. * - decoding: set by libavcodec.
  2087. */
  2088. int64_t channel_layout;
  2089. /**
  2090. * Request decoder to use this channel layout if it can (0 for default)
  2091. * - encoding: unused
  2092. * - decoding: Set by user.
  2093. */
  2094. int64_t request_channel_layout;
  2095. /**
  2096. * Ratecontrol attempt to use, at maximum, <value> of what can be used without an underflow.
  2097. * - encoding: Set by user.
  2098. * - decoding: unused.
  2099. */
  2100. float rc_max_available_vbv_use;
  2101. /**
  2102. * Ratecontrol attempt to use, at least, <value> times the amount needed to prevent a vbv overflow.
  2103. * - encoding: Set by user.
  2104. * - decoding: unused.
  2105. */
  2106. float rc_min_vbv_overflow_use;
  2107. /**
  2108. * Hardware accelerator in use
  2109. * - encoding: unused.
  2110. * - decoding: Set by libavcodec
  2111. */
  2112. struct AVHWAccel *hwaccel;
  2113. /**
  2114. * For some codecs, the time base is closer to the field rate than the frame rate.
  2115. * Most notably, H.264 and MPEG-2 specify time_base as half of frame duration
  2116. * if no telecine is used ...
  2117. *
  2118. * Set to time_base ticks per frame. Default 1, e.g., H.264/MPEG-2 set it to 2.
  2119. */
  2120. int ticks_per_frame;
  2121. /**
  2122. * Hardware accelerator context.
  2123. * For some hardware accelerators, a global context needs to be
  2124. * provided by the user. In that case, this holds display-dependent
  2125. * data FFmpeg cannot instantiate itself. Please refer to the
  2126. * FFmpeg HW accelerator documentation to know how to fill this
  2127. * in, e.g. for VA API, this is a struct vaapi_context.
  2128. * - encoding: unused
  2129. * - decoding: Set by user
  2130. */
  2131. void *hwaccel_context;
  2132. } AVCodecContext;
  2133. /**
  2134. * AVCodec: description of one codec implementation (identity, callbacks and supported formats).
  2135. */
  2136. typedef struct AVCodec {
  2137. /**
  2138. * Name of the codec implementation.
  2139. * The name is globally unique among encoders and among decoders (but an
  2140. * encoder and a decoder can share the same name).
  2141. * This is the primary way to find a codec from the user perspective.
  2142. */
  2143. const char *name;
  2144. enum CodecType type; ///< type of codec, see CODEC_TYPE_xxx
  2145. enum CodecID id; ///< codec implemented, see CODEC_ID_xxx
  2146. int priv_data_size; ///< size of the codec private data
  2147. int (*init)(AVCodecContext *);
  2148. int (*encode)(AVCodecContext *, uint8_t *buf, int buf_size, void *data);
  2149. int (*close)(AVCodecContext *);
  2150. int (*decode)(AVCodecContext *, void *outdata, int *outdata_size,
  2151. const uint8_t *buf, int buf_size);
  2152. /**
  2153. * Codec capabilities.
  2154. * See CODEC_CAP_*
  2155. */
  2156. int capabilities;
  2157. struct AVCodec *next; ///< presumably the link followed by av_codec_next() -- TODO confirm
  2158. /**
  2159. * Flush buffers.
  2160. * Will be called when seeking.
  2161. */
  2162. void (*flush)(AVCodecContext *);
  2163. const AVRational *supported_framerates; ///< array of supported framerates, or NULL if any, array is terminated by {0,0}
  2164. const enum PixelFormat *pix_fmts; ///< array of supported pixel formats, or NULL if unknown, array is terminated by -1
  2165. /**
  2166. * Descriptive name for the codec, meant to be more human readable than \p name.
  2167. * You \e should use the NULL_IF_CONFIG_SMALL() macro to define it.
  2168. */
  2169. const char *long_name;
  2170. const int *supported_samplerates; ///< array of supported audio samplerates, or NULL if unknown, array is terminated by 0
  2171. const enum SampleFormat *sample_fmts; ///< array of supported sample formats, or NULL if unknown, array is terminated by -1
  2172. const int64_t *channel_layouts; ///< array of supported channel layouts, or NULL if unknown, array is terminated by 0
  2173. } AVCodec;
  2174. /**
  2175. * AVHWAccel: description of one hardware accelerator (the codec and pixel format it handles, plus its mandatory per-frame and per-slice callbacks).
  2176. */
  2177. typedef struct AVHWAccel {
  2178. /**
  2179. * Name of the hardware accelerated codec.
  2180. * The name is globally unique among encoders and among decoders (but an
  2181. * encoder and a decoder can share the same name).
  2182. */
  2183. const char *name;
  2184. /**
  2185. * Type of codec implemented by the hardware accelerator.
  2186. *
  2187. * See CODEC_TYPE_xxx
  2188. */
  2189. enum CodecType type;
  2190. /**
  2191. * Codec implemented by the hardware accelerator.
  2192. *
  2193. * See CODEC_ID_xxx
  2194. */
  2195. enum CodecID id;
  2196. /**
  2197. * Supported pixel format.
  2198. *
  2199. * Only hardware accelerated formats are supported here.
  2200. */
  2201. enum PixelFormat pix_fmt;
  2202. /**
  2203. * Hardware accelerated codec capabilities.
  2204. * See FF_HWACCEL_CODEC_CAP_*
  2205. */
  2206. int capabilities;
  2207. struct AVHWAccel *next; ///< presumably the next hardware accelerator in a linked list -- TODO confirm
  2208. /**
  2209. * Called at the beginning of each frame or field picture.
  2210. *
  2211. * Meaningful frame information (codec specific) is guaranteed to
  2212. * be parsed at this point. This function is mandatory.
  2213. *
  2214. * Note that \p buf can be NULL along with \p buf_size set to 0.
  2215. * Otherwise, this means the whole frame is available at this point.
  2216. *
  2217. * @param avctx the codec context
  2218. * @param buf the frame data buffer base
  2219. * @param buf_size the size of the frame in bytes
  2220. * @return zero if successful, a negative value otherwise
  2221. */
  2222. int (*start_frame)(AVCodecContext *avctx, const uint8_t *buf, uint32_t buf_size);
  2223. /**
  2224. * Callback for each slice.
  2225. *
  2226. * Meaningful slice information (codec specific) is guaranteed to
  2227. * be parsed at this point. This function is mandatory.
  2228. *
  2229. * @param avctx the codec context
  2230. * @param buf the slice data buffer base
  2231. * @param buf_size the size of the slice in bytes
  2232. * @return zero if successful, a negative value otherwise
  2233. */
  2234. int (*decode_slice)(AVCodecContext *avctx, const uint8_t *buf, uint32_t buf_size);
  2235. /**
  2236. * Called at the end of each frame or field picture.
  2237. *
  2238. * The whole picture is parsed at this point and can now be sent
  2239. * to the hardware accelerator. This function is mandatory.
  2240. *
  2241. * @param avctx the codec context
  2242. * @return zero if successful, a negative value otherwise
  2243. */
  2244. int (*end_frame)(AVCodecContext *avctx);
  2245. /**
  2246. * Size of HW accelerator private data.
  2247. *
  2248. * Private data is allocated with av_mallocz() before
  2249. * AVCodecContext.get_buffer() and deallocated after
  2250. * AVCodecContext.release_buffer().
  2251. */
  2252. int priv_data_size;
  2253. } AVHWAccel;
  2254. /**
  2255. * Picture with four components, that's all: each has a data pointer and a line size.
  2256. * The last component is alpha.
  2257. */
  2258. typedef struct AVPicture {
  2259. uint8_t *data[4]; ///< pointers to the image data, one per component
  2260. int linesize[4]; ///< number of bytes per line
  2261. } AVPicture;
  2262. #if LIBAVCODEC_VERSION_MAJOR < 53
  2263. /**
  2264. * AVPaletteControl
  2265. * This structure defines a method for communicating palette changes
  2266. * between a demuxer and a decoder.
  2267. *
  2268. * @deprecated Use AVPacket to send palette changes instead.
  2269. * This is totally broken.
  2270. */
  2271. #define AVPALETTE_SIZE 1024 /* AVPALETTE_COUNT entries of 4 bytes each */
  2272. #define AVPALETTE_COUNT 256 /* number of entries in AVPaletteControl.palette */
  2273. typedef struct AVPaletteControl {
  2274. /* Demuxer sets this to 1 to indicate the palette has changed;
  2275. * decoder resets to 0. */
  2276. int palette_changed;
  2277. /* 4-byte ARGB palette entries, stored in native byte order; note that
  2278. * the individual palette components should be on an 8-bit scale; if
  2279. * the palette data comes from an IBM VGA native format, the component
  2280. * data is probably 6 bits in size and needs to be scaled. */
  2281. unsigned int palette[AVPALETTE_COUNT];
  2282. } AVPaletteControl attribute_deprecated;
  2283. #endif
  2284. enum AVSubtitleType { /* tells which AVSubtitleRect field (pict, text or ass) is authoritative */
  2285. SUBTITLE_NONE,
  2286. SUBTITLE_BITMAP, ///< A bitmap, pict will be set
  2287. /**
  2288. * Plain text, the text field must be set by the decoder and is
  2289. * authoritative. The ass and pict fields may contain approximations.
  2290. */
  2291. SUBTITLE_TEXT,
  2292. /**
  2293. * Formatted text, the ass field must be set by the decoder and is
  2294. * authoritative. The pict and text fields may contain approximations.
  2295. */
  2296. SUBTITLE_ASS,
  2297. };
  2298. typedef struct AVSubtitleRect {
  2299. int x; ///< top left corner of pict, undefined when pict is not set
  2300. int y; ///< top left corner of pict, undefined when pict is not set
  2301. int w; ///< width of pict, undefined when pict is not set
  2302. int h; ///< height of pict, undefined when pict is not set
  2303. int nb_colors; ///< number of colors in pict, undefined when pict is not set
  2304. /**
  2305. * data+linesize for the bitmap of this subtitle.
  2306. * Can be set for text/ass as well once they were rendered.
  2307. */
  2308. AVPicture pict;
  2309. enum AVSubtitleType type; ///< which of pict/text/ass is authoritative, see enum AVSubtitleType
  2310. char *text; ///< 0 terminated plain UTF-8 text
  2311. /**
  2312. * 0 terminated ASS/SSA compatible event line.
  2313. * The presentation of this is unaffected by the other values in this
  2314. * struct.
  2315. */
  2316. char *ass;
  2317. } AVSubtitleRect;
  2318. typedef struct AVSubtitle { /* one subtitle: its display interval plus a set of AVSubtitleRect */
  2319. uint16_t format; /* 0 = graphics */
  2320. uint32_t start_display_time; /* relative to packet pts, in ms */
  2321. uint32_t end_display_time; /* relative to packet pts, in ms */
  2322. unsigned num_rects; /* presumably the number of entries in rects -- TODO confirm */
  2323. AVSubtitleRect **rects; /* array of pointers to the subtitle rectangles */
  2324. } AVSubtitle;
  2325. /* resample.c */
  2326. struct ReSampleContext;
  2327. struct AVResampleContext;
  2328. typedef struct ReSampleContext ReSampleContext;
  2329. #if LIBAVCODEC_VERSION_MAJOR < 53
  2330. /**
  2331. * @deprecated Use av_audio_resample_init() instead.
  2332. */
  2333. attribute_deprecated ReSampleContext *audio_resample_init(int output_channels, int input_channels,
  2334. int output_rate, int input_rate);
  2335. #endif
  2336. /**
  2337. * Initializes an audio resampling context.
  2338. *
  2339. * @param output_channels number of output channels
  2340. * @param input_channels number of input channels
  2341. * @param output_rate output sample rate
  2342. * @param input_rate input sample rate
  2343. * @param sample_fmt_out requested output sample format
  2344. * @param sample_fmt_in input sample format
  2345. * @param filter_length length of each FIR filter in the filterbank relative to the cutoff freq
  2346. * @param log2_phase_count log2 of the number of entries in the polyphase filterbank
  2347. * @param linear If 1 then the used FIR filter will be linearly interpolated
  2348. * between the 2 closest, if 0 the closest will be used
  2349. * @param cutoff cutoff frequency, 1.0 corresponds to half the output sampling rate
  2350. * @return allocated ReSampleContext, NULL if an error occurred
  2351. */
  2352. ReSampleContext *av_audio_resample_init(int output_channels, int input_channels,
  2353. int output_rate, int input_rate,
  2354. enum SampleFormat sample_fmt_out,
  2355. enum SampleFormat sample_fmt_in,
  2356. int filter_length, int log2_phase_count,
  2357. int linear, double cutoff);
  2358. int audio_resample(ReSampleContext *s, short *output, short *input, int nb_samples);
  2359. void audio_resample_close(ReSampleContext *s);
  2360. /**
  2361. * Initializes an audio resampler.
  2362. * Note, if either rate is not an integer then simply scale both rates up so they are.
  2363. * @param filter_length length of each FIR filter in the filterbank relative to the cutoff freq
  2364. * @param log2_phase_count log2 of the number of entries in the polyphase filterbank
  2365. * @param linear If 1 then the used FIR filter will be linearly interpolated
  2366. between the 2 closest, if 0 the closest will be used
  2367. * @param cutoff cutoff frequency, 1.0 corresponds to half the output sampling rate
  2368. */
  2369. struct AVResampleContext *av_resample_init(int out_rate, int in_rate, int filter_length, int log2_phase_count, int linear, double cutoff);
  2370. /**
  2371. * resamples.
  2372. * @param src an array of unconsumed samples
  2373. * @param consumed the number of samples of src which have been consumed are returned here
  2374. * @param src_size the number of unconsumed samples available
  2375. * @param dst_size the amount of space in samples available in dst
  2376. * @param update_ctx If this is 0 then the context will not be modified, that way several channels can be resampled with the same context.
  2377. * @return the number of samples written in dst or -1 if an error occurred
  2378. */
  2379. int av_resample(struct AVResampleContext *c, short *dst, short *src, int *consumed, int src_size, int dst_size, int update_ctx);
  2380. /**
  2381. * Compensates samplerate/timestamp drift. The compensation is done by changing
  2382. * the resampler parameters, so no audible clicks or similar distortions occur.
  2383. * @param sample_delta number of output samples which should be output less
  2384. * @param compensation_distance distance in output samples over which the compensation should be performed
  2385. *
  2386. * example: av_resample_compensate(c, 10, 500), i.e. sample_delta = 10 and compensation_distance = 500
  2387. * here instead of 510 samples only 500 samples would be output
  2388. *
  2389. * note, due to rounding the actual compensation might be slightly different,
  2390. * especially if the compensation_distance is large and the in_rate used during init is small
  2391. */
  2392. void av_resample_compensate(struct AVResampleContext *c, int sample_delta, int compensation_distance);
  2393. void av_resample_close(struct AVResampleContext *c);
  2394. /**
  2395. * Allocate memory for a picture. Call avpicture_free to free it.
  2396. *
  2397. * @param picture the picture to be filled in
  2398. * @param pix_fmt the format of the picture
  2399. * @param width the width of the picture
  2400. * @param height the height of the picture
  2401. * @return zero if successful, a negative value if not
  2402. */
  2403. int avpicture_alloc(AVPicture *picture, int pix_fmt, int width, int height);
  2404. /**
  2405. * Free a picture previously allocated by avpicture_alloc().
  2406. *
  2407. * @param picture the AVPicture to be freed
  2408. */
  2409. void avpicture_free(AVPicture *picture);
  2410. /**
  2411. * Fill in the AVPicture fields.
  2412. * The fields of the given AVPicture are filled in by using the 'ptr' address
  2413. * which points to the image data buffer. Depending on the specified picture
  2414. * format, one or multiple image data pointers and line sizes will be set.
  2415. * If a planar format is specified, several pointers will be set pointing to
  2416. * the different picture planes and the line sizes of the different planes
  2417. * will be stored in the linesize array of the AVPicture.
  2418. * Call with ptr == NULL to get the required size for the ptr buffer.
  2419. *
  2420. * @param picture AVPicture whose fields are to be filled in
  2421. * @param ptr Buffer which will contain or contains the actual image data
  2422. * @param pix_fmt The format in which the picture data is stored.
  2423. * @param width the width of the image in pixels
  2424. * @param height the height of the image in pixels
  2425. * @return size of the image data in bytes
  2426. */
  2427. int avpicture_fill(AVPicture *picture, uint8_t *ptr,
  2428. int pix_fmt, int width, int height);
  2429. int avpicture_layout(const AVPicture* src, int pix_fmt, int width, int height,
  2430. unsigned char *dest, int dest_size);
  2431. /**
  2432. * Calculate the size in bytes that a picture of the given width and height
  2433. * would occupy if stored in the given picture format.
  2434. * Note that this returns the size of a compact representation as generated
  2435. * by avpicture_layout, which can be smaller than the size required for e.g.
  2436. * avpicture_fill.
  2437. *
  2438. * @param pix_fmt the given picture format
  2439. * @param width the width of the image
  2440. * @param height the height of the image
  2441. * @return Image data size in bytes or -1 on error (e.g. too large dimensions).
  2442. */
  2443. int avpicture_get_size(int pix_fmt, int width, int height);
  2444. void avcodec_get_chroma_sub_sample(int pix_fmt, int *h_shift, int *v_shift);
  2445. const char *avcodec_get_pix_fmt_name(int pix_fmt);
  2446. void avcodec_set_dimensions(AVCodecContext *s, int width, int height);
  2447. enum PixelFormat avcodec_get_pix_fmt(const char* name);
  2448. unsigned int avcodec_pix_fmt_to_codec_tag(enum PixelFormat p);
  2449. #define FF_LOSS_RESOLUTION 0x0001 /**< loss due to resolution change */
  2450. #define FF_LOSS_DEPTH 0x0002 /**< loss due to color depth change */
  2451. #define FF_LOSS_COLORSPACE 0x0004 /**< loss due to color space conversion */
  2452. #define FF_LOSS_ALPHA 0x0008 /**< loss of alpha bits */
  2453. #define FF_LOSS_COLORQUANT 0x0010 /**< loss due to color quantization */
  2454. #define FF_LOSS_CHROMA 0x0020 /**< loss of chroma (e.g. RGB to gray conversion) */
  2455. /**
  2456. * Computes what kind of losses will occur when converting from one specific
  2457. * pixel format to another.
  2458. * When converting from one pixel format to another, information loss may occur.
  2459. * For example, when converting from RGB24 to GRAY, the color information will
  2460. * be lost. Similarly, other losses occur when converting from some formats to
  2461. * other formats. These losses can involve loss of chroma, but also loss of
  2462. * resolution, loss of color depth, loss due to the color space conversion, loss
  2463. * of the alpha bits or loss due to color quantization.
  2464. * avcodec_get_pix_fmt_loss() informs you about the various types of losses
  2465. * which will occur when converting from one pixel format to another.
  2466. *
  2467. * @param[in] dst_pix_fmt destination pixel format
  2468. * @param[in] src_pix_fmt source pixel format
  2469. * @param[in] has_alpha Whether the source pixel format alpha channel is used.
  2470. * @return Combination of FF_LOSS_xxx flags informing you what kind of losses will occur.
  2471. */
  2472. int avcodec_get_pix_fmt_loss(int dst_pix_fmt, int src_pix_fmt,
  2473. int has_alpha);
  2474. /**
  2475. * Finds the best pixel format to convert to given a certain source pixel
  2476. * format. When converting from one pixel format to another, information loss
  2477. * may occur. For example, when converting from RGB24 to GRAY, the color
  2478. * information will be lost. Similarly, other losses occur when converting from
  2479. * some formats to other formats. avcodec_find_best_pix_fmt() searches which of
  2480. * the given pixel formats should be used to suffer the least amount of loss.
  2481. * The pixel formats from which it chooses one are determined by the
  2482. * \p pix_fmt_mask parameter.
  2483. *
  2484. * @code
  2485. * src_pix_fmt = PIX_FMT_YUV420P;
  2486. * pix_fmt_mask = (1 << PIX_FMT_YUV422P) | (1 << PIX_FMT_RGB24);
  2487. * dst_pix_fmt = avcodec_find_best_pix_fmt(pix_fmt_mask, src_pix_fmt, alpha, &loss);
  2488. * @endcode
  2489. *
  2490. * @param[in] pix_fmt_mask bitmask determining which pixel format to choose from
  2491. * @param[in] src_pix_fmt source pixel format
  2492. * @param[in] has_alpha Whether the source pixel format alpha channel is used.
  2493. * @param[out] loss_ptr Combination of flags informing you what kind of losses will occur.
  2494. * @return The best pixel format to convert to or -1 if none was found.
  2495. */
  2496. int avcodec_find_best_pix_fmt(int64_t pix_fmt_mask, int src_pix_fmt,
  2497. int has_alpha, int *loss_ptr);
  2498. /**
  2499. * Print in buf the string corresponding to the pixel format with
  2500. * number pix_fmt, or a header if pix_fmt is negative.
  2501. *
  2502. * @param[out] buf the buffer where to write the string
  2503. * @param[in] buf_size the size of buf
  2504. * @param[in] pix_fmt the number of the pixel format to print the corresponding info string, or
  2505. * a negative value to print the corresponding header.
  2506. * Meaningful values for obtaining a pixel format info vary from 0 to PIX_FMT_NB -1.
  2507. */
  2508. void avcodec_pix_fmt_string (char *buf, int buf_size, int pix_fmt);
  2509. #define FF_ALPHA_TRANSP 0x0001 /* image has some totally transparent pixels */
  2510. #define FF_ALPHA_SEMI_TRANSP 0x0002 /* image has some transparent pixels */
  2511. /**
  2512. * Tell if an image really has transparent alpha values.
  2513. * @return ored mask of FF_ALPHA_xxx constants
  2514. */
  2515. int img_get_alpha_info(const AVPicture *src,
  2516. int pix_fmt, int width, int height);
  2517. /* deinterlace a picture */
  2518. /* deinterlace - if not supported return -1 */
  2519. int avpicture_deinterlace(AVPicture *dst, const AVPicture *src,
  2520. int pix_fmt, int width, int height);
  2521. /* external high level API */
  2522. /**
  2523. * If c is NULL, returns the first registered codec,
  2524. * if c is non-NULL, returns the next registered codec after c,
  2525. * or NULL if c is the last one.
  2526. */
  2527. AVCodec *av_codec_next(AVCodec *c);
  2528. /**
  2529. * Returns the LIBAVCODEC_VERSION_INT constant.
  2530. */
  2531. unsigned avcodec_version(void);
  2532. /**
  2533. * Initializes libavcodec.
  2534. *
  2535. * @warning This function \e must be called before any other libavcodec
  2536. * function.
  2537. */
  2538. void avcodec_init(void);
  2539. #if LIBAVCODEC_VERSION_MAJOR < 53
  2540. /**
  2541. * @deprecated Deprecated in favor of avcodec_register().
  2542. */
  2543. attribute_deprecated void register_avcodec(AVCodec *codec);
  2544. #endif
  2545. /**
  2546. * Register the codec \p codec and initialize libavcodec.
  2547. *
  2548. * @see avcodec_init()
  2549. */
  2550. void avcodec_register(AVCodec *codec);
  2551. /**
  2552. * Finds a registered encoder with a matching codec ID.
  2553. *
  2554. * @param id CodecID of the requested encoder
  2555. * @return An encoder if one was found, NULL otherwise.
  2556. */
  2557. AVCodec *avcodec_find_encoder(enum CodecID id);
  2558. /**
  2559. * Finds a registered encoder with the specified name.
  2560. *
  2561. * @param name name of the requested encoder
  2562. * @return An encoder if one was found, NULL otherwise.
  2563. */
  2564. AVCodec *avcodec_find_encoder_by_name(const char *name);
  2565. /**
  2566. * Finds a registered decoder with a matching codec ID.
  2567. *
  2568. * @param id CodecID of the requested decoder
  2569. * @return A decoder if one was found, NULL otherwise.
  2570. */
  2571. AVCodec *avcodec_find_decoder(enum CodecID id);
  2572. /**
  2573. * Finds a registered decoder with the specified name.
  2574. *
  2575. * @param name name of the requested decoder
  2576. * @return A decoder if one was found, NULL otherwise.
  2577. */
  2578. AVCodec *avcodec_find_decoder_by_name(const char *name);
  2579. void avcodec_string(char *buf, int buf_size, AVCodecContext *enc, int encode);
  2580. /**
  2581. * Sets the fields of the given AVCodecContext to default values.
  2582. *
  2583. * @param s The AVCodecContext of which the fields should be set to default values.
  2584. */
  2585. void avcodec_get_context_defaults(AVCodecContext *s);
  2586. /** THIS FUNCTION IS NOT YET PART OF THE PUBLIC API!
  2587. * we WILL change its arguments and name a few times! */
  2588. void avcodec_get_context_defaults2(AVCodecContext *s, enum CodecType);
  2589. /**
  2590. * Allocates an AVCodecContext and sets its fields to default values. The
  2591. * resulting struct can be deallocated by simply calling av_free().
  2592. *
  2593. * @return An AVCodecContext filled with default values or NULL on failure.
  2594. * @see avcodec_get_context_defaults
  2595. */
  2596. AVCodecContext *avcodec_alloc_context(void);
  2597. /** THIS FUNCTION IS NOT YET PART OF THE PUBLIC API!
  2598. * we WILL change its arguments and name a few times! */
  2599. AVCodecContext *avcodec_alloc_context2(enum CodecType);
  2600. /**
  2601. * Sets the fields of the given AVFrame to default values.
  2602. *
  2603. * @param pic The AVFrame of which the fields should be set to default values.
  2604. */
  2605. void avcodec_get_frame_defaults(AVFrame *pic);
  2606. /**
  2607. * Allocates an AVFrame and sets its fields to default values. The resulting
  2608. * struct can be deallocated by simply calling av_free().
  2609. *
  2610. * @return An AVFrame filled with default values or NULL on failure.
  2611. * @see avcodec_get_frame_defaults
  2612. */
  2613. AVFrame *avcodec_alloc_frame(void);
  2614. int avcodec_default_get_buffer(AVCodecContext *s, AVFrame *pic);
  2615. void avcodec_default_release_buffer(AVCodecContext *s, AVFrame *pic);
  2616. int avcodec_default_reget_buffer(AVCodecContext *s, AVFrame *pic);
  2617. void avcodec_align_dimensions(AVCodecContext *s, int *width, int *height);
  2618. /**
  2619. * Checks if the given dimensions of a picture are valid, meaning that all
  2620. * bytes of the picture can be addressed with a signed int.
  2621. * @param[in] av_log_ctx NOTE(review): presumably the context handed to av_log() when reporting an error -- confirm.
  2622. * @param[in] w Width of the picture.
  2623. * @param[in] h Height of the picture.
  2624. * @return Zero if valid, a negative value if invalid.
  2625. */
  2626. int avcodec_check_dimensions(void *av_log_ctx, unsigned int w, unsigned int h);
  2627. enum PixelFormat avcodec_default_get_format(struct AVCodecContext *s, const enum PixelFormat * fmt);
  2628. int avcodec_thread_init(AVCodecContext *s, int thread_count);
  2629. void avcodec_thread_free(AVCodecContext *s);
  2630. int avcodec_thread_execute(AVCodecContext *s, int (*func)(AVCodecContext *c2, void *arg2),void *arg, int *ret, int count, int size);
  2631. int avcodec_default_execute(AVCodecContext *c, int (*func)(AVCodecContext *c2, void *arg2),void *arg, int *ret, int count, int size);
  2632. //FIXME func typedef
  2633. /**
  2634. * Initializes the AVCodecContext to use the given AVCodec. Prior to using this
  2635. * function the context has to be allocated.
  2636. *
  2637. * The functions avcodec_find_decoder_by_name(), avcodec_find_encoder_by_name(),
  2638. * avcodec_find_decoder() and avcodec_find_encoder() provide an easy way for
  2639. * retrieving a codec.
  2640. *
  2641. * @warning This function is not thread safe!
  2642. *
  2643. * @code
  2644. * avcodec_register_all();
  2645. * codec = avcodec_find_decoder(CODEC_ID_H264);
  2646. * if (!codec)
  2647. * exit(1);
  2648. *
  2649. * context = avcodec_alloc_context();
  2650. *
  2651. * if (avcodec_open(context, codec) < 0)
  2652. * exit(1);
  2653. * @endcode
  2654. *
  2655. * @param avctx The context which will be set up to use the given codec.
  2656. * @param codec The codec to use within the context.
  2657. * @return zero on success, a negative value on error
  2658. * @see avcodec_alloc_context, avcodec_find_decoder, avcodec_find_encoder
  2659. */
  2660. int avcodec_open(AVCodecContext *avctx, AVCodec *codec);
  2661. /**
  2662. * Decodes an audio frame from \p buf into \p samples.
  2663. * The avcodec_decode_audio2() function decodes an audio frame from the input
  2664. * buffer \p buf of size \p buf_size. To decode it, it makes use of the
  2665. * audio codec which was coupled with \p avctx using avcodec_open(). The
  2666. * resulting decoded frame is stored in output buffer \p samples. If no frame
  2667. * could be decompressed, \p frame_size_ptr is zero. Otherwise, it is the
  2668. * decompressed frame size in \e bytes.
  2669. *
  2670. * @warning You \e must set \p frame_size_ptr to the allocated size of the
  2671. * output buffer before calling avcodec_decode_audio2().
  2672. *
  2673. * @warning The input buffer must be \c FF_INPUT_BUFFER_PADDING_SIZE larger than
  2674. * the actual read bytes because some optimized bitstream readers read 32 or 64
  2675. * bits at once and could read over the end.
  2676. *
  2677. * @warning The end of the input buffer \p buf should be set to 0 to ensure that
  2678. * no overreading happens for damaged MPEG streams.
  2679. *
  2680. * @note You might have to align the input buffer \p buf and output buffer \p
  2681. * samples. The alignment requirements depend on the CPU: On some CPUs it isn't
  2682. * necessary at all, on others it won't work at all if not aligned and on others
  2683. * it will work but it will have an impact on performance. In practice, the
  2684. * bitstream should have 4 byte alignment at minimum and all sample data should
  2685. * be 16 byte aligned unless the CPU doesn't need it (AltiVec and SSE do). If
  2686. * the linesize is not a multiple of 16 then there's no sense in aligning the
  2687. * start of the buffer to 16.
  2688. *
  2689. * @param avctx the codec context
  2690. * @param[out] samples the output buffer
  2691. * @param[in,out] frame_size_ptr the output buffer size in bytes
  2692. * @param[in] buf the input buffer
  2693. * @param[in] buf_size the input buffer size in bytes
  2694. * @return On error a negative value is returned, otherwise the number of bytes
  2695. * used or zero if no frame could be decompressed.
  2696. */
  2697. int avcodec_decode_audio2(AVCodecContext *avctx, int16_t *samples,
  2698. int *frame_size_ptr,
  2699. const uint8_t *buf, int buf_size);
  2700. /**
  2701. * Decodes a video frame from \p buf into \p picture.
  2702. * The avcodec_decode_video() function decodes a video frame from the input
  2703. * buffer \p buf of size \p buf_size. To decode it, it makes use of the
  2704. * video codec which was coupled with \p avctx using avcodec_open(). The
  2705. * resulting decoded frame is stored in \p picture.
  2706. *
  2707. * @warning The input buffer must be \c FF_INPUT_BUFFER_PADDING_SIZE larger than
  2708. * the actual read bytes because some optimized bitstream readers read 32 or 64
  2709. * bits at once and could read over the end.
  2710. *
  2711. * @warning The end of the input buffer \p buf should be set to 0 to ensure that
  2712. * no overreading happens for damaged MPEG streams.
  2713. *
  2714. * @note You might have to align the input buffer \p buf and the output \p
  2715. * picture. The alignment requirements depend on the CPU: on some CPUs it isn't
  2716. * necessary at all, on others it won't work at all if not aligned and on others
  2717. * it will work but it will have an impact on performance. In practice, the
  2718. * bitstream should have 4 byte alignment at minimum and all sample data should
  2719. * be 16 byte aligned unless the CPU doesn't need it (AltiVec and SSE do). If
  2720. * the linesize is not a multiple of 16 then there's no sense in aligning the
  2721. * start of the buffer to 16.
  2722. *
  2723. * @note Some codecs have a delay between input and output; these need to be
  2724. * fed with buf=NULL, buf_size=0 at the end to return the remaining frames.
  2725. *
  2726. * @param avctx the codec context
  2727. * @param[out] picture The AVFrame in which the decoded video frame will be stored.
  2728. * @param[in] buf the input buffer
  2729. * @param[in] buf_size the size of the input buffer in bytes
  2730. * @param[in,out] got_picture_ptr Zero if no frame could be decompressed, otherwise, it is nonzero.
  2731. * @return On error a negative value is returned, otherwise the number of bytes
  2732. * used or zero if no frame could be decompressed.
  2733. */
  2734. int avcodec_decode_video(AVCodecContext *avctx, AVFrame *picture,
  2735. int *got_picture_ptr,
  2736. const uint8_t *buf, int buf_size);
  2737. /** Decodes a subtitle message. Returns -1 on error, otherwise the
  2738. * number of bytes used. If no subtitle could be decompressed,
  2739. * *got_sub_ptr is zero. Otherwise, the subtitle is stored in *sub. */
  2740. int avcodec_decode_subtitle(AVCodecContext *avctx, AVSubtitle *sub,
  2741. int *got_sub_ptr,
  2742. const uint8_t *buf, int buf_size);
  2743. int avcodec_parse_frame(AVCodecContext *avctx, uint8_t **pdata,
  2744. int *data_size_ptr,
  2745. uint8_t *buf, int buf_size);
  2746. /**
  2747. * Encodes an audio frame from \p samples into \p buf.
  2748. * The avcodec_encode_audio() function encodes an audio frame from the input
  2749. * buffer \p samples. To encode it, it makes use of the audio codec which was
  2750. * coupled with \p avctx using avcodec_open(). The resulting encoded frame is
  2751. * stored in output buffer \p buf.
  2752. *
  2753. * @note The output buffer should be at least \c FF_MIN_BUFFER_SIZE bytes large.
  2754. *
  2755. * @param avctx the codec context
  2756. * @param[out] buf the output buffer
  2757. * @param[in] buf_size the output buffer size
  2758. * @param[in] samples the input buffer containing the samples
  2759. * The number of samples read from this buffer is frame_size*channels,
  2760. * both of which are defined in \p avctx.
  2761. * For PCM audio the number of samples read from \p samples is equal to
  2762. * \p buf_size * input_sample_size / output_sample_size.
  2763. * @return On error a negative value is returned, on success zero or the number
  2764. * of bytes used to encode the data read from the input buffer.
  2765. */
  2766. int avcodec_encode_audio(AVCodecContext *avctx, uint8_t *buf, int buf_size,
  2767. const short *samples);
  2768. /**
  2769. * Encodes a video frame from \p pict into \p buf.
  2770. * The avcodec_encode_video() function encodes a video frame from the input
  2771. * \p pict. To encode it, it makes use of the video codec which was coupled with
  2772. * \p avctx using avcodec_open(). The resulting encoded bytes representing the
  2773. * frame are stored in the output buffer \p buf. The input picture should be
  2774. * stored using a specific format, namely \c avctx.pix_fmt.
  2775. *
  2776. * @param avctx the codec context
  2777. * @param[out] buf the output buffer for the bitstream of encoded frame
  2778. * @param[in] buf_size the size of the output buffer in bytes
  2779. * @param[in] pict the input picture to encode
  2780. * @return On error a negative value is returned, on success zero or the number
  2781. * of bytes used from the output buffer.
  2782. */
  2783. int avcodec_encode_video(AVCodecContext *avctx, uint8_t *buf, int buf_size,
  2784. const AVFrame *pict);
  2785. int avcodec_encode_subtitle(AVCodecContext *avctx, uint8_t *buf, int buf_size,
  2786. const AVSubtitle *sub);
  2787. int avcodec_close(AVCodecContext *avctx);
  2788. /**
  2789. * Registers all the codecs, parsers and bitstream filters which were enabled at
  2790. * configuration time. If you do not call this function you can select exactly
  2791. * which formats you want to support, by using the individual registration
  2792. * functions.
  2793. *
  2794. * @see avcodec_register
  2795. * @see av_register_codec_parser
  2796. * @see av_register_bitstream_filter
  2797. */
  2798. void avcodec_register_all(void);
  2799. /**
  2800. * Flushes buffers; should be called when seeking or when switching to a different stream.
  2801. */
  2802. void avcodec_flush_buffers(AVCodecContext *avctx);
  2803. void avcodec_default_free_buffers(AVCodecContext *s);
  2804. /* misc useful functions */
  2805. /**
  2806. * Returns a single letter to describe the given picture type \p pict_type.
  2807. *
  2808. * @param[in] pict_type the picture type
  2809. * @return A single character representing the picture type.
  2810. */
  2811. char av_get_pict_type_char(int pict_type);
  2812. /**
  2813. * Returns codec bits per sample.
  2814. *
  2815. * @param[in] codec_id the codec
  2816. * @return Number of bits per sample or zero if unknown for the given codec.
  2817. */
  2818. int av_get_bits_per_sample(enum CodecID codec_id);
  2819. /**
  2820. * Returns sample format bits per sample.
  2821. *
  2822. * @param[in] sample_fmt the sample format
  2823. * @return Number of bits per sample or zero if unknown for the given sample format.
  2824. */
  2825. int av_get_bits_per_sample_format(enum SampleFormat sample_fmt);
  2826. /* frame parsing */
  2827. typedef struct AVCodecParserContext {
  2828. void *priv_data; ///< NOTE(review): presumably parser-private state sized by AVCodecParser.priv_data_size -- confirm
  2829. struct AVCodecParser *parser; ///< NOTE(review): presumably the parser driving this context -- confirm
  2830. int64_t frame_offset; ///< offset of the current frame
  2831. int64_t cur_offset; /* current offset
  2832. (incremented by each av_parser_parse()) */
  2833. int64_t next_frame_offset; ///< offset of the next frame
  2834. /* video info */
  2835. int pict_type; /* XXX: Put it back in AVCodecContext. */
  2836. /**
  2837. * This field is used for proper frame duration computation in lavf.
  2838. * It signals how much longer the frame duration of the current frame
  2839. * is compared to the normal frame duration.
  2840. *
  2841. * frame_duration = (1 + repeat_pict) * time_base
  2842. *
  2843. * It is used by codecs like H.264 to display telecined material.
  2844. */
  2845. int repeat_pict; /* XXX: Put it back in AVCodecContext. */
  2846. int64_t pts; ///< pts of the current frame
  2847. int64_t dts; ///< dts of the current frame
  2848. /* private data */
  2849. int64_t last_pts;
  2850. int64_t last_dts;
  2851. int fetch_timestamp;
  2852. #define AV_PARSER_PTS_NB 4 /**< number of entries in each cur_frame_* array below */
  2853. int cur_frame_start_index; ///< NOTE(review): presumably an index into the cur_frame_* arrays -- confirm
  2854. int64_t cur_frame_offset[AV_PARSER_PTS_NB];
  2855. int64_t cur_frame_pts[AV_PARSER_PTS_NB];
  2856. int64_t cur_frame_dts[AV_PARSER_PTS_NB];
  2857. int flags; ///< NOTE(review): presumably a combination of PARSER_FLAG_* values -- confirm
  2858. #define PARSER_FLAG_COMPLETE_FRAMES 0x0001
  2859. int64_t offset; ///< byte offset from starting packet start
  2860. int64_t cur_frame_end[AV_PARSER_PTS_NB];
  2861. /**
  2862. * Set by parser to 1 for key frames and 0 for non-key frames.
  2863. * It is initialized to -1, so if the parser doesn't set this flag,
  2864. * old-style fallback using FF_I_TYPE picture type as key frames
  2865. * will be used.
  2866. */
  2867. int key_frame;
  2868. /**
  2869. * Time difference in stream time base units from the pts of this
  2870. * packet to the point at which the output from the decoder has converged
  2871. * independent from the availability of previous frames. That is, the
  2872. * frames are virtually identical no matter if decoding started from
  2873. * the very first frame or from this keyframe.
  2874. * Is AV_NOPTS_VALUE if unknown.
  2875. * This field is not the display duration of the current frame.
  2876. *
  2877. * The purpose of this field is to allow seeking in streams that have no
  2878. * keyframes in the conventional sense. It corresponds to the
  2879. * recovery point SEI in H.264 and match_time_delta in NUT. It is also
  2880. * essential for some types of subtitle streams to ensure that all
  2881. * subtitles are correctly displayed after seeking.
  2882. */
  2883. int64_t convergence_duration;
  2884. // Timestamp generation support:
  2885. /**
  2886. * Synchronization point for start of timestamp generation.
  2887. *
  2888. * Set to >0 for sync point, 0 for no sync point and <0 for undefined
  2889. * (default).
  2890. *
  2891. * For example, this corresponds to presence of H.264 buffering period
  2892. * SEI message.
  2893. */
  2894. int dts_sync_point;
  2895. /**
  2896. * Offset of the current timestamp against last timestamp sync point in
  2897. * units of AVCodecContext.time_base.
  2898. *
  2899. * Set to INT_MIN when dts_sync_point is unused. Otherwise, it must
  2900. * contain a valid timestamp offset.
  2901. *
  2902. * Note that the timestamp of a sync point usually has a nonzero
  2903. * dts_ref_dts_delta, which refers to the previous sync point. Offset of
  2904. * the next frame after timestamp sync point will usually be 1.
  2905. *
  2906. * For example, this corresponds to H.264 cpb_removal_delay.
  2907. */
  2908. int dts_ref_dts_delta;
  2909. /**
  2910. * Presentation delay of current frame in units of AVCodecContext.time_base.
  2911. *
  2912. * Set to INT_MIN when dts_sync_point is unused. Otherwise, it must
  2913. * contain a valid non-negative timestamp delta (presentation time of a frame
  2914. * must not lie in the past).
  2915. *
  2916. * This delay represents the difference between decoding and presentation
  2917. * time of the frame.
  2918. *
  2919. * For example, this corresponds to H.264 dpb_output_delay.
  2920. */
  2921. int pts_dts_delta;
  2922. /**
  2923. * Position of the packet in file.
  2924. *
  2925. * Analogous to cur_frame_pts/dts
  2926. */
  2927. int64_t cur_frame_pos[AV_PARSER_PTS_NB];
  2928. /**
  2929. * Byte position of currently parsed frame in stream.
  2930. */
  2931. int64_t pos;
  2932. /**
  2933. * Previous frame byte position.
  2934. */
  2935. int64_t last_pos;
  2936. } AVCodecParserContext;
  2937. typedef struct AVCodecParser {
  2938. int codec_ids[5]; /* several codec IDs are permitted (the array has 5 slots) */
  2939. int priv_data_size; ///< NOTE(review): presumably the size of AVCodecParserContext.priv_data -- confirm
  2940. int (*parser_init)(AVCodecParserContext *s); ///< NOTE(review): presumably invoked from av_parser_init() -- confirm
  2941. int (*parser_parse)(AVCodecParserContext *s,
  2942. AVCodecContext *avctx,
  2943. const uint8_t **poutbuf, int *poutbuf_size, /* poutbuf is const-qualified here, unlike in av_parser_parse()/av_parser_parse2() */
  2944. const uint8_t *buf, int buf_size);
  2945. void (*parser_close)(AVCodecParserContext *s); ///< NOTE(review): presumably invoked from av_parser_close() -- confirm
  2946. int (*split)(AVCodecContext *avctx, const uint8_t *buf, int buf_size);
  2947. struct AVCodecParser *next; ///< NOTE(review): presumably links the registered parsers; see av_parser_next() -- confirm
  2948. } AVCodecParser;
  2949. AVCodecParser *av_parser_next(AVCodecParser *c);
  2950. void av_register_codec_parser(AVCodecParser *parser);
  2951. AVCodecParserContext *av_parser_init(int codec_id);
  2952. #if LIBAVCODEC_VERSION_MAJOR < 53 /* only declared while the major version is below 53 */
  2953. attribute_deprecated /* NOTE(review): presumably superseded by av_parser_parse2(), which adds a pos argument -- confirm */
  2954. int av_parser_parse(AVCodecParserContext *s,
  2955. AVCodecContext *avctx,
  2956. uint8_t **poutbuf, int *poutbuf_size,
  2957. const uint8_t *buf, int buf_size,
  2958. int64_t pts, int64_t dts);
  2959. #endif
  2960. /**
  2961. * Parses a packet.
  2962. *
  2963. * @param s parser context.
  2964. * @param avctx codec context.
  2965. * @param poutbuf set to pointer to parsed buffer or NULL if not yet finished.
  2966. * @param poutbuf_size set to size of parsed buffer or zero if not yet finished.
  2967. * @param buf input buffer.
  2968. * @param buf_size input length, to signal EOF, this should be 0 (so that the last frame can be output).
  2969. * @param pts input presentation timestamp.
  2970. * @param dts input decoding timestamp.
  2971. * @param pos input byte position in stream.
  2972. * @return the number of bytes of the input bitstream used.
  2973. *
  2974. * Example:
  2975. * @code
  2976. * while(in_len){
  2977. * len = av_parser_parse2(myparser, avctx, &data, &size,
  2978. * in_data, in_len,
  2979. * pts, dts, pos);
  2980. * in_data += len;
  2981. * in_len -= len;
  2982. *
  2983. * if(size)
  2984. * decode_frame(data, size);
  2985. * }
  2986. * @endcode
  2987. */
  2988. int av_parser_parse2(AVCodecParserContext *s,
  2989. AVCodecContext *avctx,
  2990. uint8_t **poutbuf, int *poutbuf_size,
  2991. const uint8_t *buf, int buf_size,
  2992. int64_t pts, int64_t dts,
  2993. int64_t pos);
  2994. int av_parser_change(AVCodecParserContext *s,
  2995. AVCodecContext *avctx,
  2996. uint8_t **poutbuf, int *poutbuf_size,
  2997. const uint8_t *buf, int buf_size, int keyframe);
  2998. void av_parser_close(AVCodecParserContext *s);
  2999. typedef struct AVBitStreamFilterContext {
  3000. void *priv_data; ///< NOTE(review): presumably filter-private state sized by AVBitStreamFilter.priv_data_size -- confirm
  3001. struct AVBitStreamFilter *filter; ///< NOTE(review): presumably the filter this context belongs to -- confirm
  3002. AVCodecParserContext *parser;
  3003. struct AVBitStreamFilterContext *next; ///< NOTE(review): presumably chains several filter contexts -- confirm
  3004. } AVBitStreamFilterContext;
  3005. typedef struct AVBitStreamFilter {
  3006. const char *name; ///< NOTE(review): presumably the name matched by av_bitstream_filter_init() -- confirm
  3007. int priv_data_size; ///< NOTE(review): presumably the size of AVBitStreamFilterContext.priv_data -- confirm
  3008. int (*filter)(AVBitStreamFilterContext *bsfc, /* same parameter list as av_bitstream_filter_filter() */
  3009. AVCodecContext *avctx, const char *args,
  3010. uint8_t **poutbuf, int *poutbuf_size,
  3011. const uint8_t *buf, int buf_size, int keyframe);
  3012. void (*close)(AVBitStreamFilterContext *bsfc); ///< NOTE(review): presumably invoked from av_bitstream_filter_close() -- confirm
  3013. struct AVBitStreamFilter *next; ///< NOTE(review): presumably links the registered filters; see av_bitstream_filter_next() -- confirm
  3014. } AVBitStreamFilter;
  3015. void av_register_bitstream_filter(AVBitStreamFilter *bsf);
  3016. AVBitStreamFilterContext *av_bitstream_filter_init(const char *name);
  3017. int av_bitstream_filter_filter(AVBitStreamFilterContext *bsfc,
  3018. AVCodecContext *avctx, const char *args,
  3019. uint8_t **poutbuf, int *poutbuf_size,
  3020. const uint8_t *buf, int buf_size, int keyframe);
  3021. void av_bitstream_filter_close(AVBitStreamFilterContext *bsf);
  3022. AVBitStreamFilter *av_bitstream_filter_next(AVBitStreamFilter *f);
  3023. /* memory */
  3024. /**
  3025. * Reallocates the given block if it is not large enough, otherwise it
  3026. * does nothing.
  3027. *
  3028. * @see av_realloc
  3029. */
  3030. void *av_fast_realloc(void *ptr, unsigned int *size, unsigned int min_size);
  3031. /**
  3032. * Copies image 'src' to 'dst'.
  3033. */
  3034. void av_picture_copy(AVPicture *dst, const AVPicture *src,
  3035. int pix_fmt, int width, int height);
  3036. /**
  3037. * Crops the image at its top and left side.
  3038. */
  3039. int av_picture_crop(AVPicture *dst, const AVPicture *src,
  3040. int pix_fmt, int top_band, int left_band);
  3041. /**
  3042. * Pads the image.
  3043. */
  3044. int av_picture_pad(AVPicture *dst, const AVPicture *src, int height, int width, int pix_fmt,
  3045. int padtop, int padbottom, int padleft, int padright, int *color);
  3046. unsigned int av_xiphlacing(unsigned char *s, unsigned int v);
  3047. /**
  3048. * Parses \p str and puts in \p width_ptr and \p height_ptr the detected values.
  3049. *
  3050. * @return 0 in case of a successful parsing, a negative value otherwise
  3051. * @param[in] str the string to parse: it has to be a string in the format
  3052. * <width>x<height> or a valid video frame size abbreviation.
  3053. * @param[in,out] width_ptr pointer to the variable which will contain the detected
  3054. * frame width value
  3055. * @param[in,out] height_ptr pointer to the variable which will contain the detected
  3056. * frame height value
  3057. */
  3058. int av_parse_video_frame_size(int *width_ptr, int *height_ptr, const char *str);
  3059. /**
  3060. * Parses \p str and puts in \p frame_rate the detected values.
  3061. *
  3062. * @return 0 in case of a successful parsing, a negative value otherwise
  3063. * @param[in] str the string to parse: it has to be a string in the format
  3064. * <frame_rate_num>/<frame_rate_den>, a float number or a valid video rate abbreviation
  3065. * @param[in,out] frame_rate pointer to the AVRational which will contain the detected
  3066. * frame rate
  3067. */
  3068. int av_parse_video_frame_rate(AVRational *frame_rate, const char *str);
  3069. /* error handling */
  3070. #if EINVAL > 0 /* E* codes are positive here, so the library negates them */
  3071. #define AVERROR(e) (-(e)) /**< Returns a negative error code from a POSIX error code, to return from library functions. */
  3072. #define AVUNERROR(e) (-(e)) /**< Returns a POSIX error code from a library function error return value. */
  3073. #else
  3074. /* Some platforms have E* and errno already negated, so both macros pass the value through unchanged. */
  3075. #define AVERROR(e) (e)
  3076. #define AVUNERROR(e) (e)
  3077. #endif
  3078. #define AVERROR_UNKNOWN AVERROR(EINVAL) /**< Unknown error (same value as AVERROR_INVALIDDATA). */
  3079. #define AVERROR_IO AVERROR(EIO) /**< I/O error. */
  3080. #define AVERROR_NUMEXPECTED AVERROR(EDOM) /**< Number syntax expected in filename. */
  3081. #define AVERROR_INVALIDDATA AVERROR(EINVAL) /**< Invalid data found (same value as AVERROR_UNKNOWN). */
  3082. #define AVERROR_NOMEM AVERROR(ENOMEM) /**< Not enough memory. */
  3083. #define AVERROR_NOFMT AVERROR(EILSEQ) /**< Unknown format. */
  3084. #define AVERROR_NOTSUPP AVERROR(ENOSYS) /**< Operation not supported. */
  3085. #define AVERROR_NOENT AVERROR(ENOENT) /**< No such file or directory. */
  3086. #define AVERROR_EOF AVERROR(EPIPE) /**< End of file. */
  3087. #define AVERROR_PATCHWELCOME (-MKTAG('P','A','W','E')) /**< Not yet implemented in FFmpeg. Patches welcome. Parenthesized so the expansion is always a single operand. */
  3088. /**
  3089. * Registers the hardware accelerator \p hwaccel.
  3090. */
  3091. void av_register_hwaccel(AVHWAccel *hwaccel);
  3092. /**
  3093. * If hwaccel is NULL, returns the first registered hardware accelerator,
  3094. * if hwaccel is non-NULL, returns the next registered hardware accelerator
  3095. * after hwaccel, or NULL if hwaccel is the last one.
  3096. */
  3097. AVHWAccel *av_hwaccel_next(AVHWAccel *hwaccel);
  3098. #endif /* AVCODEC_AVCODEC_H */