You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

574 lines
19KB

  1. #ifndef AVCODEC_H
  2. #define AVCODEC_H
  3. #include "common.h"
  /* library version: numeric form and the matching dotted string */
  #define LIBAVCODEC_VERSION_INT  0x000406
  #define LIBAVCODEC_VERSION      "0.4.6"
  /* library build number: numeric form and the matching string */
  #define LIBAVCODEC_BUILD        4618
  #define LIBAVCODEC_BUILD_STR    "4618"
  /*
   * Codec identifiers.
   * No enumerator has an explicit value, so each one gets its value from
   * its position in the list (CODEC_ID_NONE is 0). Inserting or reordering
   * entries therefore changes the numeric value of everything after them.
   */
  enum CodecID {
      CODEC_ID_NONE,
      CODEC_ID_MPEG1VIDEO,
      CODEC_ID_H263,
      CODEC_ID_RV10,
      CODEC_ID_MP2,
      CODEC_ID_MP3LAME,
      CODEC_ID_AC3,
      CODEC_ID_MJPEG,
      CODEC_ID_MPEG4,
      CODEC_ID_RAWVIDEO,
      CODEC_ID_MSMPEG4V1,
      CODEC_ID_MSMPEG4V2,
      CODEC_ID_MSMPEG4V3,
      CODEC_ID_WMV1,
      CODEC_ID_WMV2,
      CODEC_ID_H263P,
      CODEC_ID_H263I,
      CODEC_ID_SVQ1,

      /* various pcm "codecs" */
      CODEC_ID_PCM_S16LE,
      CODEC_ID_PCM_S16BE,
      CODEC_ID_PCM_U16LE,
      CODEC_ID_PCM_U16BE,
      CODEC_ID_PCM_S8,
      CODEC_ID_PCM_U8,
      CODEC_ID_PCM_MULAW,
      CODEC_ID_PCM_ALAW,

      /* various adpcm codecs */
      CODEC_ID_ADPCM_IMA_QT,
      CODEC_ID_ADPCM_IMA_WAV,
      CODEC_ID_ADPCM_MS
  };

  /* the unversioned MSMPEG4 name is an alias for version 3 */
  #define CODEC_ID_MSMPEG4 CODEC_ID_MSMPEG4V3
  /* Kind of stream a codec handles; UNKNOWN is the only negative value. */
  enum CodecType {
      CODEC_TYPE_UNKNOWN = -1,
      CODEC_TYPE_VIDEO,          /* 0 */
      CODEC_TYPE_AUDIO           /* 1 */
  };
  /*
   * Pixel formats. PIX_FMT_ANY is -1; the concrete formats are numbered
   * from 0 in declaration order.
   */
  enum PixelFormat {
      PIX_FMT_ANY = -1,
      PIX_FMT_YUV420P,    /* 0 */
      PIX_FMT_YUV422,     /* 1 */
      PIX_FMT_RGB24,      /* 2 */
      PIX_FMT_BGR24,      /* 3 */
      PIX_FMT_YUV422P,    /* 4 */
      PIX_FMT_YUV444P,    /* 5 */
      PIX_FMT_RGBA32,     /* 6 */
      PIX_FMT_BGRA32,     /* 7 */
      PIX_FMT_YUV410P     /* 8 */
  };
  /*
   * Audio sample formats.
   * Currently unused; may be used if 24/32 bit samples are ever supported.
   */
  enum SampleFormat {
      SAMPLE_FMT_S16 = 0    /* signed 16 bits */
  };

  /* maximum size of an audio frame, in bytes */
  #define AVCODEC_MAX_AUDIO_FRAME_SIZE 18432
  /* Motion estimation type (EPZS by default). Numbering starts at 1. */
  enum Motion_Est_ID {
      ME_ZERO = 1,
      ME_FULL,      /* 2 */
      ME_LOG,       /* 3 */
      ME_PHODS,     /* 4 */
      ME_EPZS,      /* 5 */
      ME_X1         /* 6 */
  };

  /* kept only for ME compatibility with old applications */
  extern int motion_estimation_method;

  /*
   * The ME algorithms sorted by quality.
   * Being static in a header, every translation unit that includes this
   * file gets its own private copy of the table.
   */
  static const int Motion_Est_QTab[] = {
      ME_ZERO,
      ME_PHODS,
      ME_LOG,
      ME_X1,
      ME_EPZS,
      ME_FULL
  };
  /* NOTE(review): presumably the largest supported max_b_frames value -- confirm */
  #define FF_MAX_B_FRAMES 4

  /*
   * Encoding support flags.
   * Note: not everything is supported yet.
   */
  /* high quality (non real time) encoding */
  #define CODEC_FLAG_HQ               0x0001
  /* use fixed qscale */
  #define CODEC_FLAG_QSCALE           0x0002
  /* 4 MV per MB allowed */
  #define CODEC_FLAG_4MV              0x0004
  /* use qpel MC */
  #define CODEC_FLAG_QPEL             0x0010
  /* use GMC */
  #define CODEC_FLAG_GMC              0x0020
  /* fixed I/P frame type, taken from avctx->key_frame */
  #define CODEC_FLAG_TYPE             0x0040
  /* use data partitioning */
  #define CODEC_FLAG_PART             0x0080
  /*
   * The parent program guarantees that, for streams containing B frames,
   * the input is not written to for at least s->max_b_frames+1 frames.
   * If this flag is not set, then the input will be copied.
   */
  #define CODEC_FLAG_INPUT_PRESERVED  0x0100
  /* use internal 2-pass rate control in first pass mode */
  #define CODEC_FLAG_PASS1            0x0200
  /* use internal 2-pass rate control in second pass mode */
  #define CODEC_FLAG_PASS2            0x0400
  /* use external huffman table (for mjpeg) */
  #define CODEC_FLAG_EXTERN_HUFF      0x1000
  /* only decode/encode grayscale */
  #define CODEC_FLAG_GRAY             0x2000
  /* do not draw edges */
  #define CODEC_FLAG_EMU_EDGE         0x4000
  /* dr1 */
  #define CODEC_FLAG_DR1              0x8000

  /* Codec capabilities. */
  /* decoder can use the draw_horiz_band callback */
  #define CODEC_CAP_DRAW_HORIZ_BAND   0x0001
  /* direct rendering method 1 */
  #define CODEC_CAP_DR1               0x0002
  /* if the 'parse_only' field is true, then avcodec_parse_frame() can be used */
  #define CODEC_CAP_PARSE_ONLY        0x0004

  /* frame rates are expressed as frames per second multiplied by this base */
  #define FRAME_RATE_BASE 10000
  106. typedef struct AVCodecContext {
  107. int bit_rate;
  108. int bit_rate_tolerance; /* amount of +- bits (>0)*/
  109. int flags;
  110. int sub_id; /* some codecs needs additionnal format info. It is
  111. stored there */
  112. int me_method; /* ME algorithm used for video coding */
  113. /* extra data from parent application to codec, e.g. huffman table
  114. for mjpeg */
  115. /* the parent should allocate and free this buffer */
  116. void *extradata;
  117. int extradata_size;
  118. /* video only */
  119. int frame_rate; /* frames per sec multiplied by FRAME_RATE_BASE */
  120. int width, height;
  121. int aspect_ratio_info;
  122. #define FF_ASPECT_SQUARE 1
  123. #define FF_ASPECT_4_3_625 2
  124. #define FF_ASPECT_4_3_525 3
  125. #define FF_ASPECT_16_9_625 4
  126. #define FF_ASPECT_16_9_525 5
  127. int gop_size; /* 0 = intra only */
  128. enum PixelFormat pix_fmt; /* pixel format, see PIX_FMT_xxx */
  129. int repeat_pict; /* when decoding, this signal how much the picture */
  130. /* must be delayed. */
  131. /* extra_delay = (repeat_pict / 2) * (1/fps) */
  132. /* if non NULL, 'draw_horiz_band' is called by the libavcodec
  133. decoder to draw an horizontal band. It improve cache usage. Not
  134. all codecs can do that. You must check the codec capabilities
  135. before */
  136. void (*draw_horiz_band)(struct AVCodecContext *s,
  137. UINT8 **src_ptr, int linesize,
  138. int y, int width, int height);
  139. /* audio only */
  140. int sample_rate; /* samples per sec */
  141. int channels;
  142. int sample_fmt; /* sample format, currenly unused */
  143. /* the following data should not be initialized */
  144. int frame_size; /* in samples, initialized when calling 'init' */
  145. int frame_number; /* audio or video frame number */
  146. int real_pict_num; /* returns the real picture number of
  147. previous encoded frame */
  148. int key_frame; /* true if the previous compressed frame was
  149. a key frame (intra, or seekable) */
  150. int pict_type; /* picture type of the previous
  151. encoded frame */
  152. /* FIXME: these should have FF_ */
  153. #define I_TYPE 1 // Intra
  154. #define P_TYPE 2 // Predicted
  155. #define B_TYPE 3 // Bi-dir predicted
  156. #define S_TYPE 4 // S(GMC)-VOP MPEG4
  157. int delay; /* number of frames the decoded output
  158. will be delayed relative to the encoded input */
  159. uint8_t *mbskip_table; /* =1 if MB didnt change, is only valid for I/P frames
  160. stride= mb_width = (width+15)>>4 */
  161. /* encoding parameters */
  162. int quality; /* quality of the previous encoded frame
  163. (between 1 (good) and 31 (bad))
  164. this is allso used to set the quality in vbr mode
  165. and the per frame quality in CODEC_FLAG_TYPE (second pass mode) */
  166. float qcompress; /* amount of qscale change between easy & hard scenes (0.0-1.0)*/
  167. float qblur; /* amount of qscale smoothing over time (0.0-1.0) */
  168. int qmin; /* min qscale */
  169. int qmax; /* max qscale */
  170. int max_qdiff; /* max qscale difference between frames */
  171. int max_b_frames; /* maximum b frames, the output will be delayed by max_b_frames+1 relative to the input */
  172. float b_quant_factor;/* qscale factor between ips and b frames */
  173. int rc_strategy;
  174. int b_frame_strategy;
  175. int hurry_up; /* when set to 1 during decoding, b frames will be skiped
  176. when set to 2 idct/dequant will be skipped too */
  177. struct AVCodec *codec;
  178. void *priv_data;
  179. /* The following data is for RTP friendly coding */
  180. /* By now only H.263/H.263+/MPEG4 coder honours this */
  181. int rtp_mode; /* 1 for activate RTP friendly-mode */
  182. /* highers numbers represent more error-prone */
  183. /* enviroments, by now just "1" exist */
  184. int rtp_payload_size; /* The size of the RTP payload, the coder will */
  185. /* do it's best to deliver a chunk with size */
  186. /* below rtp_payload_size, the chunk will start */
  187. /* with a start code on some codecs like H.263 */
  188. /* This doesn't take account of any particular */
  189. /* headers inside the transmited RTP payload */
  190. /* The RTP callcack: This function is called */
  191. /* every time the encoder as a packet to send */
  192. /* Depends on the encoder if the data starts */
  193. /* with a Start Code (it should) H.263 does */
  194. void (*rtp_callback)(void *data, int size, int packet_number);
  195. /* These are for PSNR calculation, if you set get_psnr to 1 */
  196. /* after encoding you will have the PSNR on psnr_y/cb/cr */
  197. int get_psnr;
  198. float psnr_y;
  199. float psnr_cb;
  200. float psnr_cr;
  201. /* statistics, used for 2-pass encoding */
  202. int mv_bits;
  203. int header_bits;
  204. int i_tex_bits;
  205. int p_tex_bits;
  206. int i_count;
  207. int p_count;
  208. int skip_count;
  209. int misc_bits; // cbp, mb_type
  210. int frame_bits;
  211. /* the following fields are ignored */
  212. void *opaque; /* can be used to carry app specific stuff */
  213. char codec_name[32];
  214. enum CodecType codec_type; /* see CODEC_TYPE_xxx */
  215. enum CodecID codec_id; /* see CODEC_ID_xxx */
  216. unsigned int codec_tag; /* codec tag, only used if unknown codec */
  217. int workaround_bugs; /* workaround bugs in encoders which cannot be detected automatically */
  218. int luma_elim_threshold;
  219. int chroma_elim_threshold;
  220. int strict_std_compliance; /* strictly follow the std (MPEG4, ...) */
  221. float b_quant_offset;/* qscale offset between ips and b frames, not implemented yet */
  222. int error_resilience;
  223. #ifndef MBC
  224. #define MBC 128
  225. #define MBR 96
  226. #endif
  227. #define QP_TYPE int //FIXME note xxx this might be changed to int8_t
  228. QP_TYPE *quant_store; /* field for communicating with external postprocessing */
  229. unsigned qstride;
  230. uint8_t *dr_buffer[3];
  231. int dr_stride;
  232. void *dr_opaque_frame;
  233. void (*get_buffer_callback)(struct AVCodecContext *c, int width, int height, int pict_type);
  234. int has_b_frames; // is 1 if the decoded stream contains b frames
  235. int dr_uvstride;
  236. int dr_ip_buffer_count;
  237. int block_align; /* currently only for adpcm codec in wav/avi */
  238. int parse_only; /* decoding only: if true, only parsing is done
  239. (function avcodec_parse_frame()). The frame
  240. data is returned. Only MPEG codecs support this now. */
  241. //FIXME this should be reordered after kabis API is finished ...
  242. /*
  243. Note: Below are located reserved fields for further usage
  244. It requires for ABI !!!
  245. If you'll perform some changes then borrow new space from these fields
  246. (void * can be safety replaced with struct * ;)
  247. P L E A S E ! ! !
  248. IMPORTANT: Never change order of already declared fields!!!
  249. */
  250. unsigned long long int
  251. ull_res0,ull_res1,ull_res2,ull_res3,ull_res4,ull_res5,
  252. ull_res6,ull_res7,ull_res8,ull_res9,ull_res10,ull_res11,ull_res12;
  253. float
  254. flt_res0,flt_res1,flt_res2,flt_res3,flt_res4,flt_res5,
  255. flt_res6,flt_res7,flt_res8,flt_res9,flt_res10,flt_res11;
  256. void
  257. *ptr_res0,*ptr_res1,*ptr_res2,*ptr_res3,*ptr_res4,*ptr_res5,
  258. *ptr_res6;
  259. unsigned long int
  260. ul_res0,ul_res1,ul_res2,ul_res3,ul_res4,ul_res5,
  261. ul_res6,ul_res7,ul_res8,ul_res9,ul_res10,ul_res11,ul_res12;
  262. unsigned int
  263. ui_res0;
  264. unsigned short int
  265. us_res0,us_res1,us_res2,us_res3,us_res4,us_res5,
  266. us_res6,us_res7,us_res8,us_res9,us_res10,us_res11,us_res12;
  267. unsigned char
  268. uc_res0,uc_res1,uc_res2,uc_res3,uc_res4,uc_res5,
  269. uc_res6,uc_res7,uc_res8,uc_res9,uc_res10,uc_res11,uc_res12;
  270. } AVCodecContext;
  271. typedef struct AVCodec {
  272. char *name;
  273. int type;
  274. int id;
  275. int priv_data_size;
  276. int (*init)(AVCodecContext *);
  277. int (*encode)(AVCodecContext *, UINT8 *buf, int buf_size, void *data);
  278. int (*close)(AVCodecContext *);
  279. int (*decode)(AVCodecContext *, void *outdata, int *outdata_size,
  280. UINT8 *buf, int buf_size);
  281. int capabilities;
  282. struct AVCodec *next;
  283. /*
  284. Note: Below are located reserved fields for further usage
  285. It requires for ABI !!!
  286. If you'll perform some changes then borrow new space from these fields
  287. (void * can be safety replaced with struct * ;)
  288. P L E A S E ! ! !
  289. IMPORTANT: Never change order of already declared fields!!!
  290. */
  291. unsigned long long int
  292. ull_res0,ull_res1,ull_res2,ull_res3,ull_res4,ull_res5,
  293. ull_res6,ull_res7,ull_res8,ull_res9,ull_res10,ull_res11,ull_res12;
  294. float
  295. flt_res0,flt_res1,flt_res2,flt_res3,flt_res4,flt_res5,
  296. flt_res6,flt_res7,flt_res8,flt_res9,flt_res10,flt_res11,flt_res12;
  297. void
  298. *ptr_res0,*ptr_res1,*ptr_res2,*ptr_res3,*ptr_res4,*ptr_res5,
  299. *ptr_res6,*ptr_res7,*ptr_res8,*ptr_res9,*ptr_res10,*ptr_res11,*ptr_res12;
  300. } AVCodec;
  301. /* three components are given, that's all */
  302. typedef struct AVPicture {
  303. UINT8 *data[3];
  304. int linesize[3];
  305. } AVPicture;
  306. extern AVCodec ac3_encoder;
  307. extern AVCodec mp2_encoder;
  308. extern AVCodec mp3lame_encoder;
  309. extern AVCodec mpeg1video_encoder;
  310. extern AVCodec h263_encoder;
  311. extern AVCodec h263p_encoder;
  312. extern AVCodec rv10_encoder;
  313. extern AVCodec mjpeg_encoder;
  314. extern AVCodec mpeg4_encoder;
  315. extern AVCodec msmpeg4v1_encoder;
  316. extern AVCodec msmpeg4v2_encoder;
  317. extern AVCodec msmpeg4v3_encoder;
  318. extern AVCodec wmv1_encoder;
  319. extern AVCodec wmv2_encoder;
  320. extern AVCodec h263_decoder;
  321. extern AVCodec mpeg4_decoder;
  322. extern AVCodec msmpeg4v1_decoder;
  323. extern AVCodec msmpeg4v2_decoder;
  324. extern AVCodec msmpeg4v3_decoder;
  325. extern AVCodec wmv1_decoder;
  326. extern AVCodec wmv2_decoder;
  327. extern AVCodec mpeg_decoder;
  328. extern AVCodec h263i_decoder;
  329. extern AVCodec rv10_decoder;
  330. extern AVCodec svq1_decoder;
  331. extern AVCodec mjpeg_decoder;
  332. extern AVCodec mp2_decoder;
  333. extern AVCodec mp3_decoder;
  334. /* pcm codecs */
  335. #define PCM_CODEC(id, name) \
  336. extern AVCodec name ## _decoder; \
  337. extern AVCodec name ## _encoder;
  338. PCM_CODEC(CODEC_ID_PCM_S16LE, pcm_s16le);
  339. PCM_CODEC(CODEC_ID_PCM_S16BE, pcm_s16be);
  340. PCM_CODEC(CODEC_ID_PCM_U16LE, pcm_u16le);
  341. PCM_CODEC(CODEC_ID_PCM_U16BE, pcm_u16be);
  342. PCM_CODEC(CODEC_ID_PCM_S8, pcm_s8);
  343. PCM_CODEC(CODEC_ID_PCM_U8, pcm_u8);
  344. PCM_CODEC(CODEC_ID_PCM_ALAW, pcm_alaw);
  345. PCM_CODEC(CODEC_ID_PCM_MULAW, pcm_mulaw);
  346. /* adpcm codecs */
  347. PCM_CODEC(CODEC_ID_ADPCM_IMA_QT, adpcm_ima_qt);
  348. PCM_CODEC(CODEC_ID_ADPCM_IMA_WAV, adpcm_ima_wav);
  349. PCM_CODEC(CODEC_ID_ADPCM_MS, adpcm_ms);
  350. #undef PCM_CODEC
  351. /* dummy raw video codec */
  352. extern AVCodec rawvideo_codec;
  353. /* the following codecs use external GPL libs */
  354. extern AVCodec ac3_decoder;
  /* resample.c */

  /* opaque audio resampling state; only handled through pointers here */
  typedef struct ReSampleContext ReSampleContext;

  /* create a resampling context for the given channel counts and rates */
  ReSampleContext *audio_resample_init(int output_channels,
                                       int input_channels,
                                       int output_rate,
                                       int input_rate);

  /* process nb_samples samples from 'input' into 'output' using context 's' */
  int audio_resample(ReSampleContext *s,
                     short *output,
                     short *input,
                     int nb_samples);

  /* close a context obtained from audio_resample_init() */
  void audio_resample_close(ReSampleContext *s);
  362. /* YUV420 format is assumed ! */
  363. struct ImgReSampleContext;
  364. typedef struct ImgReSampleContext ImgReSampleContext;
  365. ImgReSampleContext *img_resample_init(int output_width, int output_height,
  366. int input_width, int input_height);
  367. void img_resample(ImgReSampleContext *s,
  368. AVPicture *output, AVPicture *input);
  369. void img_resample_close(ImgReSampleContext *s);
  370. void avpicture_fill(AVPicture *picture, UINT8 *ptr,
  371. int pix_fmt, int width, int height);
  372. int avpicture_get_size(int pix_fmt, int width, int height);
  373. /* convert among pixel formats */
  374. int img_convert(AVPicture *dst, int dst_pix_fmt,
  375. AVPicture *src, int pix_fmt,
  376. int width, int height);
  377. /* deinterlace a picture */
  378. int avpicture_deinterlace(AVPicture *dst, AVPicture *src,
  379. int pix_fmt, int width, int height);
  380. /* external high level API */
  381. extern AVCodec *first_avcodec;
  382. /* returns LIBAVCODEC_VERSION_INT constant */
  383. unsigned avcodec_version(void);
  384. /* returns LIBAVCODEC_BUILD constant */
  385. unsigned avcodec_build(void);
  386. void avcodec_init(void);
  387. void avcodec_set_bit_exact(void);
  388. void register_avcodec(AVCodec *format);
  389. AVCodec *avcodec_find_encoder(enum CodecID id);
  390. AVCodec *avcodec_find_encoder_by_name(const char *name);
  391. AVCodec *avcodec_find_decoder(enum CodecID id);
  392. AVCodec *avcodec_find_decoder_by_name(const char *name);
  393. void avcodec_string(char *buf, int buf_size, AVCodecContext *enc, int encode);
  394. int avcodec_open(AVCodecContext *avctx, AVCodec *codec);
  395. int avcodec_decode_audio(AVCodecContext *avctx, INT16 *samples,
  396. int *frame_size_ptr,
  397. UINT8 *buf, int buf_size);
  398. int avcodec_decode_video(AVCodecContext *avctx, AVPicture *picture,
  399. int *got_picture_ptr,
  400. UINT8 *buf, int buf_size);
  401. int avcodec_parse_frame(AVCodecContext *avctx, UINT8 **pdata,
  402. int *data_size_ptr,
  403. UINT8 *buf, int buf_size);
  404. int avcodec_encode_audio(AVCodecContext *avctx, UINT8 *buf, int buf_size,
  405. const short *samples);
  406. int avcodec_encode_video(AVCodecContext *avctx, UINT8 *buf, int buf_size,
  407. const AVPicture *pict);
  408. int avcodec_close(AVCodecContext *avctx);
  409. void avcodec_register_all(void);
  410. void avcodec_flush_buffers(AVCodecContext *avctx);
  411. #ifdef FF_POSTPROCESS
  412. extern int quant_store[MBR+1][MBC+1]; // [Review]
  413. #endif
  /**
   * Interface for the 0.5.0 version.
   *
   * Do not even think about using it for the moment.
   *
   * Result of an encode operation.
   */
  typedef struct {
      int size;        /* compressed size used from the given memory buffer */
      int frame_type;  /* I/P/B frame type */
  } avc_enc_result_t;
  /**
   * Commands.
   *
   * The order cannot be changed once it has been defined: each group
   * starts at an explicit base value and the following entries count up
   * from it.
   */
  typedef enum {
      /* general commands */
      AVC_OPEN_BY_NAME = 0xACA000,
      AVC_OPEN_BY_CODEC_ID,
      AVC_OPEN_BY_FOURCC,
      AVC_CLOSE,
      AVC_FLUSH,
      /* pin  - struct { uint8_t* src, uint_t src_size }
         pout - struct { AVPicture* img, consumed_bytes, ... } */
      AVC_DECODE,
      /* pin  - struct { AVPicture* img, uint8_t* dest, uint_t dest_size }
         pout - uint_t used_from_dest_size */
      AVC_ENCODE,

      /* query/get video commands */
      AVC_GET_VERSION = 0xACB000,
      AVC_GET_WIDTH,
      AVC_GET_HEIGHT,
      AVC_GET_DELAY,
      AVC_GET_QUANT_TABLE,
      /* ... */

      /* query/get audio commands */
      /* NOTE(review): 0xABC000 breaks the 0xACA/0xACB/0xACD/0xACE pattern
         of the other groups; it may be a typo for 0xACC000, but the value
         is kept because command values cannot be changed -- confirm */
      AVC_GET_FRAME_SIZE = 0xABC000,

      /* maybe define some simple structure which might be passed to the
         user - but it cannot contain any codec specific parts, and these
         calls are usually necessary only a few times */

      /* set video commands */
      AVC_SET_WIDTH = 0xACD000,
      AVC_SET_HEIGHT,

      /* set video encoding commands */
      AVC_SET_FRAME_RATE = 0xACD800,
      AVC_SET_QUALITY,
      AVC_SET_HURRY_UP,

      /* set audio commands */
      AVC_SET_SAMPLE_RATE = 0xACE000,
      AVC_SET_CHANNELS
  } avc_cmd_t;
  466. /**
  467. * \param handle allocated private structure by libavcodec
  468. * for initialization pass NULL - will be returned pout
  469. * user is supposed to know nothing about its structure
  470. * \param cmd type of operation to be performed
  471. * \param pint input parameter
  472. * \param pout output parameter
  473. *
  474. * \returns command status - eventually for query command it might return
  475. * integer resulting value
  476. */
  477. int avcodec(void* handle, avc_cmd_t cmd, void* pin, void* pout);
  /*
   * Memory helpers.
   */
  void *av_malloc(int size);
  void *av_mallocz(int size);
  void  av_free(void *ptr);

  /* takes the address of the pointer; use it through av_freep() below */
  void  __av_freep(void **ptr);
  /* casts its argument to void ** so the address of any pointer type can be passed */
  #define av_freep(p) __av_freep((void **)(p))
  484. #endif /* AVCODEC_H */