avcodec.h 10.6 KB
Newer Older
glantau's avatar
glantau committed
1 2 3
#ifndef AVCODEC_H
#define AVCODEC_H

glantau's avatar
glantau committed
4 5
#include "common.h"

6 7 8 9 10
/* Library version, exposed in several forms: a packed hexadecimal integer
   (0x000406 corresponds to the "0.4.6" string), the dotted version string,
   and a build number together with its string spelling. The four values
   must be kept in sync by hand. */
#define LIBAVCODEC_VERSION_INT 0x000406
#define LIBAVCODEC_VERSION     "0.4.6"
#define LIBAVCODEC_BUILD       4600
#define LIBAVCODEC_BUILD_STR   "4600"

glantau's avatar
glantau committed
11 12 13 14 15 16
/* Identifies a codec. Enumerators are numbered implicitly, starting at 0
   for CODEC_ID_NONE, so inserting or reordering entries renumbers every
   identifier that follows. */
enum CodecID {
    CODEC_ID_NONE,
    CODEC_ID_MPEG1VIDEO,
    CODEC_ID_H263,
    CODEC_ID_RV10,
    CODEC_ID_MP2,
    CODEC_ID_MP3LAME,
    CODEC_ID_AC3,
    CODEC_ID_MJPEG,
    CODEC_ID_MPEG4,
    CODEC_ID_RAWVIDEO,
    CODEC_ID_MSMPEG4V1,
    CODEC_ID_MSMPEG4V2,
    CODEC_ID_MSMPEG4V3,
    CODEC_ID_WMV1,
    CODEC_ID_H263P,
    CODEC_ID_H263I,

    /* various pcm "codecs" */
    CODEC_ID_PCM_S16LE,
    CODEC_ID_PCM_S16BE,
    CODEC_ID_PCM_U16LE,
    CODEC_ID_PCM_U16BE,
    CODEC_ID_PCM_S8,
    CODEC_ID_PCM_U8,
    CODEC_ID_PCM_MULAW,
    CODEC_ID_PCM_ALAW,
};

/* CODEC_ID_MSMPEG4 is an alias for the V3 variant. */
#define CODEC_ID_MSMPEG4 CODEC_ID_MSMPEG4V3
glantau's avatar
glantau committed
40 41 42 43 44 45 46

/* Media class of a codec: video is 0, audio is 1. */
enum CodecType {
    CODEC_TYPE_VIDEO = 0,
    CODEC_TYPE_AUDIO = 1
};

/* Pixel formats. PIX_FMT_ANY is the only negative value (-1); the concrete
   formats are numbered implicitly from 0 in declaration order, so new
   formats must be appended to keep existing values stable. */
enum PixelFormat {
    PIX_FMT_ANY = -1,
    PIX_FMT_YUV420P,
    PIX_FMT_YUV422,
    PIX_FMT_RGB24,
    PIX_FMT_BGR24,
    PIX_FMT_YUV422P,
    PIX_FMT_YUV444P,
};

glantau's avatar
glantau committed
56 57 58 59 60
/* Audio sample format. Currently unused; may be used if 24/32-bit samples
   are ever supported. */
enum SampleFormat {
    SAMPLE_FMT_S16 = 0,         /* signed 16-bit samples */
};

glantau's avatar
glantau committed
61 62 63
/* Maximum audio frame size, in bytes. */
#define AVCODEC_MAX_AUDIO_FRAME_SIZE 18432

64 65
/* Motion estimation type, EPZS by default.
   Numbering starts at 1 (ME_ZERO) and increases by one per entry, so
   0 is not a valid Motion_Est_ID. */
enum Motion_Est_ID {
    ME_ZERO = 1,
    ME_FULL,
    ME_LOG,
    ME_PHODS,
    ME_EPZS,
    ME_X1
};

74 75 76
/* Only kept for ME compatibility with old apps. */
extern int motion_estimation_method;

77
/* ME algos sorted by quality. The entries are enum Motion_Est_ID values,
   i.e. in table order: ME_ZERO (1), ME_PHODS (4), ME_LOG (3), ME_X1 (6),
   ME_EPZS (5), ME_FULL (2). */
static const int Motion_Est_QTab[] = { 1, 4, 3, 6, 5, 2 };
glantau's avatar
glantau committed
79

80 81
/* Maximum number of B-frames (presumably the upper bound for
   AVCodecContext.max_b_frames -- confirm against the encoder). */
#define FF_MAX_B_FRAMES 4

glantau's avatar
glantau committed
82
/* encoding support */
/* note: not everything is supported yet */

/* Each flag is a distinct bit so that several can be OR-ed together
   (presumably into AVCodecContext.flags -- confirm against the callers). */
#define CODEC_FLAG_HQ     0x0001 /* high quality (non real time) encoding */
#define CODEC_FLAG_QSCALE 0x0002 /* use fixed qscale */
#define CODEC_FLAG_4MV    0x0004 /* 4 MV per MB allowed */
#define CODEC_FLAG_QPEL   0x0010 /* use qpel MC */
#define CODEC_FLAG_GMC    0x0020 /* use GMC */
#define CODEC_FLAG_TYPE   0x0040 /* fixed I/P frame type, from avctx->key_frame */
/* The parent program guarantees that the input for streams containing
   B-frames is not written to for at least s->max_b_frames+1 frames; if this
   flag is not set, then the input will be copied. */
#define CODEC_FLAG_INPUT_PRESERVED 0x0100
glantau's avatar
glantau committed
94

glantau's avatar
glantau committed
95 96 97 98 99
/* codec capabilities (bit flags; presumably stored in AVCodec.capabilities
   -- confirm) */

/* decoder can use the draw_horiz_band callback */
#define CODEC_CAP_DRAW_HORIZ_BAND 0x0001

glantau's avatar
glantau committed
100 101 102 103
#define FRAME_RATE_BASE 10000

typedef struct AVCodecContext {
    int bit_rate;
104
    int bit_rate_tolerance; /* amount of +- bits (>0)*/
glantau's avatar
glantau committed
105 106 107
    int flags;
    int sub_id;    /* some codecs needs additionnal format info. It is
                      stored there */
108 109 110
    
    int me_method; /* ME algorithm used for video coding */
    
glantau's avatar
glantau committed
111 112 113
    /* video only */
    int frame_rate; /* frames per sec multiplied by FRAME_RATE_BASE */
    int width, height;
114
    int aspect_ratio_info;
michaelni's avatar
michaelni committed
115 116 117 118 119
#define FF_ASPECT_SQUARE 1
#define FF_ASPECT_4_3_625 2
#define FF_ASPECT_4_3_525 3
#define FF_ASPECT_16_9_625 4
#define FF_ASPECT_16_9_525 5
glantau's avatar
glantau committed
120
    int gop_size; /* 0 = intra only */
121
    enum PixelFormat pix_fmt;  /* pixel format, see PIX_FMT_xxx */
glantau's avatar
glantau committed
122 123 124 125 126 127 128 129 130

    /* if non NULL, 'draw_horiz_band' is called by the libavcodec
       decoder to draw an horizontal band. It improve cache usage. Not
       all codecs can do that. You must check the codec capabilities
       before */
    void (*draw_horiz_band)(struct AVCodecContext *s,
                            UINT8 **src_ptr, int linesize,
                            int y, int width, int height);

glantau's avatar
glantau committed
131 132 133
    /* audio only */
    int sample_rate; /* samples per sec */
    int channels;
glantau's avatar
glantau committed
134
    int sample_fmt;  /* sample format, currenly unused */
glantau's avatar
glantau committed
135 136 137 138 139 140 141 142

    /* the following data should not be initialized */
    int frame_size; /* in samples, initialized when calling 'init' */
    int frame_number; /* audio or video frame number */
    int key_frame;    /* true if the previous compressed frame was 
                         a key frame (intra, or seekable) */
    int quality;      /* quality of the previous encoded frame 
                         (between 1 (good) and 31 (bad)) */
143 144 145 146 147
    float qcompress;  /* amount of qscale change between easy & hard scenes (0.0-1.0)*/
    float qblur;      /* amount of qscale smoothing over time (0.0-1.0) */
    int qmin;         /* min qscale */
    int qmax;         /* max qscale */
    int max_qdiff;    /* max qscale difference between frames */
148 149
    int max_b_frames; /* maximum b frames, the output will be delayed by max_b_frames+1 relative to the input */

glantau's avatar
glantau committed
150 151 152
    struct AVCodec *codec;
    void *priv_data;

153 154 155 156 157 158 159 160 161 162 163 164
    /* The following data is for RTP friendly coding */
    /* By now only H.263/H.263+ coder honours this   */
    int rtp_mode;   /* 1 for activate RTP friendly-mode           */
                    /* highers numbers represent more error-prone */
                    /* enviroments, by now just "1" exist         */
    
    int rtp_payload_size;   /* The size of the RTP payload, the coder will  */
                            /* do it's best to deliver a chunk with size    */
                            /* below rtp_payload_size, the chunk will start */
                            /* with a start code on some codecs like H.263  */
                            /* This doesn't take account of any particular  */
                            /* headers inside the transmited RTP payload    */
165 166 167 168 169 170 171 172

    
    /* The RTP callcack: This function is called  */
    /* every time the encoder as a packet to send */
    /* Depends on the encoder if the data starts  */
    /* with a Start Code (it should) H.263 does   */
    void (*rtp_callback)(void *data, int size, int packet_number); 

173 174 175 176 177 178
    /* These are for PSNR calculation, if you set get_psnr to 1 */
    /* after encoding you will have the PSNR on psnr_y/cb/cr    */
    int get_psnr;
    float psnr_y;
    float psnr_cb;
    float psnr_cr;
michaelni's avatar
michaelni committed
179 180 181 182 183 184 185 186 187 188 189
    
    /* statistics, used for 2-pass encoding */
    int mv_bits;
    int header_bits;
    int i_tex_bits;
    int p_tex_bits;
    int i_count;
    int p_count;
    int skip_count;
    int misc_bits; // cbp, mb_type
    int frame_bits;
190
                 
glantau's avatar
glantau committed
191
    /* the following fields are ignored */
glantau's avatar
glantau committed
192
    void *opaque;   /* can be used to carry app specific stuff */
glantau's avatar
glantau committed
193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208
    char codec_name[32];
    int codec_type; /* see CODEC_TYPE_xxx */
    int codec_id; /* see CODEC_ID_xxx */
    unsigned int codec_tag;  /* codec tag, only used if unknown codec */
} AVCodecContext;

/* Describes one codec implementation: identity, per-instance private data
   size and the entry points operating on an AVCodecContext. */
typedef struct AVCodec {
    char *name;
    int type;            /* presumably a CODEC_TYPE_xxx value -- confirm */
    int id;              /* presumably a CODEC_ID_xxx value -- confirm */
    int priv_data_size;  /* presumably the size in bytes of the block behind
                            AVCodecContext.priv_data -- confirm */
    int (*init)(AVCodecContext *);
    int (*encode)(AVCodecContext *, UINT8 *buf, int buf_size, void *data);
    int (*close)(AVCodecContext *);
    int (*decode)(AVCodecContext *, void *outdata, int *outdata_size,
                  UINT8 *buf, int buf_size);
    int capabilities;    /* see CODEC_CAP_xxx */
    struct AVCodec *next; /* link to another AVCodec (presumably the
                             registration list headed by first_avcodec) */
} AVCodec;

/* A picture described by exactly three components: data[i] points to
   component i and linesize[i] is its line size (presumably the stride in
   bytes between consecutive rows -- confirm). Three components are given,
   that's all. */
typedef struct AVPicture {
    UINT8 *data[3];
    int linesize[3];
} AVPicture;

/* encoders */
extern AVCodec ac3_encoder;
extern AVCodec mp2_encoder;
extern AVCodec mp3lame_encoder;
extern AVCodec mpeg1video_encoder;
extern AVCodec h263_encoder;
extern AVCodec h263p_encoder;
extern AVCodec rv10_encoder;
extern AVCodec mjpeg_encoder;
extern AVCodec mpeg4_encoder;
extern AVCodec msmpeg4v1_encoder;
extern AVCodec msmpeg4v2_encoder;
extern AVCodec msmpeg4v3_encoder;

/* decoders */
extern AVCodec h263_decoder;
extern AVCodec mpeg4_decoder;
extern AVCodec msmpeg4v1_decoder;
extern AVCodec msmpeg4v2_decoder;
extern AVCodec msmpeg4v3_decoder;
extern AVCodec wmv1_decoder;
extern AVCodec mpeg_decoder;
extern AVCodec h263i_decoder;
extern AVCodec rv10_decoder;
extern AVCodec mjpeg_decoder;
extern AVCodec mp2_decoder;
extern AVCodec mp3_decoder;
glantau's avatar
glantau committed
244

glantau's avatar
glantau committed
245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261
/* pcm codecs */

/* Declares the <name>_decoder / <name>_encoder pair for one PCM variant.
   'id' is not used by the expansion. The expansion intentionally does not
   end in ';': the ';' written after each invocation terminates the second
   declaration, so no stray empty declaration is left at file scope (ISO C
   does not allow one). */
#define PCM_CODEC(id, name) \
extern AVCodec name ## _decoder; \
extern AVCodec name ## _encoder

PCM_CODEC(CODEC_ID_PCM_S16LE, pcm_s16le);
PCM_CODEC(CODEC_ID_PCM_S16BE, pcm_s16be);
PCM_CODEC(CODEC_ID_PCM_U16LE, pcm_u16le);
PCM_CODEC(CODEC_ID_PCM_U16BE, pcm_u16be);
PCM_CODEC(CODEC_ID_PCM_S8, pcm_s8);
PCM_CODEC(CODEC_ID_PCM_U8, pcm_u8);
PCM_CODEC(CODEC_ID_PCM_ALAW, pcm_alaw);
PCM_CODEC(CODEC_ID_PCM_MULAW, pcm_mulaw);

/* The helper is only needed for the declarations above. */
#undef PCM_CODEC

/* dummy raw video codec */
extern AVCodec rawvideo_codec;

/* the following codecs use external GPL libs */
extern AVCodec ac3_decoder;

/* resample.c */

/* Audio resampling state. Only forward-declared here, so it is opaque to
   users of this header. */
struct ReSampleContext;

typedef struct ReSampleContext ReSampleContext;

/* Creates a resampling context for the given output/input channel counts
   and output/input sample rates. What is returned on failure is not
   visible from this header. */
ReSampleContext *audio_resample_init(int output_channels, int input_channels, 
                                     int output_rate, int input_rate);
/* Resamples nb_samples samples from 'input' into 'output' using context 's'.
   NOTE(review): the meaning of the int result (presumably the number of
   samples produced) and the required size of 'output' are not stated here
   -- confirm in resample.c. */
int audio_resample(ReSampleContext *s, short *output, short *input, int nb_samples);
/* Releases a context obtained from audio_resample_init(). */
void audio_resample_close(ReSampleContext *s);

/* Image resampling. YUV420 format is assumed! */

/* Image resampling state. Only forward-declared here, so it is opaque to
   users of this header. */
struct ImgReSampleContext;

typedef struct ImgReSampleContext ImgReSampleContext;

/* Creates a resampling context converting pictures of input_width x
   input_height to output_width x output_height. What is returned on
   failure is not visible from this header. */
ImgReSampleContext *img_resample_init(int output_width, int output_height,
                                      int input_width, int input_height);
/* Resamples 'input' into 'output' using context 's'. */
void img_resample(ImgReSampleContext *s, 
                  AVPicture *output, AVPicture *input);

/* Releases a context obtained from img_resample_init(). */
void img_resample_close(ImgReSampleContext *s);

291 292 293 294 295 296 297 298 299 300 301
/* Sets up 'picture' from the buffer 'ptr' for the given pixel format and
   dimensions. NOTE(review): presumably only fills the data/linesize fields
   to point into 'ptr' without copying -- confirm in the implementation. */
void avpicture_fill(AVPicture *picture, UINT8 *ptr,
                    int pix_fmt, int width, int height);
/* Returns a size for a picture of the given pixel format and dimensions
   (presumably in bytes -- confirm). */
int avpicture_get_size(int pix_fmt, int width, int height);

/* convert among pixel formats: 'src' (format pix_fmt) is converted into
   'dst' (format dst_pix_fmt); both share the same width and height. The
   meaning of the int result is not stated in this header. */
int img_convert(AVPicture *dst, int dst_pix_fmt,
                AVPicture *src, int pix_fmt, 
                int width, int height);

/* Deinterlace a picture: 'src' is deinterlaced into 'dst'; both use the
   pixel format pix_fmt and the given width and height. The meaning of the
   int result is not stated in this header. */
int avpicture_deinterlace(AVPicture *dst, AVPicture *src,
                          int pix_fmt, int width, int height);

/* external high level API */

/* Pointer to an AVCodec; presumably the head of the list of registered
   codecs chained through AVCodec.next -- confirm. */
extern AVCodec *first_avcodec;

/* Library initialization entry point. */
void avcodec_init(void);

/* Registers one codec with the library. */
void register_avcodec(AVCodec *format);

/* Codec lookup, by CodecID or by name. What is returned when nothing
   matches is not stated in this header (presumably NULL -- confirm). */
AVCodec *avcodec_find_encoder(enum CodecID id);
AVCodec *avcodec_find_encoder_by_name(const char *name);
AVCodec *avcodec_find_decoder(enum CodecID id);
AVCodec *avcodec_find_decoder_by_name(const char *name);

/* Writes a textual description of 'enc' into 'buf', which holds buf_size
   bytes. 'encode' presumably selects encoder vs. decoder wording --
   confirm. */
void avcodec_string(char *buf, int buf_size, AVCodecContext *enc, int encode);

/* Opens 'codec' on the context 'avctx'. */
int avcodec_open(AVCodecContext *avctx, AVCodec *codec);

/* Decoding: the compressed input is buf/buf_size. The decoded result goes
   to 'samples' or 'picture', and *frame_size_ptr / *got_picture_ptr is an
   output describing that result. The meaning of the int result is not
   stated in this header. */
int avcodec_decode_audio(AVCodecContext *avctx, INT16 *samples,
                         int *frame_size_ptr,
                         UINT8 *buf, int buf_size);
int avcodec_decode_video(AVCodecContext *avctx, AVPicture *picture,
                         int *got_picture_ptr,
                         UINT8 *buf, int buf_size);

/* Encoding: the raw input is 'samples' or 'pict' (not modified, as the
   const qualifier shows); the compressed output is written to buf, which
   holds buf_size bytes. The meaning of the int result is not stated in
   this header. */
int avcodec_encode_audio(AVCodecContext *avctx, UINT8 *buf, int buf_size,
                         const short *samples);
int avcodec_encode_video(AVCodecContext *avctx, UINT8 *buf, int buf_size,
                         const AVPicture *pict);

/* Closes a context opened with avcodec_open(). */
int avcodec_close(AVCodecContext *avctx);

/* Registers the codecs built into the library (per the function name). */
void avcodec_register_all(void);
glantau's avatar
glantau committed
332

333 334
/* Post-processing support: only declared when FF_POSTPROCESS is defined. */
#ifdef FF_POSTPROCESS
/* Default dimensions, used unless the including code already defined MBC.
   NOTE(review): MBR is only defined together with MBC here, so predefining
   MBC without MBR leaves MBR undefined for the declaration below. */
#ifndef MBC
#define MBC 128
#define MBR 96
#endif
extern int quant_store[MBR+1][MBC+1]; // [Review]
#endif

glantau's avatar
glantau committed
341
#endif /* AVCODEC_H */