/*
 * MPEG-4 encoder/decoder internal header.
 * Copyright (c) 2000,2001 Fabrice Bellard
 * Copyright (c) 2002-2010 Michael Niedermayer <michaelni@gmx.at>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#ifndef AVCODEC_MPEG4VIDEO_H
#define AVCODEC_MPEG4VIDEO_H

26
#include <stdint.h>
27

28 29 30 31
#include "get_bits.h"
#include "mpegvideo.h"
#include "rl.h"

32 33 34 35 36 37
// shape codes
// NOTE(review): presumably the values held in Mpeg4DecContext.shape -- confirm against the header parser
#define RECT_SHAPE       0
#define BIN_SHAPE        1
#define BIN_ONLY_SHAPE   2
#define GRAY_SHAPE       3

38 39 40 41 42 43
// video object type codes
// NOTE(review): numbering presumably follows the MPEG-4 Visual object type table -- confirm
#define SIMPLE_VO_TYPE           1
#define CORE_VO_TYPE             3
#define MAIN_VO_TYPE             4
#define NBIT_VO_TYPE             5
#define ARTS_VO_TYPE            10
#define ACE_VO_TYPE             12
44 45
// video object type codes of the studio variants (going by the macro names)
#define SIMPLE_STUDIO_VO_TYPE   14
#define CORE_STUDIO_VO_TYPE     15
46
// video object type code of the advanced simple variant (going by the macro name)
#define ADV_SIMPLE_VO_TYPE      17
47

48 49 50
// object type ids for video and still texture
// NOTE(review): "VOT" presumably abbreviates "visual object type" -- confirm
#define VOT_VIDEO_ID 1
#define VOT_STILL_TEXTURE_ID 2

51 52 53 54 55 56 57 58 59 60 61 62 63 64 65
// aspect_ratio_info value
// NOTE(review): presumably marks an explicitly coded pixel aspect ratio -- confirm against the header parser
#define EXTENDED_PAR 15

// values of vol_sprite_usage / sprite_enable
#define STATIC_SPRITE 1
#define GMC_SPRITE 2

// marker bit patterns
// NOTE(review): presumably the separators used by data partitioning -- confirm at the use sites
#define MOTION_MARKER 0x1F001
#define DC_MARKER     0x6B001

// start code values
#define VOS_STARTCODE        0x1B0
#define USER_DATA_STARTCODE  0x1B2
#define GOP_STARTCODE        0x1B3
#define VISUAL_OBJ_STARTCODE 0x1B5
#define VOP_STARTCODE        0x1B6
66 67 68 69
// slice and extension start code values
#define SLICE_STARTCODE      0x1B7
#define EXT_STARTCODE        0x1B8

// extension id
// NOTE(review): presumably identifies a quantization matrix extension following EXT_STARTCODE -- confirm
#define QUANT_MATRIX_EXT_ID  0x3
70

71 72 73
/* Size threshold: smaller packets likely don't contain a real frame.
 * NOTE(review): the unit is presumably bytes -- confirm at the use site. */
#define MAX_NVOP_SIZE 19

74 75
typedef struct Mpeg4DecContext {
    MpegEncContext m;
76

77
    /// number of bits to represent the fractional part of time
78
    int time_increment_bits;
79
    int shape;
80
    int vol_sprite_usage;
81
    int sprite_brightness_change;
82
    int num_sprite_warping_points;
83
    /// sprite trajectory points
84
    uint16_t sprite_traj[4][2];
85
    /// sprite shift [isChroma]
86
    int sprite_shift[2];
87

88 89
    // reversible vlc
    int rvlc;
90
    /// could this stream contain resync markers
91
    int resync_marker;
92
    /// time distance of first I -> B, used for interlaced B-frames
93
    int t_frame;
94

95
    int new_pred;
96
    int enhancement_type;
97
    int scalability;
98
    int use_intra_dc_vlc;
99

100
    /// QP above which the ac VLC should be used for intra dc
101
    int intra_dc_threshold;
102

103 104 105 106 107
    /* bug workarounds */
    int divx_version;
    int divx_build;
    int xvid_build;
    int lavc_build;
108

109
    /// flag for having shown the warning about invalid Divx B-frames
110
    int showed_packed_warning;
111 112 113
    /** does the stream contain the low_delay flag,
     *  used to work around buggy encoders. */
    int vol_control_parameters;
114 115 116
    int cplx_estimation_trash_i;
    int cplx_estimation_trash_p;
    int cplx_estimation_trash_b;
117 118 119 120 121 122

    VLC studio_intra_tab[12];
    VLC studio_luma_dc;
    VLC studio_chroma_dc;

    int rgb;
123 124
} Mpeg4DecContext;

125 126
/* Block counts for indices 0..3.
 * NOTE(review): presumably blocks per macroblock, indexed by chroma format -- confirm with the users of this table. */
static const uint8_t mpeg4_block_count[4] = {
    [0] = 0,
    [1] = 6,
    [2] = 8,
    [3] = 12,
};

127
/* DC encoding tables for MPEG-4 */
extern const uint8_t ff_mpeg4_DCtab_lum[13][2];
extern const uint8_t ff_mpeg4_DCtab_chrom[13][2];

/* intra VLC / level / run tables and the run-level table declared with them */
extern const uint16_t ff_mpeg4_intra_vlc[103][2];
extern const int8_t   ff_mpeg4_intra_level[102];
extern const int8_t   ff_mpeg4_intra_run[102];

extern RLTable ff_mpeg4_rl_intra;

/* Note this is identical to the intra rvlc except that it is reordered. */
extern RLTable ff_rvlc_rl_inter;
extern RLTable ff_rvlc_rl_intra;

extern const uint16_t ff_sprite_trajectory_tab[15][2];
extern const uint8_t  ff_mb_type_b_tab[4][2];

/* these matrices will be permuted for the idct */
extern const int16_t ff_mpeg4_default_intra_matrix[64];
extern const int16_t ff_mpeg4_default_non_intra_matrix[64];

extern const uint8_t  ff_mpeg4_y_dc_scale_table[32];
extern const uint8_t  ff_mpeg4_c_dc_scale_table[32];
extern const uint16_t ff_mpeg4_resync_prefix[8];

extern const uint8_t ff_mpeg4_dc_threshold[8];

/* studio tables */
extern const uint16_t ff_mpeg4_studio_dc_luma[19][2];
extern const uint16_t ff_mpeg4_studio_dc_chroma[19][2];
extern const uint16_t ff_mpeg4_studio_intra[12][22][2];

158
void ff_mpeg4_encode_mb(MpegEncContext *s,
Diego Biurrun's avatar
Diego Biurrun committed
159
                        int16_t block[6][64],
160
                        int motion_x, int motion_y);
161
void ff_mpeg4_pred_ac(MpegEncContext *s, int16_t *block, int n,
162
                      int dir);
163
void ff_set_mpeg4_time(MpegEncContext *s);
164
int ff_mpeg4_encode_picture_header(MpegEncContext *s, int picture_number);
165

166
int ff_mpeg4_decode_picture_header(Mpeg4DecContext *ctx, GetBitContext *gb, int header);
167 168
void ff_mpeg4_encode_video_packet_header(MpegEncContext *s);
void ff_mpeg4_clean_buffers(MpegEncContext *s);
169
void ff_mpeg4_stuffing(PutBitContext *pbc);
170 171 172
void ff_mpeg4_init_partitions(MpegEncContext *s);
void ff_mpeg4_merge_partitions(MpegEncContext *s);
void ff_clean_mpeg4_qscales(MpegEncContext *s);
173
int ff_mpeg4_decode_partitions(Mpeg4DecContext *ctx);
174
int ff_mpeg4_get_video_packet_prefix_length(MpegEncContext *s);
175
int ff_mpeg4_decode_video_packet_header(Mpeg4DecContext *ctx);
176
int ff_mpeg4_decode_studio_slice_header(Mpeg4DecContext *ctx);
177
void ff_mpeg4_init_direct_mv(MpegEncContext *s);
178
void ff_mpeg4videodec_static_init(void);
179
int ff_mpeg4_workaround_bugs(AVCodecContext *avctx);
180
int ff_mpeg4_frame_end(AVCodecContext *avctx, const uint8_t *buf, int buf_size);
181 182 183 184 185

/**
 * @return the mb_type
 */
int ff_mpeg4_set_direct_mv(MpegEncContext *s, int mx, int my);
186

187
/* Byte array declared here and defined elsewhere; each of its 3 x 2 rows
 * holds 2 * MAX_RUN + MAX_LEVEL + 3 bytes.
 * NOTE(review): presumably backing storage for the static RLTable data -- confirm at the init site. */
extern uint8_t ff_mpeg4_static_rl_table_store[3][2][2 * MAX_RUN + MAX_LEVEL + 3];
188 189 190 191 192 193 194 195

/*
 * IS_3IV1: compile-time switch for the "3IV1" codec tag check.
 *
 * The check is disabled by default, so IS_3IV1 is the constant 0. When the
 * first branch is enabled the macro reads a variable named `s` that must be
 * in scope where it is used. Its expansion is parenthesized so that it stays
 * a single operand under operators such as `!` or `&&`.
 */
#if 0 //3IV1 is quite rare and it slows things down a tiny bit
#define IS_3IV1 (s->codec_tag == AV_RL32("3IV1"))
#else
#define IS_3IV1 0
#endif

/**
196
 * Predict the dc.
197 198 199 200 201
 * encoding quantized level -> quantized diff
 * decoding quantized diff -> quantized level
 * @param n block index (0-3 are luma, 4-5 are chroma)
 * @param dir_ptr pointer to an integer where the prediction direction will be stored
 */
202 203
static inline int ff_mpeg4_pred_dc(MpegEncContext *s, int n, int level,
                                   int *dir_ptr, int encoding)
204 205 206 207 208
{
    int a, b, c, wrap, pred, scale, ret;
    int16_t *dc_val;

    /* find prediction */
209
    if (n < 4)
210
        scale = s->y_dc_scale;
211
    else
212
        scale = s->c_dc_scale;
213 214
    if (IS_3IV1)
        scale = 8;
215

216
    wrap   = s->block_wrap[n];
217 218 219 220 221
    dc_val = s->dc_val[0] + s->block_index[n];

    /* B C
     * A X
     */
222 223 224 225 226 227 228 229 230 231 232
    a = dc_val[-1];
    b = dc_val[-1 - wrap];
    c = dc_val[-wrap];

    /* outside slice handling (we can't do that by memset as we need the
     * dc for error resilience) */
    if (s->first_slice_line && n != 3) {
        if (n != 2)
            b = c = 1024;
        if (n != 1 && s->mb_x == s->resync_mb_x)
            b = a = 1024;
233
    }
234 235 236
    if (s->mb_x == s->resync_mb_x && s->mb_y == s->resync_mb_y + 1) {
        if (n == 0 || n == 4 || n == 5)
            b = 1024;
237 238 239
    }

    if (abs(a - b) < abs(b - c)) {
240
        pred     = c;
241 242
        *dir_ptr = 1; /* top */
    } else {
243
        pred     = a;
244 245 246 247 248
        *dir_ptr = 0; /* left */
    }
    /* we assume pred is positive */
    pred = FASTDIV((pred + (scale >> 1)), scale);

249
    if (encoding) {
250
        ret = level - pred;
251
    } else {
252
        level += pred;
253
        ret    = level;
254 255 256 257
    }
    level *= scale;
    if (level & (~2047)) {
        if (!s->encoding && (s->avctx->err_recognition & (AV_EF_BITSTREAM | AV_EF_AGGRESSIVE))) {
258 259 260
            if (level < 0) {
                av_log(s->avctx, AV_LOG_ERROR,
                       "dc<0 at %dx%d\n", s->mb_x, s->mb_y);
261
                return AVERROR_INVALIDDATA;
262
            }
263
            if (level > 2048 + scale) {
264 265
                av_log(s->avctx, AV_LOG_ERROR,
                       "dc overflow at %dx%d\n", s->mb_x, s->mb_y);
266
                return AVERROR_INVALIDDATA;
267 268
            }
        }
269 270 271 272
        if (level < 0)
            level = 0;
        else if (!(s->workaround_bugs & FF_BUG_DC_CLIP))
            level = 2047;
273
    }
274
    dc_val[0] = level;
275 276 277

    return ret;
}
278

279
#endif /* AVCODEC_MPEG4VIDEO_H */