/*
 * MPEG4 encoder/decoder internal header.
 * Copyright (c) 2000,2001 Fabrice Bellard
 * Copyright (c) 2002-2010 Michael Niedermayer <michaelni@gmx.at>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#ifndef AVCODEC_MPEG4VIDEO_H
#define AVCODEC_MPEG4VIDEO_H

#include <stdint.h>

#include "get_bits.h"
#include "mpegvideo.h"
#include "rl.h"

// shapes
#define RECT_SHAPE       0
#define BIN_SHAPE        1
#define BIN_ONLY_SHAPE   2
#define GRAY_SHAPE       3

// *_VO_TYPE identifiers (presumably video object type codes from the
// bitstream -- confirm against the VOL header parser)
#define SIMPLE_VO_TYPE           1
#define CORE_VO_TYPE             3
#define MAIN_VO_TYPE             4
#define NBIT_VO_TYPE             5
#define ARTS_VO_TYPE            10
#define ACE_VO_TYPE             12
#define ADV_SIMPLE_VO_TYPE      17

// aspect_ratio_info
#define EXTENDED_PAR 15

//vol_sprite_usage / sprite_enable
#define STATIC_SPRITE 1
#define GMC_SPRITE 2

// marker values
#define MOTION_MARKER 0x1F001
#define DC_MARKER     0x6B001

// start codes
#define VOS_STARTCODE        0x1B0
#define USER_DATA_STARTCODE  0x1B2
#define GOP_STARTCODE        0x1B3
#define VISUAL_OBJ_STARTCODE 0x1B5
#define VOP_STARTCODE        0x1B6

/* smaller packets likely don't contain a real frame */
#define MAX_NVOP_SIZE 19

65 66
typedef struct Mpeg4DecContext {
    MpegEncContext m;
67

68
    /// number of bits to represent the fractional part of time
69
    int time_increment_bits;
70
    int shape;
71
    int vol_sprite_usage;
72
    int sprite_brightness_change;
73
    int num_sprite_warping_points;
74
    /// sprite trajectory points
75
    uint16_t sprite_traj[4][2];
76
    /// sprite shift [isChroma]
77
    int sprite_shift[2];
78

79 80
    // reversible vlc
    int rvlc;
81
    /// could this stream contain resync markers
82
    int resync_marker;
83
    /// time distance of first I -> B, used for interlaced B-frames
84
    int t_frame;
85

86
    int new_pred;
87
    int enhancement_type;
88
    int scalability;
89
    int use_intra_dc_vlc;
90

91
    /// QP above which the ac VLC should be used for intra dc
92
    int intra_dc_threshold;
93

94 95 96 97 98
    /* bug workarounds */
    int divx_version;
    int divx_build;
    int xvid_build;
    int lavc_build;
99

100
    /// flag for having shown the warning about invalid Divx B-frames
101
    int showed_packed_warning;
102 103 104
    /** does the stream contain the low_delay flag,
     *  used to work around buggy encoders. */
    int vol_control_parameters;
105 106 107
    int cplx_estimation_trash_i;
    int cplx_estimation_trash_p;
    int cplx_estimation_trash_b;
108 109
} Mpeg4DecContext;

/* dc encoding for mpeg4 */
extern const uint8_t ff_mpeg4_DCtab_lum[13][2];
extern const uint8_t ff_mpeg4_DCtab_chrom[13][2];

/* intra coefficient tables; the definitions live outside this header */
extern const uint16_t ff_mpeg4_intra_vlc[103][2];
extern const int8_t ff_mpeg4_intra_level[102];
extern const int8_t ff_mpeg4_intra_run[102];

/* run/level table objects; RLTable is declared in rl.h */
extern RLTable ff_mpeg4_rl_intra;

/* Note this is identical to the intra rvlc except that it is reordered. */
extern RLTable ff_rvlc_rl_inter;
extern RLTable ff_rvlc_rl_intra;

extern const uint16_t ff_sprite_trajectory_tab[15][2];
extern const uint8_t ff_mb_type_b_tab[4][2];

/* these matrices will be permuted for the idct */
extern const int16_t ff_mpeg4_default_intra_matrix[64];
extern const int16_t ff_mpeg4_default_non_intra_matrix[64];

extern const uint8_t ff_mpeg4_y_dc_scale_table[32];
extern const uint8_t ff_mpeg4_c_dc_scale_table[32];
extern const uint16_t ff_mpeg4_resync_prefix[8];

extern const uint8_t ff_mpeg4_dc_threshold[8];

137
void ff_mpeg4_encode_mb(MpegEncContext *s,
Diego Biurrun's avatar
Diego Biurrun committed
138
                        int16_t block[6][64],
139
                        int motion_x, int motion_y);
140
void ff_mpeg4_pred_ac(MpegEncContext *s, int16_t *block, int n,
141
                      int dir);
142
void ff_set_mpeg4_time(MpegEncContext *s);
143
void ff_mpeg4_encode_picture_header(MpegEncContext *s, int picture_number);
144

145
int ff_mpeg4_decode_picture_header(Mpeg4DecContext *ctx, GetBitContext *gb);
146 147
void ff_mpeg4_encode_video_packet_header(MpegEncContext *s);
void ff_mpeg4_clean_buffers(MpegEncContext *s);
148
void ff_mpeg4_stuffing(PutBitContext *pbc);
149 150 151
void ff_mpeg4_init_partitions(MpegEncContext *s);
void ff_mpeg4_merge_partitions(MpegEncContext *s);
void ff_clean_mpeg4_qscales(MpegEncContext *s);
152
int ff_mpeg4_decode_partitions(Mpeg4DecContext *ctx);
153
int ff_mpeg4_get_video_packet_prefix_length(MpegEncContext *s);
154
int ff_mpeg4_decode_video_packet_header(Mpeg4DecContext *ctx);
155
void ff_mpeg4_init_direct_mv(MpegEncContext *s);
156
void ff_mpeg4videodec_static_init(void);
157
int ff_mpeg4_workaround_bugs(AVCodecContext *avctx);
158
int ff_mpeg4_frame_end(AVCodecContext *avctx, const uint8_t *buf, int buf_size);
159 160 161 162 163 164

/**
 *
 * @return the mb_type
 */
int ff_mpeg4_set_direct_mv(MpegEncContext *s, int mx, int my);
165

166
extern uint8_t ff_mpeg4_static_rl_table_store[3][2][2 * MAX_RUN + MAX_LEVEL + 3];
167 168 169 170 171 172 173 174

/* 3IV1 is quite rare and checking for it slows things down a tiny bit, so
 * the check is compiled out and IS_3IV1 is the constant 0.
 * The disabled variant reads a variable named `s` at the expansion site; it
 * is parenthesized so it stays a single operand inside larger expressions. */
#if 0
#define IS_3IV1 (s->codec_tag == AV_RL32("3IV1"))
#else
#define IS_3IV1 0
#endif

/**
175
 * Predict the dc.
176 177 178 179 180
 * encoding quantized level -> quantized diff
 * decoding quantized diff -> quantized level
 * @param n block index (0-3 are luma, 4-5 are chroma)
 * @param dir_ptr pointer to an integer where the prediction direction will be stored
 */
181 182
static inline int ff_mpeg4_pred_dc(MpegEncContext *s, int n, int level,
                                   int *dir_ptr, int encoding)
183 184 185 186 187
{
    int a, b, c, wrap, pred, scale, ret;
    int16_t *dc_val;

    /* find prediction */
188
    if (n < 4)
189
        scale = s->y_dc_scale;
190
    else
191
        scale = s->c_dc_scale;
192 193
    if (IS_3IV1)
        scale = 8;
194

195
    wrap   = s->block_wrap[n];
196 197 198 199 200
    dc_val = s->dc_val[0] + s->block_index[n];

    /* B C
     * A X
     */
201 202 203 204 205 206 207 208 209 210 211
    a = dc_val[-1];
    b = dc_val[-1 - wrap];
    c = dc_val[-wrap];

    /* outside slice handling (we can't do that by memset as we need the
     * dc for error resilience) */
    if (s->first_slice_line && n != 3) {
        if (n != 2)
            b = c = 1024;
        if (n != 1 && s->mb_x == s->resync_mb_x)
            b = a = 1024;
212
    }
213 214 215
    if (s->mb_x == s->resync_mb_x && s->mb_y == s->resync_mb_y + 1) {
        if (n == 0 || n == 4 || n == 5)
            b = 1024;
216 217 218
    }

    if (abs(a - b) < abs(b - c)) {
219
        pred     = c;
220 221
        *dir_ptr = 1; /* top */
    } else {
222
        pred     = a;
223 224 225 226 227
        *dir_ptr = 0; /* left */
    }
    /* we assume pred is positive */
    pred = FASTDIV((pred + (scale >> 1)), scale);

228
    if (encoding) {
229
        ret = level - pred;
230
    } else {
231
        level += pred;
232
        ret    = level;
233 234 235 236
    }
    level *= scale;
    if (level & (~2047)) {
        if (!s->encoding && (s->avctx->err_recognition & (AV_EF_BITSTREAM | AV_EF_AGGRESSIVE))) {
237 238 239
            if (level < 0) {
                av_log(s->avctx, AV_LOG_ERROR,
                       "dc<0 at %dx%d\n", s->mb_x, s->mb_y);
240 241
                return -1;
            }
242
            if (level > 2048 + scale) {
243 244
                av_log(s->avctx, AV_LOG_ERROR,
                       "dc overflow at %dx%d\n", s->mb_x, s->mb_y);
245 246 247
                return -1;
            }
        }
248 249 250 251
        if (level < 0)
            level = 0;
        else if (!(s->workaround_bugs & FF_BUG_DC_CLIP))
            level = 2047;
252
    }
253
    dc_val[0] = level;
254 255 256

    return ret;
}
257

#endif /* AVCODEC_MPEG4VIDEO_H */