mpeg4videoenc.c 50.1 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22
/*
 * MPEG4 encoder.
 * Copyright (c) 2000,2001 Fabrice Bellard
 * Copyright (c) 2002-2010 Michael Niedermayer <michaelni@gmx.at>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

23
#include "libavutil/attributes.h"
24 25
#include "libavutil/log.h"
#include "libavutil/opt.h"
26
#include "mpegutils.h"
27 28 29 30
#include "mpegvideo.h"
#include "h263.h"
#include "mpeg4video.h"

31 32 33 34 35
/* The uni_DCtab_* tables below contain unified bits+length tables to encode DC
 * differences in mpeg4. Unified in the sense that the specification specifies
 * this encoding in several steps.
 * The tables are indexed by (DC difference + 256); a *_len entry is the number
 * of bits handed to put_bits() for that difference. */
static uint8_t  uni_DCtab_lum_len[512];
static uint8_t  uni_DCtab_chrom_len[512];
36 37 38
/* Code values written for a DC difference, indexed by (DC difference + 256)
 * exactly like the uni_DCtab_*_len tables they are paired with. */
static uint16_t uni_DCtab_lum_bits[512];
static uint16_t uni_DCtab_chrom_bits[512];

39 40 41 42 43 44
/* Unified encoding tables for run length encoding of coefficients.
 * Unified in the sense that the specification specifies the encoding in several steps.
 * Entries are addressed with UNI_MPEG4_ENC_INDEX(last, run, level + 64); the
 * *_bits tables hold the code value and the *_len tables its length in bits.
 * Separate tables exist for intra and inter blocks. */
static uint32_t uni_mpeg4_intra_rl_bits[64 * 64 * 2 * 2];
static uint8_t  uni_mpeg4_intra_rl_len[64 * 64 * 2 * 2];
static uint32_t uni_mpeg4_inter_rl_bits[64 * 64 * 2 * 2];
static uint8_t  uni_mpeg4_inter_rl_len[64 * 64 * 2 * 2];
45

46 47 48
/* Index into the uni_mpeg4_*_rl_* tables.
 * Layout: level in the low 7 bits (callers pass the level biased by +64, so
 * 0..127), run in the next 6 bits (0..63), last (0 or 1) above that. The
 * largest index is therefore 2 * 64 * 128 - 1, matching the table size.
 * The two commented-out definitions are alternative layouts. */
//#define UNI_MPEG4_ENC_INDEX(last, run, level) ((last) * 128 + (run) * 256 + (level))
//#define UNI_MPEG4_ENC_INDEX(last, run, level) ((last) * 128 * 64 + (run) + (level) * 64)
#define UNI_MPEG4_ENC_INDEX(last, run, level) ((last) * 128 * 64 + (run) * 128 + (level))
49

50 51 52 53 54 55 56 57 58
/* mpeg4
 * inter
 * max level: 24/6
 * max run: 53/63
 *
 * intra
 * max level: 53/16
 * max run: 29/41
 */
59 60

/**
61
 * Return the number of bits that encoding the 8x8 block in block would need.
62 63
 * @param[in]  block_last_index last index in scantable order that refers to a non zero element in block.
 */
64 65 66 67
static inline int get_block_rate(MpegEncContext *s, int16_t block[64],
                                 int block_last_index, uint8_t scantable[64])
{
    int last = 0;
68
    int j;
69 70 71 72 73 74 75 76 77 78 79 80 81
    int rate = 0;

    for (j = 1; j <= block_last_index; j++) {
        const int index = scantable[j];
        int level = block[index];
        if (level) {
            level += 64;
            if ((level & (~127)) == 0) {
                if (j < block_last_index)
                    rate += s->intra_ac_vlc_length[UNI_AC_ENC_INDEX(j - last - 1, level)];
                else
                    rate += s->intra_ac_vlc_last_length[UNI_AC_ENC_INDEX(j - last - 1, level)];
            } else
82 83
                rate += s->ac_esc_length;

84
            last = j;
85 86 87 88 89 90 91
        }
    }

    return rate;
}

/**
92
 * Restore the ac coefficients in block that have been changed by decide_ac_pred().
93 94 95 96
 * This function also restores s->block_last_index.
 * @param[in,out] block MB coefficients, these will be restored
 * @param[in] dir ac prediction direction for each 8x8 block
 * @param[out] st scantable for each 8x8 block
Lou Logan's avatar
Lou Logan committed
97
 * @param[in] zigzag_last_index index referring to the last non zero coefficient in zigzag order
98
 */
99 100 101
static inline void restore_ac_coeffs(MpegEncContext *s, int16_t block[6][64],
                                     const int dir[6], uint8_t *st[6],
                                     const int zigzag_last_index[6])
102 103
{
    int i, n;
104
    memcpy(s->block_last_index, zigzag_last_index, sizeof(int) * 6);
105

106
    for (n = 0; n < 6; n++) {
107 108
        int16_t *ac_val = s->ac_val[0][0] + s->block_index[n] * 16;

109 110
        st[n] = s->intra_scantable.permutated;
        if (dir[n]) {
111
            /* top prediction */
112
            for (i = 1; i < 8; i++)
113
                block[n][s->idsp.idct_permutation[i]] = ac_val[i + 8];
114
        } else {
115
            /* left prediction */
116
            for (i = 1; i < 8; i++)
117
                block[n][s->idsp.idct_permutation[i << 3]] = ac_val[i];
118 119 120 121 122
        }
    }
}

/**
123
 * Return the optimal value (0 or 1) for the ac_pred element for the given MB in mpeg4.
124 125 126 127
 * This function will also update s->block_last_index and s->ac_val.
 * @param[in,out] block MB coefficients, these will be updated if 1 is returned
 * @param[in] dir ac prediction direction for each 8x8 block
 * @param[out] st scantable for each 8x8 block
Lou Logan's avatar
Lou Logan committed
128
 * @param[out] zigzag_last_index index referring to the last non zero coefficient in zigzag order
129
 */
130 131 132
static inline int decide_ac_pred(MpegEncContext *s, int16_t block[6][64],
                                 const int dir[6], uint8_t *st[6],
                                 int zigzag_last_index[6])
133
{
134
    int score = 0;
135
    int i, n;
136
    int8_t *const qscale_table = s->current_picture.qscale_table;
137

138
    memcpy(zigzag_last_index, s->block_last_index, sizeof(int) * 6);
139

140
    for (n = 0; n < 6; n++) {
141 142
        int16_t *ac_val, *ac_val1;

143 144
        score -= get_block_rate(s, block[n], s->block_last_index[n],
                                s->intra_scantable.permutated);
145

146 147 148 149
        ac_val  = s->ac_val[0][0] + s->block_index[n] * 16;
        ac_val1 = ac_val;
        if (dir[n]) {
            const int xy = s->mb_x + s->mb_y * s->mb_stride - s->mb_stride;
150
            /* top prediction */
151 152
            ac_val -= s->block_wrap[n] * 16;
            if (s->mb_y == 0 || s->qscale == qscale_table[xy] || n == 2 || n == 3) {
153
                /* same qscale */
154
                for (i = 1; i < 8; i++) {
155 156 157
                    const int level = block[n][s->idsp.idct_permutation[i]];
                    block[n][s->idsp.idct_permutation[i]] = level - ac_val[i + 8];
                    ac_val1[i]     = block[n][s->idsp.idct_permutation[i << 3]];
158
                    ac_val1[i + 8] = level;
159
                }
160
            } else {
161
                /* different qscale, we must rescale */
162
                for (i = 1; i < 8; i++) {
163 164 165
                    const int level = block[n][s->idsp.idct_permutation[i]];
                    block[n][s->idsp.idct_permutation[i]] = level - ROUNDED_DIV(ac_val[i + 8] * qscale_table[xy], s->qscale);
                    ac_val1[i]     = block[n][s->idsp.idct_permutation[i << 3]];
166
                    ac_val1[i + 8] = level;
167 168
                }
            }
169 170 171
            st[n] = s->intra_h_scantable.permutated;
        } else {
            const int xy = s->mb_x - 1 + s->mb_y * s->mb_stride;
172
            /* left prediction */
173 174
            ac_val -= 16;
            if (s->mb_x == 0 || s->qscale == qscale_table[xy] || n == 1 || n == 3) {
175
                /* same qscale */
176
                for (i = 1; i < 8; i++) {
177 178
                    const int level = block[n][s->idsp.idct_permutation[i << 3]];
                    block[n][s->idsp.idct_permutation[i << 3]] = level - ac_val[i];
179
                    ac_val1[i]     = level;
180
                    ac_val1[i + 8] = block[n][s->idsp.idct_permutation[i]];
181
                }
182
            } else {
183
                /* different qscale, we must rescale */
184
                for (i = 1; i < 8; i++) {
185 186
                    const int level = block[n][s->idsp.idct_permutation[i << 3]];
                    block[n][s->idsp.idct_permutation[i << 3]] = level - ROUNDED_DIV(ac_val[i] * qscale_table[xy], s->qscale);
187
                    ac_val1[i]     = level;
188
                    ac_val1[i + 8] = block[n][s->idsp.idct_permutation[i]];
189 190
                }
            }
191
            st[n] = s->intra_v_scantable.permutated;
192 193
        }

194 195 196 197
        for (i = 63; i > 0; i--)  // FIXME optimize
            if (block[n][st[n][i]])
                break;
        s->block_last_index[n] = i;
198 199 200 201

        score += get_block_rate(s, block[n], s->block_last_index[n], st[n]);
    }

202
    if (score < 0) {
203
        return 1;
204
    } else {
205 206 207 208 209 210
        restore_ac_coeffs(s, block, dir, st, zigzag_last_index);
        return 0;
    }
}

/**
211
 * modify mb_type & qscale so that encoding is actually possible in mpeg4
212
 */
213 214
void ff_clean_mpeg4_qscales(MpegEncContext *s)
{
215
    int i;
216
    int8_t *const qscale_table = s->current_picture.qscale_table;
217 218 219

    ff_clean_h263_qscales(s);

220 221 222 223
    if (s->pict_type == AV_PICTURE_TYPE_B) {
        int odd = 0;
        /* ok, come on, this isn't funny anymore, there's more code for
         * handling this mpeg4 mess than for the actual adaptive quantization */
224

225 226 227
        for (i = 0; i < s->mb_num; i++) {
            int mb_xy = s->mb_index2xy[i];
            odd += qscale_table[mb_xy] & 1;
228 229
        }

230 231 232 233
        if (2 * odd > s->mb_num)
            odd = 1;
        else
            odd = 0;
234

235 236 237
        for (i = 0; i < s->mb_num; i++) {
            int mb_xy = s->mb_index2xy[i];
            if ((qscale_table[mb_xy] & 1) != odd)
238
                qscale_table[mb_xy]++;
239 240
            if (qscale_table[mb_xy] > 31)
                qscale_table[mb_xy] = 31;
241 242
        }

243 244 245 246 247
        for (i = 1; i < s->mb_num; i++) {
            int mb_xy = s->mb_index2xy[i];
            if (qscale_table[mb_xy] != qscale_table[s->mb_index2xy[i - 1]] &&
                (s->mb_type[mb_xy] & CANDIDATE_MB_TYPE_DIRECT)) {
                s->mb_type[mb_xy] |= CANDIDATE_MB_TYPE_BIDIR;
248 249 250 251 252 253
            }
        }
    }
}

/**
254
 * Encode the dc value.
255 256
 * @param n block index (0-3 are luma, 4-5 are chroma)
 */
257
static inline void mpeg4_encode_dc(PutBitContext *s, int level, int n)
258 259
{
#if 1
260
    /* DC will overflow if level is outside the [-255,255] range. */
261
    level += 256;
262 263 264 265 266 267 268 269 270 271 272
    if (n < 4) {
        /* luminance */
        put_bits(s, uni_DCtab_lum_len[level], uni_DCtab_lum_bits[level]);
    } else {
        /* chrominance */
        put_bits(s, uni_DCtab_chrom_len[level], uni_DCtab_chrom_bits[level]);
    }
#else
    int size, v;
    /* find number of bits */
    size = 0;
273
    v    = abs(level);
274 275 276 277 278 279 280
    while (v) {
        v >>= 1;
        size++;
    }

    if (n < 4) {
        /* luminance */
281
        put_bits(s, ff_mpeg4_DCtab_lum[size][1], ff_mpeg4_DCtab_lum[size][0]);
282 283
    } else {
        /* chrominance */
284
        put_bits(s, ff_mpeg4_DCtab_chrom[size][1], ff_mpeg4_DCtab_chrom[size][0]);
285 286 287 288 289 290
    }

    /* encode remaining bits */
    if (size > 0) {
        if (level < 0)
            level = (-level) ^ ((1 << size) - 1);
291
        put_bits(s, size, level);
292
        if (size > 8)
293
            put_bits(s, 1, 1);
294 295 296 297
    }
#endif
}

298 299 300
static inline int mpeg4_get_dc_length(int level, int n)
{
    if (n < 4)
301
        return uni_DCtab_lum_len[level + 256];
302
    else
303 304 305 306
        return uni_DCtab_chrom_len[level + 256];
}

/**
307
 * Encode an 8x8 block.
308 309
 * @param n block index (0-3 are luma, 4-5 are chroma)
 */
310 311 312 313
static inline void mpeg4_encode_block(MpegEncContext *s,
                                      int16_t *block, int n, int intra_dc,
                                      uint8_t *scan_table, PutBitContext *dc_pb,
                                      PutBitContext *ac_pb)
314 315 316 317 318 319
{
    int i, last_non_zero;
    uint32_t *bits_tab;
    uint8_t *len_tab;
    const int last_index = s->block_last_index[n];

320
    if (s->mb_intra) {  // Note gcc (3.2.1 at least) will optimize this away
321 322
        /* mpeg4 based DC predictor */
        mpeg4_encode_dc(dc_pb, intra_dc, n);
323 324
        if (last_index < 1)
            return;
325
        i = 1;
326 327
        bits_tab = uni_mpeg4_intra_rl_bits;
        len_tab  = uni_mpeg4_intra_rl_len;
328
    } else {
329 330
        if (last_index < 0)
            return;
331
        i = 0;
332 333
        bits_tab = uni_mpeg4_inter_rl_bits;
        len_tab  = uni_mpeg4_inter_rl_len;
334 335 336 337 338
    }

    /* AC coefs */
    last_non_zero = i - 1;
    for (; i < last_index; i++) {
339
        int level = block[scan_table[i]];
340 341
        if (level) {
            int run = i - last_non_zero - 1;
342 343 344
            level += 64;
            if ((level & (~127)) == 0) {
                const int index = UNI_MPEG4_ENC_INDEX(0, run, level);
345
                put_bits(ac_pb, len_tab[index], bits_tab[index]);
346 347 348 349 350
            } else {  // ESC3
                put_bits(ac_pb,
                         7 + 2 + 1 + 6 + 1 + 12 + 1,
                         (3 << 23) + (3 << 21) + (0 << 20) + (run << 14) +
                         (1 << 13) + (((level - 64) & 0xfff) << 1) + 1);
351 352 353 354
            }
            last_non_zero = i;
        }
    }
355 356 357 358 359 360
    /* if (i <= last_index) */ {
        int level = block[scan_table[i]];
        int run   = i - last_non_zero - 1;
        level += 64;
        if ((level & (~127)) == 0) {
            const int index = UNI_MPEG4_ENC_INDEX(1, run, level);
361
            put_bits(ac_pb, len_tab[index], bits_tab[index]);
362 363 364 365 366
        } else {  // ESC3
            put_bits(ac_pb,
                     7 + 2 + 1 + 6 + 1 + 12 + 1,
                     (3 << 23) + (3 << 21) + (1 << 20) + (run << 14) +
                     (1 << 13) + (((level - 64) & 0xfff) << 1) + 1);
367 368 369 370
        }
    }
}

371 372 373
/**
 * Return the length in bits of a single (last, run, level) AC event:
 * the table length for levels in [-64, 63], the fixed ESC3 length otherwise.
 */
static inline int mpeg4_ac_coeff_bits(const uint8_t *len_tab,
                                      int last, int run, int level)
{
    const int biased = level + 64;

    if (biased & ~127)
        return 7 + 2 + 1 + 6 + 1 + 12 + 1;  // ESC3

    return len_tab[UNI_MPEG4_ENC_INDEX(last, run, biased)];
}

/**
 * Return the number of bits mpeg4_encode_block() would write for a block,
 * without writing anything.
 *
 * @param s          encoder context (s->mb_intra, s->block_last_index are read)
 * @param block      coefficients of the block
 * @param n          block index (0-3 are luma, 4-5 are chroma)
 * @param intra_dc   DC value whose length is included for intra blocks
 * @param scan_table scan order used to walk block
 */
static int mpeg4_get_block_length(MpegEncContext *s,
                                  int16_t *block, int n,
                                  int intra_dc, uint8_t *scan_table)
{
    const int last_index = s->block_last_index[n];
    const uint8_t *len_tab;
    int total = 0;
    int pos, prev_nz;

    if (s->mb_intra) {
        /* mpeg4 based DC predictor */
        total += mpeg4_get_dc_length(intra_dc, n);
        if (last_index < 1)
            return total;
        pos     = 1;
        len_tab = uni_mpeg4_intra_rl_len;
    } else {
        if (last_index < 0)
            return 0;
        pos     = 0;
        len_tab = uni_mpeg4_inter_rl_len;
    }

    /* AC coefs: everything before last_index is counted with last = 0 */
    prev_nz = pos - 1;
    for (; pos < last_index; pos++) {
        const int level = block[scan_table[pos]];

        if (!level)
            continue;

        total  += mpeg4_ac_coeff_bits(len_tab, 0, pos - prev_nz - 1, level);
        prev_nz = pos;
    }

    /* pos == last_index here: the final coefficient is counted with last = 1 */
    total += mpeg4_ac_coeff_bits(len_tab, 1, pos - prev_nz - 1,
                                 block[scan_table[pos]]);

    return total;
}

425 426 427 428 429
/**
 * Encode (or only account for) the six blocks of a macroblock.
 *
 * With scan_table set, block i uses intra_dc[i] and scan_table[i]; with
 * scan_table NULL every block uses a DC value of 0 and
 * s->intra_scantable.permutated. When CODEC_FLAG2_NO_OUTPUT is set in
 * s->flags2 nothing is encoded; the computed block length is skipped in
 * s->pb instead.
 * NOTE(review): the skip always targets s->pb, not dc_pb/ac_pb - confirm this
 * is intended when those point elsewhere.
 *
 * @param s          encoder context
 * @param block      coefficients of the six blocks
 * @param intra_dc   per block DC values, only read when scan_table is set
 * @param scan_table per block scan orders, or NULL
 * @param dc_pb      bitstream writer receiving DC codes
 * @param ac_pb      bitstream writer receiving AC codes
 */
static inline void mpeg4_encode_blocks(MpegEncContext *s, int16_t block[6][64],
                                       int intra_dc[6], uint8_t **scan_table,
                                       PutBitContext *dc_pb,
                                       PutBitContext *ac_pb)
{
    const int count_only = s->flags2 & CODEC_FLAG2_NO_OUTPUT;
    int i;

    for (i = 0; i < 6; i++) {
        const int dc  = scan_table ? intra_dc[i] : 0;
        uint8_t *scan = scan_table ? scan_table[i]
                                   : s->intra_scantable.permutated;

        if (count_only) {
            skip_put_bits(&s->pb,
                          mpeg4_get_block_length(s, block[i], i, dc, scan));
        } else {
            /* encode each block */
            mpeg4_encode_block(s, block[i], i, dc, scan, dc_pb, ac_pb);
        }
    }
}

459
/**
 * Compute the coded block pattern of a macroblock in a B picture.
 *
 * Bit (5 - i) of the result is set when block i is coded. Without
 * FF_MPV_FLAG_CBP_RD a block is coded when its block_last_index is >= 0.
 * With the flag, a block is coded when s->coded_score[i] is negative, unless
 * the summed score does not beat a lambda weighted cost of coding nothing;
 * blocks that end up uncoded are cleared and get block_last_index = -1.
 *
 * @param s        encoder context
 * @param block    MB coefficients (not accessed here; s->block is cleared)
 * @param motion_x horizontal motion vector component of the MB
 * @param motion_y vertical motion vector component of the MB
 * @param mb_type  B macroblock type index, 0 meaning direct
 * @return the coded block pattern
 */
static inline int get_b_cbp(MpegEncContext *s, int16_t block[6][64],
                            int motion_x, int motion_y, int mb_type)
{
    int cbp   = 0;
    int score = 0;
    int i, lambda, zero_score;

    if (!(s->mpv_flags & FF_MPV_FLAG_CBP_RD)) {
        for (i = 0; i < 6; i++)
            if (s->block_last_index[i] >= 0)
                cbp |= 1 << (5 - i);
        return cbp;
    }

    lambda = s->lambda2 >> (FF_LAMBDA_SHIFT - 6);

    for (i = 0; i < 6; i++) {
        if (s->coded_score[i] < 0) {
            score += s->coded_score[i];
            cbp   |= 1 << (5 - i);
        }
    }

    if (cbp) {
        /* 4 more when everything is zero: 2 * MV + mb_type + cbp bit */
        zero_score = (motion_x | motion_y | s->dquant | mb_type) ? -6 : -10;
        if (zero_score * lambda <= score)
            cbp = 0;
    }

    for (i = 0; i < 6; i++) {
        if (s->block_last_index[i] < 0 || ((cbp >> (5 - i)) & 1))
            continue;
        s->block_last_index[i] = -1;
        s->bdsp.clear_block(s->block[i]);
    }

    return cbp;
}

500 501
// FIXME this is duplicated to h263.c
/* 2 bit dquant codes, indexed by (dquant + 2). Users in this file only look
 * the table up when dquant is non zero, so the middle entry is not written. */
static const int dquant_code[5] = { 1, 0, 9, 2, 3 };
502

503
void ff_mpeg4_encode_mb(MpegEncContext *s, int16_t block[6][64],
504
                        int motion_x, int motion_y)
505 506
{
    int cbpc, cbpy, pred_x, pred_y;
507 508 509 510
    PutBitContext *const pb2    = s->data_partitioning ? &s->pb2 : &s->pb;
    PutBitContext *const tex_pb = s->data_partitioning && s->pict_type != AV_PICTURE_TYPE_B ? &s->tex_pb : &s->pb;
    PutBitContext *const dc_pb  = s->data_partitioning && s->pict_type != AV_PICTURE_TYPE_I ? &s->pb2 : &s->pb;
    const int interleaved_stats = (s->flags & CODEC_FLAG_PASS1) && !s->data_partitioning ? 1 : 0;
511 512 513 514

    if (!s->mb_intra) {
        int i, cbp;

515 516 517 518 519 520 521 522 523 524 525
        if (s->pict_type == AV_PICTURE_TYPE_B) {
            /* convert from mv_dir to type */
            static const int mb_type_table[8] = { -1, 3, 2, 1, -1, -1, -1, 0 };
            int mb_type = mb_type_table[s->mv_dir];

            if (s->mb_x == 0) {
                for (i = 0; i < 2; i++)
                    s->last_mv[i][0][0] =
                    s->last_mv[i][0][1] =
                    s->last_mv[i][1][0] =
                    s->last_mv[i][1][1] = 0;
526 527
            }

528 529 530
            av_assert2(s->dquant >= -2 && s->dquant <= 2);
            av_assert2((s->dquant & 1) == 0);
            av_assert2(mb_type >= 0);
531 532

            /* nothing to do if this MB was skipped in the next P Frame */
533
            if (s->next_picture.mbskip_table[s->mb_y * s->mb_stride + s->mb_x]) {  // FIXME avoid DCT & ...
534
                s->skip_count++;
535 536 537 538 539
                s->mv[0][0][0] =
                s->mv[0][0][1] =
                s->mv[1][0][0] =
                s->mv[1][0][1] = 0;
                s->mv_dir  = MV_DIR_FORWARD;  // doesn't matter
540
                s->qscale -= s->dquant;
541
//                s->mb_skipped = 1;
542 543 544 545

                return;
            }

546
            cbp = get_b_cbp(s, block, motion_x, motion_y, mb_type);
547

548
            if ((cbp | motion_x | motion_y | mb_type) == 0) {
549
                /* direct MB with MV={0,0} */
550
                av_assert2(s->dquant == 0);
551 552 553

                put_bits(&s->pb, 1, 1); /* mb not coded modb1=1 */

554
                if (interleaved_stats) {
555 556 557 558 559 560 561
                    s->misc_bits++;
                    s->last_bits++;
                }
                s->skip_count++;
                return;
            }

562 563 564 565 566
            put_bits(&s->pb, 1, 0);            /* mb coded modb1=0 */
            put_bits(&s->pb, 1, cbp ? 0 : 1);  /* modb2 */ // FIXME merge
            put_bits(&s->pb, mb_type + 1, 1);  // this table is so simple that we don't need it :)
            if (cbp)
                put_bits(&s->pb, 6, cbp);
567

568 569 570
            if (cbp && mb_type) {
                if (s->dquant)
                    put_bits(&s->pb, 2, (s->dquant >> 2) + 3);
571 572
                else
                    put_bits(&s->pb, 1, 0);
573
            } else
574 575
                s->qscale -= s->dquant;

576 577
            if (!s->progressive_sequence) {
                if (cbp)
578
                    put_bits(&s->pb, 1, s->interlaced_dct);
579
                if (mb_type)                  // not direct mode
580 581 582
                    put_bits(&s->pb, 1, s->mv_type == MV_TYPE_FIELD);
            }

583 584
            if (interleaved_stats)
                s->misc_bits += get_bits_diff(s);
585

586
            if (!mb_type) {
587
                av_assert2(s->mv_dir & MV_DIRECT);
588 589 590
                ff_h263_encode_motion_vector(s, motion_x, motion_y, 1);
                s->b_count++;
                s->f_count++;
591
            } else {
592
                av_assert2(mb_type > 0 && mb_type < 4);
593 594 595 596 597 598 599 600 601 602
                if (s->mv_type != MV_TYPE_FIELD) {
                    if (s->mv_dir & MV_DIR_FORWARD) {
                        ff_h263_encode_motion_vector(s,
                                                     s->mv[0][0][0] - s->last_mv[0][0][0],
                                                     s->mv[0][0][1] - s->last_mv[0][0][1],
                                                     s->f_code);
                        s->last_mv[0][0][0] =
                        s->last_mv[0][1][0] = s->mv[0][0][0];
                        s->last_mv[0][0][1] =
                        s->last_mv[0][1][1] = s->mv[0][0][1];
603 604
                        s->f_count++;
                    }
605 606 607 608 609 610 611 612 613
                    if (s->mv_dir & MV_DIR_BACKWARD) {
                        ff_h263_encode_motion_vector(s,
                                                     s->mv[1][0][0] - s->last_mv[1][0][0],
                                                     s->mv[1][0][1] - s->last_mv[1][0][1],
                                                     s->b_code);
                        s->last_mv[1][0][0] =
                        s->last_mv[1][1][0] = s->mv[1][0][0];
                        s->last_mv[1][0][1] =
                        s->last_mv[1][1][1] = s->mv[1][0][1];
614 615
                        s->b_count++;
                    }
616 617
                } else {
                    if (s->mv_dir & MV_DIR_FORWARD) {
618 619 620
                        put_bits(&s->pb, 1, s->field_select[0][0]);
                        put_bits(&s->pb, 1, s->field_select[0][1]);
                    }
621
                    if (s->mv_dir & MV_DIR_BACKWARD) {
622 623 624
                        put_bits(&s->pb, 1, s->field_select[1][0]);
                        put_bits(&s->pb, 1, s->field_select[1][1]);
                    }
625 626 627 628 629 630 631 632
                    if (s->mv_dir & MV_DIR_FORWARD) {
                        for (i = 0; i < 2; i++) {
                            ff_h263_encode_motion_vector(s,
                                                         s->mv[0][i][0] - s->last_mv[0][i][0],
                                                         s->mv[0][i][1] - s->last_mv[0][i][1] / 2,
                                                         s->f_code);
                            s->last_mv[0][i][0] = s->mv[0][i][0];
                            s->last_mv[0][i][1] = s->mv[0][i][1] * 2;
633 634 635
                        }
                        s->f_count++;
                    }
636 637 638 639 640 641 642 643
                    if (s->mv_dir & MV_DIR_BACKWARD) {
                        for (i = 0; i < 2; i++) {
                            ff_h263_encode_motion_vector(s,
                                                         s->mv[1][i][0] - s->last_mv[1][i][0],
                                                         s->mv[1][i][1] - s->last_mv[1][i][1] / 2,
                                                         s->b_code);
                            s->last_mv[1][i][0] = s->mv[1][i][0];
                            s->last_mv[1][i][1] = s->mv[1][i][1] * 2;
644 645 646 647 648 649
                        }
                        s->b_count++;
                    }
                }
            }

650 651
            if (interleaved_stats)
                s->mv_bits += get_bits_diff(s);
652 653 654

            mpeg4_encode_blocks(s, block, NULL, NULL, NULL, &s->pb);

655 656 657 658 659 660 661 662 663 664 665
            if (interleaved_stats)
                s->p_tex_bits += get_bits_diff(s);
        } else { /* s->pict_type==AV_PICTURE_TYPE_B */
            cbp = get_p_cbp(s, block, motion_x, motion_y);

            if ((cbp | motion_x | motion_y | s->dquant) == 0 &&
                s->mv_type == MV_TYPE_16X16) {
                /* check if the B frames can skip it too, as we must skip it
                 * if we skip here why didn't they just compress
                 * the skip-mb bits instead of reusing them ?! */
                if (s->max_b_frames > 0) {
666
                    int i;
667
                    int x, y, offset;
668 669
                    uint8_t *p_pic;

670 671
                    x = s->mb_x * 16;
                    y = s->mb_y * 16;
672

673
                    offset = x + y * s->linesize;
674
                    p_pic  = s->new_picture.f->data[0] + offset;
675

676 677
                    s->mb_skipped = 1;
                    for (i = 0; i < s->max_b_frames; i++) {
678 679
                        uint8_t *b_pic;
                        int diff;
680
                        Picture *pic = s->reordered_input_picture[i + 1];
681

682
                        if (!pic || pic->f->pict_type != AV_PICTURE_TYPE_B)
683
                            break;
684

685
                        b_pic = pic->f->data[0] + offset;
686
                        if (!pic->shared)
687
                            b_pic += INPLACE_OFFSET;
688 689 690 691 692 693 694 695 696

                        if (x + 16 > s->width || y + 16 > s->height) {
                            int x1, y1;
                            int xe = FFMIN(16, s->width - x);
                            int ye = FFMIN(16, s->height - y);
                            diff = 0;
                            for (y1 = 0; y1 < ye; y1++) {
                                for (x1 = 0; x1 < xe; x1++) {
                                    diff += FFABS(p_pic[x1 + y1 * s->linesize] - b_pic[x1 + y1 * s->linesize]);
Michael Niedermayer's avatar
Michael Niedermayer committed
697 698
                                }
                            }
699 700
                            diff = diff * 256 / (xe * ye);
                        } else {
701
                            diff = s->mecc.sad[0](NULL, p_pic, b_pic, s->linesize, 16);
Michael Niedermayer's avatar
Michael Niedermayer committed
702
                        }
703 704
                        if (diff > s->qscale * 70) {  // FIXME check that 70 is optimal
                            s->mb_skipped = 0;
705 706 707
                            break;
                        }
                    }
708 709
                } else
                    s->mb_skipped = 1;
710

711
                if (s->mb_skipped == 1) {
712 713 714
                    /* skip macroblock */
                    put_bits(&s->pb, 1, 1);

715
                    if (interleaved_stats) {
716 717 718 719 720 721 722 723 724 725
                        s->misc_bits++;
                        s->last_bits++;
                    }
                    s->skip_count++;

                    return;
                }
            }

            put_bits(&s->pb, 1, 0);     /* mb coded */
726 727
            cbpc  = cbp & 3;
            cbpy  = cbp >> 2;
728
            cbpy ^= 0xf;
729 730 731
            if (s->mv_type == MV_TYPE_16X16) {
                if (s->dquant)
                    cbpc += 8;
732
                put_bits(&s->pb,
733 734
                         ff_h263_inter_MCBPC_bits[cbpc],
                         ff_h263_inter_MCBPC_code[cbpc]);
735

736
                put_bits(pb2, ff_h263_cbpy_tab[cbpy][1], ff_h263_cbpy_tab[cbpy][0]);
737 738
                if (s->dquant)
                    put_bits(pb2, 2, dquant_code[s->dquant + 2]);
739

740 741
                if (!s->progressive_sequence) {
                    if (cbp)
742 743 744 745
                        put_bits(pb2, 1, s->interlaced_dct);
                    put_bits(pb2, 1, 0);
                }

746 747
                if (interleaved_stats)
                    s->misc_bits += get_bits_diff(s);
748 749

                /* motion vectors: 16x16 mode */
750
                ff_h263_pred_motion(s, 0, 0, &pred_x, &pred_y);
751

752 753 754 755 756 757 758
                ff_h263_encode_motion_vector(s,
                                             motion_x - pred_x,
                                             motion_y - pred_y,
                                             s->f_code);
            } else if (s->mv_type == MV_TYPE_FIELD) {
                if (s->dquant)
                    cbpc += 8;
759
                put_bits(&s->pb,
760 761
                         ff_h263_inter_MCBPC_bits[cbpc],
                         ff_h263_inter_MCBPC_code[cbpc]);
762

763
                put_bits(pb2, ff_h263_cbpy_tab[cbpy][1], ff_h263_cbpy_tab[cbpy][0]);
764 765
                if (s->dquant)
                    put_bits(pb2, 2, dquant_code[s->dquant + 2]);
766

767
                av_assert2(!s->progressive_sequence);
768
                if (cbp)
769 770 771
                    put_bits(pb2, 1, s->interlaced_dct);
                put_bits(pb2, 1, 1);

772 773
                if (interleaved_stats)
                    s->misc_bits += get_bits_diff(s);
774 775

                /* motion vectors: 16x8 interlaced mode */
776
                ff_h263_pred_motion(s, 0, 0, &pred_x, &pred_y);
777
                pred_y /= 2;
778 779 780 781

                put_bits(&s->pb, 1, s->field_select[0][0]);
                put_bits(&s->pb, 1, s->field_select[0][1]);

782 783 784 785 786 787 788 789 790
                ff_h263_encode_motion_vector(s,
                                             s->mv[0][0][0] - pred_x,
                                             s->mv[0][0][1] - pred_y,
                                             s->f_code);
                ff_h263_encode_motion_vector(s,
                                             s->mv[0][1][0] - pred_x,
                                             s->mv[0][1][1] - pred_y,
                                             s->f_code);
            } else {
791
                av_assert2(s->mv_type == MV_TYPE_8X8);
792
                put_bits(&s->pb,
793 794
                         ff_h263_inter_MCBPC_bits[cbpc + 16],
                         ff_h263_inter_MCBPC_code[cbpc + 16]);
795
                put_bits(pb2, ff_h263_cbpy_tab[cbpy][1], ff_h263_cbpy_tab[cbpy][0]);
796

797 798
                if (!s->progressive_sequence && cbp)
                    put_bits(pb2, 1, s->interlaced_dct);
799

800 801
                if (interleaved_stats)
                    s->misc_bits += get_bits_diff(s);
802

803
                for (i = 0; i < 4; i++) {
804
                    /* motion vectors: 8x8 mode*/
805
                    ff_h263_pred_motion(s, i, 0, &pred_x, &pred_y);
806

807 808 809 810
                    ff_h263_encode_motion_vector(s,
                                                 s->current_picture.motion_val[0][s->block_index[i]][0] - pred_x,
                                                 s->current_picture.motion_val[0][s->block_index[i]][1] - pred_y,
                                                 s->f_code);
811 812 813
                }
            }

814 815
            if (interleaved_stats)
                s->mv_bits += get_bits_diff(s);
816 817 818

            mpeg4_encode_blocks(s, block, NULL, NULL, NULL, tex_pb);

819 820 821
            if (interleaved_stats)
                s->p_tex_bits += get_bits_diff(s);

822 823 824 825
            s->f_count++;
        }
    } else {
        int cbp;
826 827
        int dc_diff[6];  // dc values with the dc prediction subtracted
        int dir[6];      // prediction direction
828 829 830 831
        int zigzag_last_index[6];
        uint8_t *scan_table[6];
        int i;

832 833
        for (i = 0; i < 6; i++)
            dc_diff[i] = ff_mpeg4_pred_dc(s, i, block[i][0], &dir[i], 1);
834

835 836 837 838 839
        if (s->flags & CODEC_FLAG_AC_PRED) {
            s->ac_pred = decide_ac_pred(s, block, dir, scan_table, zigzag_last_index);
        } else {
            for (i = 0; i < 6; i++)
                scan_table[i] = s->intra_scantable.permutated;
840 841 842 843
        }

        /* compute cbp */
        cbp = 0;
844
        for (i = 0; i < 6; i++)
845 846 847 848
            if (s->block_last_index[i] >= 1)
                cbp |= 1 << (5 - i);

        cbpc = cbp & 3;
849
        if (s->pict_type == AV_PICTURE_TYPE_I) {
850 851
            if (s->dquant)
                cbpc += 4;
852
            put_bits(&s->pb,
853 854
                     ff_h263_intra_MCBPC_bits[cbpc],
                     ff_h263_intra_MCBPC_code[cbpc]);
855
        } else {
856 857
            if (s->dquant)
                cbpc += 8;
858 859
            put_bits(&s->pb, 1, 0);     /* mb coded */
            put_bits(&s->pb,
860 861
                     ff_h263_inter_MCBPC_bits[cbpc + 4],
                     ff_h263_inter_MCBPC_code[cbpc + 4]);
862 863 864
        }
        put_bits(pb2, 1, s->ac_pred);
        cbpy = cbp >> 2;
865
        put_bits(pb2, ff_h263_cbpy_tab[cbpy][1], ff_h263_cbpy_tab[cbpy][0]);
866 867
        if (s->dquant)
            put_bits(dc_pb, 2, dquant_code[s->dquant + 2]);
868

869
        if (!s->progressive_sequence)
870 871
            put_bits(dc_pb, 1, s->interlaced_dct);

872 873
        if (interleaved_stats)
            s->misc_bits += get_bits_diff(s);
874 875 876

        mpeg4_encode_blocks(s, block, dc_diff, scan_table, dc_pb, tex_pb);

877 878
        if (interleaved_stats)
            s->i_tex_bits += get_bits_diff(s);
879 880
        s->i_count++;

881 882 883
        /* restore ac coeffs & last_index stuff
         * if we messed them up with the prediction */
        if (s->ac_pred)
884 885 886 887 888 889 890
            restore_ac_coeffs(s, block, dir, scan_table, zigzag_last_index);
    }
}

/**
 * add mpeg4 stuffing bits (01...1)
 */
891
void ff_mpeg4_stuffing(PutBitContext *pbc)
892 893 894
{
    int length;
    put_bits(pbc, 1, 0);
895 896 897
    length = (-put_bits_count(pbc)) & 7;
    if (length)
        put_bits(pbc, length, (1 << length) - 1);
898 899 900
}

/* must be called before writing the header */
901 902 903
void ff_set_mpeg4_time(MpegEncContext *s)
{
    if (s->pict_type == AV_PICTURE_TYPE_B) {
904
        ff_mpeg4_init_direct_mv(s);
905 906
    } else {
        s->last_time_base = s->time_base;
907
        s->time_base      = FFUDIV(s->time, s->avctx->time_base.den);
908 909 910
    }
}

911 912
/**
 * Write a group-of-VOP header to s->pb.
 *
 * The time code is derived from the pts of the current picture, or from the
 * pts of reordered_input_picture[1] when that one exists and is smaller.
 * As a side effect s->last_time_base is set to the whole-second part of that
 * time.
 */
static void mpeg4_encode_gop_header(MpegEncContext *s)
{
    int64_t gop_time;
    int total_seconds, total_minutes, total_hours;
    int hh, mm, ss;

    put_bits(&s->pb, 16, 0);
    put_bits(&s->pb, 16, GOP_STARTCODE);

    gop_time = s->current_picture_ptr->f->pts;
    if (s->reordered_input_picture[1])
        gop_time = FFMIN(gop_time, s->reordered_input_picture[1]->f->pts);
    gop_time *= s->avctx->time_base.num;
    s->last_time_base = FFUDIV(gop_time, s->avctx->time_base.den);

    /* Split the whole seconds into an hh:mm:ss time code, hours modulo 24. */
    total_seconds = FFUDIV(gop_time, s->avctx->time_base.den);
    ss            = FFUMOD(total_seconds, 60);
    total_minutes = FFUDIV(total_seconds, 60);
    mm            = FFUMOD(total_minutes, 60);
    total_hours   = FFUDIV(total_minutes, 60);
    hh            = FFUMOD(total_hours, 24);

    put_bits(&s->pb, 5, hh);
    put_bits(&s->pb, 6, mm);
    put_bits(&s->pb, 1, 1);
    put_bits(&s->pb, 6, ss);

    put_bits(&s->pb, 1, !!(s->flags & CODEC_FLAG_CLOSED_GOP));
    put_bits(&s->pb, 1, 0);  // broken link == NO

    ff_mpeg4_stuffing(&s->pb);
}

941 942
/**
 * Write the visual object sequence and visual object headers to s->pb.
 *
 * The 8-bit profile_and_level_indication is built from avctx->profile
 * (shifted left by 4) and avctx->level when they are set. Otherwise it
 * falls back to advanced simple (0xF0) if B-frames or quarter sample are in
 * use, else simple (0x00), and to level 1.
 */
static void mpeg4_encode_visual_object_header(MpegEncContext *s)
{
    int pl_indication;
    int vo_ver_id;

    /* profile part */
    if (s->avctx->profile != FF_PROFILE_UNKNOWN)
        pl_indication = s->avctx->profile << 4;
    else if (s->max_b_frames || s->quarter_sample)
        pl_indication = 0xF0;  // adv simple
    else
        pl_indication = 0x00;  // simple

    /* level part, defaulting to level 1 */
    pl_indication |= (s->avctx->level != FF_LEVEL_UNKNOWN) ? s->avctx->level
                                                           : 1;

    vo_ver_id = ((pl_indication >> 4) == 0xF) ? 5 : 1;

    // FIXME levels

    put_bits(&s->pb, 16, 0);
    put_bits(&s->pb, 16, VOS_STARTCODE);

    put_bits(&s->pb, 8, pl_indication);

    put_bits(&s->pb, 16, 0);
    put_bits(&s->pb, 16, VISUAL_OBJ_STARTCODE);

    put_bits(&s->pb, 1, 1);
    put_bits(&s->pb, 4, vo_ver_id);
    put_bits(&s->pb, 3, 1);     // priority

    put_bits(&s->pb, 4, 1);     // visual obj type== video obj

    put_bits(&s->pb, 1, 0);     // video signal type == no clue // FIXME

    ff_mpeg4_stuffing(&s->pb);
}

985 986 987
/**
 * Write the video object and video object layer (VOL) headers to s->pb,
 * followed by stuffing and, unless CODEC_FLAG_BITEXACT is set, a user_data
 * section carrying the LIBAVCODEC_IDENT string.
 *
 * Side effects besides the bitstream output: s->vo_type and
 * s->aspect_ratio_info are set, s->time_increment_bits is raised to at least
 * 1, and for an extended aspect ratio avctx->sample_aspect_ratio is reduced
 * in place (limit 255) before being written into two 8-bit fields.
 *
 * @param s          encoder context
 * @param vo_number  added to 0x100 to form the video object start code
 * @param vol_number added to 0x120 to form the video object layer start code
 */
static void mpeg4_encode_vol_header(MpegEncContext *s,
                                    int vo_number,
                                    int vol_number)
{
    PutBitContext *const pb = &s->pb;
    const int ms_workaround = s->workaround_bugs & FF_BUG_MS;
    int vo_ver_id;

    if (!CONFIG_MPEG4_ENCODER)
        return;

    /* B-frames or quarter sample select the advanced simple object type
     * (version id 5); otherwise the simple type (version id 1) is used. */
    if (s->max_b_frames || s->quarter_sample) {
        s->vo_type = ADV_SIMPLE_VO_TYPE;
        vo_ver_id  = 5;
    } else {
        s->vo_type = SIMPLE_VO_TYPE;
        vo_ver_id  = 1;
    }

    put_bits(pb, 16, 0);
    put_bits(pb, 16, 0x100 + vo_number);    /* video obj */
    put_bits(pb, 16, 0);
    put_bits(pb, 16, 0x120 + vol_number);   /* video obj layer */

    put_bits(pb, 1, 0);                     /* random access vol */
    put_bits(pb, 8, s->vo_type);            /* video obj type indication */
    if (!ms_workaround) {
        put_bits(pb, 1, 1);                 /* is obj layer id= yes */
        put_bits(pb, 4, vo_ver_id);         /* is obj layer ver id */
        put_bits(pb, 3, 1);                 /* is obj layer priority */
    } else {
        put_bits(pb, 1, 0);                 /* is obj layer id= no */
    }

    s->aspect_ratio_info = ff_h263_aspect_to_info(s->avctx->sample_aspect_ratio);

    put_bits(pb, 4, s->aspect_ratio_info);  /* aspect ratio info */
    if (s->aspect_ratio_info == FF_ASPECT_EXTENDED) {
        /* Both terms are written as 8-bit values, so reduce them first. */
        av_reduce(&s->avctx->sample_aspect_ratio.num,
                  &s->avctx->sample_aspect_ratio.den,
                  s->avctx->sample_aspect_ratio.num,
                  s->avctx->sample_aspect_ratio.den, 255);
        put_bits(pb, 8, s->avctx->sample_aspect_ratio.num);
        put_bits(pb, 8, s->avctx->sample_aspect_ratio.den);
    }

    if (!ms_workaround) {
        put_bits(pb, 1, 1);                 /* vol control parameters= yes */
        put_bits(pb, 2, 1);                 /* chroma format YUV 420/YV12 */
        put_bits(pb, 1, s->low_delay);
        put_bits(pb, 1, 0);                 /* vbv parameters= no */
    } else {
        put_bits(pb, 1, 0);                 /* vol control parameters= no @@@ */
    }

    put_bits(pb, 2, RECT_SHAPE);            /* vol shape= rectangle */
    put_bits(pb, 1, 1);                     /* marker bit */

    put_bits(pb, 16, s->avctx->time_base.den);
    if (s->time_increment_bits < 1)
        s->time_increment_bits = 1;
    put_bits(pb, 1, 1);                     /* marker bit */
    put_bits(pb, 1, 0);                     /* fixed vop rate=no */
    put_bits(pb, 1, 1);                     /* marker bit */
    put_bits(pb, 13, s->width);             /* vol width */
    put_bits(pb, 1, 1);                     /* marker bit */
    put_bits(pb, 13, s->height);            /* vol height */
    put_bits(pb, 1, 1);                     /* marker bit */
    put_bits(pb, 1, !s->progressive_sequence);
    put_bits(pb, 1, 1);                     /* obmc disable */

    /* sprite enable: 1 bit for version id 1, 2 bits otherwise */
    put_bits(pb, vo_ver_id == 1 ? 1 : 2, 0);

    put_bits(pb, 1, 0);                     /* not 8 bit == false */
    put_bits(pb, 1, s->mpeg_quant);         /* quant type= (0=h263 style)*/

    if (s->mpeg_quant) {
        ff_write_quant_matrix(pb, s->avctx->intra_matrix);
        ff_write_quant_matrix(pb, s->avctx->inter_matrix);
    }

    if (vo_ver_id != 1)
        put_bits(pb, 1, s->quarter_sample);
    put_bits(pb, 1, 1);                     /* complexity estimation disable */
    put_bits(pb, 1, !s->rtp_mode);          /* resync marker disable */
    put_bits(pb, 1, !!s->data_partitioning);
    if (s->data_partitioning)
        put_bits(pb, 1, 0);                 /* no rvlc */

    if (vo_ver_id != 1) {
        put_bits(pb, 1, 0);                 /* newpred */
        put_bits(pb, 1, 0);                 /* reduced res vop */
    }
    put_bits(pb, 1, 0);                     /* scalability */

    ff_mpeg4_stuffing(pb);

    /* user data */
    if (s->flags & CODEC_FLAG_BITEXACT)
        return;

    put_bits(pb, 16, 0);
    put_bits(pb, 16, 0x1B2);                /* user_data */
    avpriv_put_string(pb, LIBAVCODEC_IDENT, 0);
}

/* write mpeg4 VOP header */
1089
void ff_mpeg4_encode_picture_header(MpegEncContext *s, int picture_number)
1090 1091 1092 1093
{
    int time_incr;
    int time_div, time_mod;

1094 1095 1096
    if (s->pict_type == AV_PICTURE_TYPE_I) {
        if (!(s->flags & CODEC_FLAG_GLOBAL_HEADER)) {
            if (s->strict_std_compliance < FF_COMPLIANCE_VERY_STRICT)  // HACK, the reference sw is buggy
1097
                mpeg4_encode_visual_object_header(s);
1098
            if (s->strict_std_compliance < FF_COMPLIANCE_VERY_STRICT || picture_number == 0)  // HACK, the reference sw is buggy
1099 1100
                mpeg4_encode_vol_header(s, 0, 0);
        }
1101
        if (!(s->workaround_bugs & FF_BUG_MS))
1102 1103 1104
            mpeg4_encode_gop_header(s);
    }

1105
    s->partitioned_frame = s->data_partitioning && s->pict_type != AV_PICTURE_TYPE_B;
1106 1107 1108 1109 1110

    put_bits(&s->pb, 16, 0);                /* vop header */
    put_bits(&s->pb, 16, VOP_STARTCODE);    /* vop header */
    put_bits(&s->pb, 2, s->pict_type - 1);  /* pict type: I = 0 , P = 1 */

1111 1112
    time_div  = FFUDIV(s->time, s->avctx->time_base.den);
    time_mod  = FFUMOD(s->time, s->avctx->time_base.den);
1113
    time_incr = time_div - s->last_time_base;
1114
    av_assert0(time_incr >= 0);
1115
    while (time_incr--)
1116 1117 1118 1119 1120 1121 1122 1123
        put_bits(&s->pb, 1, 1);

    put_bits(&s->pb, 1, 0);

    put_bits(&s->pb, 1, 1);                             /* marker */
    put_bits(&s->pb, s->time_increment_bits, time_mod); /* time increment */
    put_bits(&s->pb, 1, 1);                             /* marker */
    put_bits(&s->pb, 1, 1);                             /* vop coded */
1124
    if (s->pict_type == AV_PICTURE_TYPE_P) {
1125 1126 1127
        put_bits(&s->pb, 1, s->no_rounding);    /* rounding type */
    }
    put_bits(&s->pb, 3, 0);     /* intra dc VLC threshold */
1128
    if (!s->progressive_sequence) {
1129
        put_bits(&s->pb, 1, s->current_picture_ptr->f->top_field_first);
1130
        put_bits(&s->pb, 1, s->alternate_scan);
1131
    }
1132
    // FIXME sprite stuff
1133 1134 1135

    put_bits(&s->pb, 5, s->qscale);

1136
    if (s->pict_type != AV_PICTURE_TYPE_I)
1137
        put_bits(&s->pb, 3, s->f_code);  /* fcode_for */
1138
    if (s->pict_type == AV_PICTURE_TYPE_B)
1139
        put_bits(&s->pb, 3, s->b_code);  /* fcode_back */
1140 1141
}

1142
static av_cold void init_uni_dc_tab(void)
1143 1144 1145
{
    int level, uni_code, uni_len;

1146
    for (level = -256; level < 256; level++) {
1147 1148 1149
        int size, v, l;
        /* find number of bits */
        size = 0;
1150
        v    = abs(level);
1151 1152 1153 1154 1155 1156
        while (v) {
            v >>= 1;
            size++;
        }

        if (level < 0)
1157
            l = (-level) ^ ((1 << size) - 1);
1158
        else
1159
            l = level;
1160 1161

        /* luminance */
1162 1163
        uni_code = ff_mpeg4_DCtab_lum[size][0];
        uni_len  = ff_mpeg4_DCtab_lum[size][1];
1164 1165

        if (size > 0) {
1166 1167 1168 1169 1170 1171
            uni_code <<= size;
            uni_code  |= l;
            uni_len   += size;
            if (size > 8) {
                uni_code <<= 1;
                uni_code  |= 1;
1172 1173 1174
                uni_len++;
            }
        }
1175 1176
        uni_DCtab_lum_bits[level + 256] = uni_code;
        uni_DCtab_lum_len[level + 256]  = uni_len;
1177 1178

        /* chrominance */
1179 1180
        uni_code = ff_mpeg4_DCtab_chrom[size][0];
        uni_len  = ff_mpeg4_DCtab_chrom[size][1];
1181 1182

        if (size > 0) {
1183 1184 1185 1186 1187 1188
            uni_code <<= size;
            uni_code  |= l;
            uni_len   += size;
            if (size > 8) {
                uni_code <<= 1;
                uni_code  |= 1;
1189 1190 1191
                uni_len++;
            }
        }
1192 1193
        uni_DCtab_chrom_bits[level + 256] = uni_code;
        uni_DCtab_chrom_len[level + 256]  = uni_len;
1194 1195 1196
    }
}

1197 1198 1199
/**
 * Build a unified run/level code table from an RLTable.
 *
 * For every (last, run, signed level) combination with level in [-64, 63]
 * except 0, the four candidate encodings (plain VLC and the three escape
 * forms) are tried in turn, and the shortest one is stored at
 * UNI_MPEG4_ENC_INDEX(last, run, level + 64).
 *
 * @param rl       source run/level VLC table; entry rl->n is the escape code
 * @param bits_tab receives the code bits of the chosen encoding
 * @param len_tab  receives the length in bits of the chosen encoding
 */
static av_cold void init_uni_mpeg4_rl_tab(RLTable *rl, uint32_t *bits_tab,
                                          uint8_t *len_tab)
{
    int slevel, run, last;

    av_assert0(MAX_LEVEL >= 64);
    av_assert0(MAX_RUN >= 63);

    for (slevel = -64; slevel < 64; slevel++) {
        const int sign  = slevel < 0;
        const int level = sign ? -slevel : slevel;

        if (!slevel)
            continue;

        for (run = 0; run < 64; run++) {
            for (last = 0; last <= 1; last++) {
                const int index   = UNI_MPEG4_ENC_INDEX(last, run, slevel + 64);
                const int esc     = rl->table_vlc[rl->n][0];
                const int esc_len = rl->table_vlc[rl->n][1];
                int code, bits, len;
                int level1, run1;

                /* start value that any candidate below has to beat */
                len_tab[index] = 100;

                /* ESC0 */
                code = get_rl_index(rl, last, run, level);
                bits = (rl->table_vlc[code][0] << 1) | sign;
                len  = rl->table_vlc[code][1] + 1;

                if (code != rl->n && len < len_tab[index]) {
                    bits_tab[index] = bits;
                    len_tab[index]  = len;
                }

                /* ESC1 */
                level1 = level - rl->max_level[last][run];
                if (level1 > 0) {
                    code = get_rl_index(rl, last, run, level1);
                    bits = esc << 1;                    // esc1
                    len  = esc_len + 1;
                    bits = (bits << rl->table_vlc[code][1]) +
                           rl->table_vlc[code][0];
                    len += rl->table_vlc[code][1];
                    bits = (bits << 1) | sign;
                    len++;

                    if (code != rl->n && len < len_tab[index]) {
                        bits_tab[index] = bits;
                        len_tab[index]  = len;
                    }
                }

                /* ESC2 */
                run1 = run - rl->max_run[last][level] - 1;
                if (run1 >= 0) {
                    code = get_rl_index(rl, last, run1, level);
                    bits = (esc << 2) | 2;              // esc2
                    len  = esc_len + 2;
                    bits = (bits << rl->table_vlc[code][1]) +
                           rl->table_vlc[code][0];
                    len += rl->table_vlc[code][1];
                    bits = (bits << 1) | sign;
                    len++;

                    if (code != rl->n && len < len_tab[index]) {
                        bits_tab[index] = bits;
                        len_tab[index]  = len;
                    }
                }

                /* ESC3 */
                bits = (esc << 2) | 3;                  // esc3
                bits = (bits << 1) | last;
                bits = (bits << 6) | run;
                bits = (bits << 1) | 1;                 // marker
                bits = (bits << 12) | (slevel & 0xfff);
                bits = (bits << 1) | 1;                 // marker
                len  = esc_len + 2 + 1 + 6 + 1 + 12 + 1;

                if (len < len_tab[index]) {
                    bits_tab[index] = bits;
                    len_tab[index]  = len;
                }
            }
        }
    }
}

/**
 * Initialize the MPEG-4 encoder.
 *
 * Rejects dimensions that do not fit the 13-bit width/height fields, runs
 * the generic mpegvideo encoder init, builds the static unified VLC tables
 * on first use and, when CODEC_FLAG_GLOBAL_HEADER is set, writes the visual
 * object and VOL headers into a freshly allocated avctx->extradata.
 *
 * @param avctx codec context; avctx->priv_data is used as the MpegEncContext
 * @return 0 on success, AVERROR(EINVAL) for oversized dimensions,
 *         AVERROR(ENOMEM) if the extradata buffer cannot be allocated, or
 *         the negative error code returned by ff_mpv_encode_init()
 */
static av_cold int encode_init(AVCodecContext *avctx)
{
    MpegEncContext *s = avctx->priv_data;
    int ret;
    static int done = 0;

    if (avctx->width >= (1<<13) || avctx->height >= (1<<13)) {
        av_log(avctx, AV_LOG_ERROR, "dimensions too large for MPEG-4\n");
        return AVERROR(EINVAL);
    }

    if ((ret = ff_mpv_encode_init(avctx)) < 0)
        return ret;

    /* The unified tables are static, so they only need to be built once. */
    if (!done) {
        done = 1;

        init_uni_dc_tab();

        ff_init_rl(&ff_mpeg4_rl_intra, ff_mpeg4_static_rl_table_store[0]);

        init_uni_mpeg4_rl_tab(&ff_mpeg4_rl_intra, uni_mpeg4_intra_rl_bits, uni_mpeg4_intra_rl_len);
        init_uni_mpeg4_rl_tab(&ff_h263_rl_inter, uni_mpeg4_inter_rl_bits, uni_mpeg4_inter_rl_len);
    }

    s->min_qcoeff               = -2048;
    s->max_qcoeff               = 2047;
    s->intra_ac_vlc_length      = uni_mpeg4_intra_rl_len;
    s->intra_ac_vlc_last_length = uni_mpeg4_intra_rl_len + 128 * 64;
    s->inter_ac_vlc_length      = uni_mpeg4_inter_rl_len;
    s->inter_ac_vlc_last_length = uni_mpeg4_inter_rl_len + 128 * 64;
    s->luma_dc_vlc_length       = uni_DCtab_lum_len;
    s->ac_esc_length            = 7 + 2 + 1 + 6 + 1 + 12 + 1;
    s->y_dc_scale_table         = ff_mpeg4_y_dc_scale_table;
    s->c_dc_scale_table         = ff_mpeg4_c_dc_scale_table;

    if (s->flags & CODEC_FLAG_GLOBAL_HEADER) {
        s->avctx->extradata = av_malloc(1024);
        /* The headers below are written straight into this buffer, so a
         * failed allocation must not reach init_put_bits(). */
        if (!s->avctx->extradata)
            return AVERROR(ENOMEM);
        init_put_bits(&s->pb, s->avctx->extradata, 1024);

        if (!(s->workaround_bugs & FF_BUG_MS))
            mpeg4_encode_visual_object_header(s);
        mpeg4_encode_vol_header(s, 0, 0);

//            ff_mpeg4_stuffing(&s->pb); ?
        flush_put_bits(&s->pb);
        /* header size in bytes, rounded up */
        s->avctx->extradata_size = (put_bits_count(&s->pb) + 7) >> 3;
    }
    return 0;
}

/**
 * Split the unused remainder of the s->pb buffer into three regions for
 * data partitioning: s->pb keeps the first one, s->tex_pb gets the middle
 * one and s->pb2 the last one.
 *
 * The size of the first and last region is about a third of the remaining
 * space, chosen so that the address where the middle region starts is
 * rounded down to a multiple of 4. The middle region size is also rounded
 * down to a multiple of 4.
 */
void ff_mpeg4_init_partitions(MpegEncContext *s)
{
    uint8_t *const base    = put_bits_ptr(&s->pb);
    const int avail        = s->pb.buf_end - base;
    const intptr_t addr    = (intptr_t)base;
    const int pb_size      = ((addr + avail / 3) & ~3) - addr;
    const int tex_size     = (avail - 2 * pb_size) & ~3;
    uint8_t *const tex_buf = base + pb_size;
    uint8_t *const pb2_buf = tex_buf + tex_size;

    set_put_bits_buffer_size(&s->pb, pb_size);
    init_put_bits(&s->tex_pb, tex_buf, tex_size);
    init_put_bits(&s->pb2, pb2_buf, pb_size);
}

/**
 * Join the three data partitions back into s->pb.
 *
 * A DC marker (I pictures) or motion marker (all other picture types) is
 * written to s->pb, the bit statistics are updated, and then the contents
 * of s->pb2 and s->tex_pb are appended in that order. s->last_bits is set
 * to the resulting bit count.
 */
void ff_mpeg4_merge_partitions(MpegEncContext *s)
{
    /* All three counts are taken before the marker is written. */
    const int second_len  = put_bits_count(&s->pb2);
    const int texture_len = put_bits_count(&s->tex_pb);
    const int first_len   = put_bits_count(&s->pb);

    if (s->pict_type != AV_PICTURE_TYPE_I) {
        put_bits(&s->pb, 17, MOTION_MARKER);
        s->misc_bits  += 17 + second_len;
        s->mv_bits    += first_len - s->last_bits;
        s->p_tex_bits += texture_len;
    } else {
        put_bits(&s->pb, 19, DC_MARKER);
        s->misc_bits  += 19 + second_len + first_len - s->last_bits;
        s->i_tex_bits += texture_len;
    }

    flush_put_bits(&s->pb2);
    flush_put_bits(&s->tex_pb);

    /* Let s->pb extend up to the end of the pb2 buffer before the copies. */
    set_put_bits_buffer_size(&s->pb, s->pb2.buf_end - s->pb.buf);
    avpriv_copy_bits(&s->pb, s->pb2.buf, second_len);
    avpriv_copy_bits(&s->pb, s->tex_pb.buf, texture_len);
    s->last_bits = put_bits_count(&s->pb);
}

/**
 * Write a video packet header to s->pb: a run of zero bits of the
 * packet prefix length, a 1 bit, the index of the current macroblock, the
 * quantizer and a cleared HEC bit.
 */
void ff_mpeg4_encode_video_packet_header(MpegEncContext *s)
{
    /* field width derived from the highest macroblock index, mb_num - 1 */
    const int mb_num_bits = av_log2(s->mb_num - 1) + 1;
    int mb_index;

    put_bits(&s->pb, ff_mpeg4_get_video_packet_prefix_length(s), 0);
    put_bits(&s->pb, 1, 1);

    mb_index = s->mb_x + s->mb_y * s->mb_width;
    put_bits(&s->pb, mb_num_bits, mb_index);
    put_bits(&s->pb, s->quant_precision, s->qscale);
    put_bits(&s->pb, 1, 0); /* no HEC */
}

1394 1395 1396
#define OFFSET(x) offsetof(MpegEncContext, x)
#define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
static const AVOption options[] = {
1397 1398
    { "data_partitioning", "Use data partitioning.",      OFFSET(data_partitioning), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, VE },
    { "alternate_scan",    "Enable alternate scantable.", OFFSET(alternate_scan),    AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, VE },
1399
    FF_MPV_COMMON_OPTS
1400 1401 1402 1403 1404 1405 1406 1407 1408 1409
    { NULL },
};

/* AVClass for the MPEG-4 encoder; it ties the private option table above
 * to the codec via .priv_class in the AVCodec definition. */
static const AVClass mpeg4enc_class = {
    .class_name = "MPEG4 encoder",
    .item_name  = av_default_item_name,
    .option     = options,
    .version    = LIBAVUTIL_VERSION_INT,
};

1410
AVCodec ff_mpeg4_encoder = {
1411
    .name           = "mpeg4",
1412
    .long_name      = NULL_IF_CONFIG_SMALL("MPEG-4 part 2"),
1413
    .type           = AVMEDIA_TYPE_VIDEO,
1414
    .id             = AV_CODEC_ID_MPEG4,
1415 1416
    .priv_data_size = sizeof(MpegEncContext),
    .init           = encode_init,
1417 1418
    .encode2        = ff_mpv_encode_picture,
    .close          = ff_mpv_encode_end,
1419
    .pix_fmts       = (const enum AVPixelFormat[]) { AV_PIX_FMT_YUV420P, AV_PIX_FMT_NONE },
1420
    .capabilities   = CODEC_CAP_DELAY | CODEC_CAP_SLICE_THREADS,
1421
    .priv_class     = &mpeg4enc_class,
1422
};