/*
 * H.264 encoding using the x264 library
 * Copyright (C) 2005  Mans Rullgard <mans@mansr.com>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

22
#include "libavutil/eval.h"
23
#include "libavutil/internal.h"
24
#include "libavutil/opt.h"
25
#include "libavutil/mem.h"
26
#include "libavutil/pixdesc.h"
27
#include "libavutil/stereo3d.h"
28
#include "libavutil/intreadwrite.h"
29
#include "avcodec.h"
30
#include "internal.h"
31 32 33 34 35

#if defined(_MSC_VER)
#define X264_API_IMPORTS 1
#endif

36
#include <x264.h>
37
#include <float.h>
Michael Niedermayer's avatar
Michael Niedermayer committed
38
#include <math.h>
Robert Swain's avatar
Robert Swain committed
39 40 41
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
42

43 44 45 46
// Edge length of a macroblock, in luma-plane pixels. Per x264.h, the
// quant_offsets array carries one entry per 16x16 macroblock, so this value
// is used to convert ROI pixel coordinates into macroblock indices.
#define MB_SIZE 16

47
typedef struct X264Context {
48
    AVClass        *class;
49 50 51 52 53
    x264_param_t    params;
    x264_t         *enc;
    x264_picture_t  pic;
    uint8_t        *sei;
    int             sei_size;
54 55 56 57
    char *preset;
    char *tune;
    char *profile;
    char *level;
58
    int fastfirstpass;
59
    char *wpredp;
60
    char *x264opts;
61
    float crf;
62
    float crf_max;
63
    int cqp;
64
    int aq_mode;
65
    float aq_strength;
66
    char *psy_rd;
67
    int psy;
68
    int rc_lookahead;
69
    int weightp;
70
    int weightb;
71
    int ssim;
72
    int intra_refresh;
73
    int bluray_compat;
74
    int b_bias;
75
    int b_pyramid;
76
    int mixed_refs;
77
    int dct8x8;
78
    int fast_pskip;
79
    int aud;
80
    int mbtree;
81
    char *deblock;
82
    float cplxblur;
83
    char *partitions;
84
    int direct_pred;
85
    int slice_max_size;
86
    char *stats;
Anton Khirnov's avatar
Anton Khirnov committed
87
    int nal_hrd;
88
    int avcintra_class;
89
    int motion_est;
90
    int forced_idr;
91
    int coder;
92
    int a53_cc;
93
    int b_frame_strategy;
94
    int chroma_offset;
95
    int scenechange_threshold;
96
    int noise_reduction;
97

98
    char *x264_params;
99 100 101

    int nb_reordered_opaque, next_reordered_opaque;
    int64_t *reordered_opaque;
102 103 104 105 106 107

    /**
     * If the encoder does not support ROI then warn the first time we
     * encounter a frame with ROI side data.
     */
    int roi_warned;
108 109
} X264Context;

110
static void X264_log(void *p, int level, const char *fmt, va_list args)
111 112
{
    static const int level_map[] = {
113
        [X264_LOG_ERROR]   = AV_LOG_ERROR,
114
        [X264_LOG_WARNING] = AV_LOG_WARNING,
115
        [X264_LOG_INFO]    = AV_LOG_INFO,
116
        [X264_LOG_DEBUG]   = AV_LOG_DEBUG
117 118
    };

119
    if (level < 0 || level > X264_LOG_DEBUG)
120
        return;
121 122 123 124 125

    av_vlog(p, level_map[level], fmt, args);
}


126
static int encode_nals(AVCodecContext *ctx, AVPacket *pkt,
127
                       const x264_nal_t *nals, int nnal)
128
{
129
    X264Context *x4 = ctx->priv_data;
130 131 132 133 134 135 136 137 138
    uint8_t *p;
    int i, size = x4->sei_size, ret;

    if (!nnal)
        return 0;

    for (i = 0; i < nnal; i++)
        size += nals[i].i_payload;

139
    if ((ret = ff_alloc_packet2(ctx, pkt, size, 0)) < 0)
140 141 142
        return ret;

    p = pkt->data;
143 144

    /* Write the SEI as part of the first frame. */
145
    if (x4->sei_size > 0 && nnal > 0) {
146 147 148 149
        if (x4->sei_size > size) {
            av_log(ctx, AV_LOG_ERROR, "Error: nal buffer is too small\n");
            return -1;
        }
150 151 152
        memcpy(p, x4->sei, x4->sei_size);
        p += x4->sei_size;
        x4->sei_size = 0;
153
        av_freep(&x4->sei);
154
    }
155

156
    for (i = 0; i < nnal; i++){
157 158
        memcpy(p, nals[i].p_payload, nals[i].i_payload);
        p += nals[i].i_payload;
159 160
    }

161
    return 1;
162 163
}

164 165 166
static int avfmt2_num_planes(int avfmt)
{
    switch (avfmt) {
167 168 169 170 171
    case AV_PIX_FMT_YUV420P:
    case AV_PIX_FMT_YUVJ420P:
    case AV_PIX_FMT_YUV420P9:
    case AV_PIX_FMT_YUV420P10:
    case AV_PIX_FMT_YUV444P:
172 173
        return 3;

174
    case AV_PIX_FMT_BGR0:
175 176
    case AV_PIX_FMT_BGR24:
    case AV_PIX_FMT_RGB24:
177 178
    case AV_PIX_FMT_GRAY8:
    case AV_PIX_FMT_GRAY10:
179 180 181 182 183 184 185
        return 1;

    default:
        return 3;
    }
}

186 187 188 189 190 191
/**
 * Push per-frame parameter changes into the running encoder.
 *
 * Each group of parameters is compared with the value currently stored in
 * x4->params; when it differs, the stored value is updated and
 * x264_encoder_reconfig() is called for that group. Field order, sample
 * aspect ratio and rate-control values are only considered when no AVC-Intra
 * class is selected (avcintra_class < 0). Stereo 3D side data of the frame is
 * always translated into x264's frame-packing value.
 *
 * @param ctx   codec context (source of the current user settings)
 * @param frame frame about to be encoded
 */
static void reconfig_encoder(AVCodecContext *ctx, const AVFrame *frame)
{
    X264Context *x4 = ctx->priv_data;
    x264_param_t *prm = &x4->params;
    AVFrameSideData *side_data;
    AVStereo3D *stereo;
    int fpa_type;

    if (x4->avcintra_class < 0) {
        /* Field order of interlaced content. */
        if (prm->b_interlaced && prm->b_tff != frame->top_field_first) {
            prm->b_tff = frame->top_field_first;
            x264_encoder_reconfig(x4->enc, prm);
        }

        /* Sample aspect ratio, compared by cross-multiplication. */
        if (prm->vui.i_sar_height * ctx->sample_aspect_ratio.num !=
            ctx->sample_aspect_ratio.den * prm->vui.i_sar_width) {
            prm->vui.i_sar_height = ctx->sample_aspect_ratio.den;
            prm->vui.i_sar_width  = ctx->sample_aspect_ratio.num;
            x264_encoder_reconfig(x4->enc, prm);
        }

        /* VBV settings; x264 fields hold the context values divided by 1000. */
        if (prm->rc.i_vbv_buffer_size != ctx->rc_buffer_size / 1000 ||
            prm->rc.i_vbv_max_bitrate != ctx->rc_max_rate    / 1000) {
            prm->rc.i_vbv_buffer_size = ctx->rc_buffer_size / 1000;
            prm->rc.i_vbv_max_bitrate = ctx->rc_max_rate    / 1000;
            x264_encoder_reconfig(x4->enc, prm);
        }

        /* Target bitrate, only meaningful in ABR mode. */
        if (prm->rc.i_rc_method == X264_RC_ABR &&
            prm->rc.i_bitrate != ctx->bit_rate / 1000) {
            prm->rc.i_bitrate = ctx->bit_rate / 1000;
            x264_encoder_reconfig(x4->enc, prm);
        }

        /* Constant rate factor. */
        if (x4->crf >= 0 &&
            prm->rc.i_rc_method == X264_RC_CRF &&
            prm->rc.f_rf_constant != x4->crf) {
            prm->rc.f_rf_constant = x4->crf;
            x264_encoder_reconfig(x4->enc, prm);
        }

        /* Constant quantizer. */
        if (x4->cqp >= 0 &&
            prm->rc.i_rc_method == X264_RC_CQP &&
            prm->rc.i_qp_constant != x4->cqp) {
            prm->rc.i_qp_constant = x4->cqp;
            x264_encoder_reconfig(x4->enc, prm);
        }

        /* CRF ceiling. */
        if (x4->crf_max >= 0 &&
            prm->rc.f_rf_constant_max != x4->crf_max) {
            prm->rc.f_rf_constant_max = x4->crf_max;
            x264_encoder_reconfig(x4->enc, prm);
        }
    }

    side_data = av_frame_get_side_data(frame, AV_FRAME_DATA_STEREO3D);
    if (!side_data)
        return;

    stereo = (AVStereo3D *)side_data->data;

    /* Map the AVStereo3D layout to x264's frame-packing value (-1: none). */
    switch (stereo->type) {
    case AV_STEREO3D_CHECKERBOARD:
        fpa_type = 0;
        break;
    case AV_STEREO3D_COLUMNS:
        fpa_type = 1;
        break;
    case AV_STEREO3D_LINES:
        fpa_type = 2;
        break;
    case AV_STEREO3D_SIDEBYSIDE:
        fpa_type = 3;
        break;
    case AV_STEREO3D_TOPBOTTOM:
        fpa_type = 4;
        break;
    case AV_STEREO3D_FRAMESEQUENCE:
        fpa_type = 5;
        break;
#if X264_BUILD >= 145
    case AV_STEREO3D_2D:
        fpa_type = 6;
        break;
#endif
    default:
        fpa_type = -1;
        break;
    }

    /* Inverted mode is not supported by x264 */
    if (stereo->flags & AV_STEREO3D_FLAG_INVERT) {
        av_log(ctx, AV_LOG_WARNING,
               "Ignoring unsupported inverted stereo value %d\n", fpa_type);
        fpa_type = -1;
    }

    if (prm->i_frame_packing != fpa_type) {
        prm->i_frame_packing = fpa_type;
        x264_encoder_reconfig(x4->enc, prm);
    }
}

286 287
static int X264_frame(AVCodecContext *ctx, AVPacket *pkt, const AVFrame *frame,
                      int *got_packet)
288 289 290
{
    X264Context *x4 = ctx->priv_data;
    x264_nal_t *nal;
291
    int nnal, i, ret;
292
    x264_picture_t pic_out = {0};
293
    int pict_type;
294
    int bit_depth;
295
    int64_t *out_opaque;
296
    AVFrameSideData *sd;
297

298
    x264_picture_init( &x4->pic );
299
    x4->pic.img.i_csp   = x4->params.i_csp;
300
#if X264_BUILD >= 153
301
    bit_depth = x4->params.i_bitdepth;
302
#else
303
    bit_depth = x264_bit_depth;
304
#endif
305
    if (bit_depth > 8)
306
        x4->pic.img.i_csp |= X264_CSP_HIGH_DEPTH;
307
    x4->pic.img.i_plane = avfmt2_num_planes(ctx->pix_fmt);
308

309
    if (frame) {
310
        for (i = 0; i < x4->pic.img.i_plane; i++) {
311
            x4->pic.img.plane[i]    = frame->data[i];
Måns Rullgård's avatar
Måns Rullgård committed
312 313
            x4->pic.img.i_stride[i] = frame->linesize[i];
        }
314

315
        x4->pic.i_pts  = frame->pts;
316

317 318 319 320 321
        x4->reordered_opaque[x4->next_reordered_opaque] = frame->reordered_opaque;
        x4->pic.opaque = &x4->reordered_opaque[x4->next_reordered_opaque];
        x4->next_reordered_opaque++;
        x4->next_reordered_opaque %= x4->nb_reordered_opaque;

322 323
        switch (frame->pict_type) {
        case AV_PICTURE_TYPE_I:
324 325
            x4->pic.i_type = x4->forced_idr > 0 ? X264_TYPE_IDR
                                                : X264_TYPE_KEYFRAME;
326 327 328 329 330 331 332 333 334 335 336
            break;
        case AV_PICTURE_TYPE_P:
            x4->pic.i_type = X264_TYPE_P;
            break;
        case AV_PICTURE_TYPE_B:
            x4->pic.i_type = X264_TYPE_B;
            break;
        default:
            x4->pic.i_type = X264_TYPE_AUTO;
            break;
        }
337
        reconfig_encoder(ctx, frame);
338 339

        if (x4->a53_cc) {
340 341 342 343 344 345 346
            void *sei_data;
            size_t sei_size;

            ret = ff_alloc_a53_sei(frame, 0, &sei_data, &sei_size);
            if (ret < 0) {
                av_log(ctx, AV_LOG_ERROR, "Not enough memory for closed captions, skipping\n");
            } else if (sei_data) {
347 348 349
                x4->pic.extra_sei.payloads = av_mallocz(sizeof(x4->pic.extra_sei.payloads[0]));
                if (x4->pic.extra_sei.payloads == NULL) {
                    av_log(ctx, AV_LOG_ERROR, "Not enough memory for closed captions, skipping\n");
350 351 352 353 354 355 356 357
                    av_free(sei_data);
                } else {
                    x4->pic.extra_sei.sei_free = av_free;

                    x4->pic.extra_sei.payloads[0].payload_size = sei_size;
                    x4->pic.extra_sei.payloads[0].payload = sei_data;
                    x4->pic.extra_sei.num_payloads = 1;
                    x4->pic.extra_sei.payloads[0].payload_type = 4;
358 359 360
                }
            }
        }
361 362 363 364

        sd = av_frame_get_side_data(frame, AV_FRAME_DATA_REGIONS_OF_INTEREST);
        if (sd) {
            if (x4->params.rc.i_aq_mode == X264_AQ_NONE) {
365 366 367 368
                if (!x4->roi_warned) {
                    x4->roi_warned = 1;
                    av_log(ctx, AV_LOG_WARNING, "Adaptive quantization must be enabled to use ROI encoding, skipping ROI.\n");
                }
369 370 371 372
            } else {
                if (frame->interlaced_frame == 0) {
                    int mbx = (frame->width + MB_SIZE - 1) / MB_SIZE;
                    int mby = (frame->height + MB_SIZE - 1) / MB_SIZE;
373
                    int qp_range = 51 + 6 * (bit_depth - 8);
374
                    int nb_rois;
375 376 377 378 379 380 381 382 383 384 385 386
                    const AVRegionOfInterest *roi;
                    uint32_t roi_size;
                    float *qoffsets;

                    roi = (const AVRegionOfInterest*)sd->data;
                    roi_size = roi->self_size;
                    if (!roi_size || sd->size % roi_size != 0) {
                        av_log(ctx, AV_LOG_ERROR, "Invalid AVRegionOfInterest.self_size.\n");
                        return AVERROR(EINVAL);
                    }
                    nb_rois = sd->size / roi_size;

387 388 389 390
                    qoffsets = av_mallocz_array(mbx * mby, sizeof(*qoffsets));
                    if (!qoffsets)
                        return AVERROR(ENOMEM);

391 392 393 394
                    // This list must be iterated in reverse because the first
                    // region in the list applies when regions overlap.
                    for (int i = nb_rois - 1; i >= 0; i--) {
                        int startx, endx, starty, endy;
395 396
                        float qoffset;

397 398 399 400 401 402 403
                        roi = (const AVRegionOfInterest*)(sd->data + roi_size * i);

                        starty = FFMIN(mby, roi->top / MB_SIZE);
                        endy   = FFMIN(mby, (roi->bottom + MB_SIZE - 1)/ MB_SIZE);
                        startx = FFMIN(mbx, roi->left / MB_SIZE);
                        endx   = FFMIN(mbx, (roi->right + MB_SIZE - 1)/ MB_SIZE);

404 405
                        if (roi->qoffset.den == 0) {
                            av_free(qoffsets);
406
                            av_log(ctx, AV_LOG_ERROR, "AVRegionOfInterest.qoffset.den must not be zero.\n");
407 408 409
                            return AVERROR(EINVAL);
                        }
                        qoffset = roi->qoffset.num * 1.0f / roi->qoffset.den;
410
                        qoffset = av_clipf(qoffset * qp_range, -qp_range, +qp_range);
411 412 413 414 415 416 417 418 419 420 421

                        for (int y = starty; y < endy; y++) {
                            for (int x = startx; x < endx; x++) {
                                qoffsets[x + y*mbx] = qoffset;
                            }
                        }
                    }

                    x4->pic.prop.quant_offsets = qoffsets;
                    x4->pic.prop.quant_offsets_free = av_free;
                } else {
422 423 424 425
                    if (!x4->roi_warned) {
                        x4->roi_warned = 1;
                        av_log(ctx, AV_LOG_WARNING, "interlaced_frame not supported for ROI encoding yet, skipping ROI.\n");
                    }
426 427 428
                }
            }
        }
429
    }
430

431
    do {
432
        if (x264_encoder_encode(x4->enc, &nal, &nnal, frame? &x4->pic: NULL, &pic_out) < 0)
433
            return AVERROR_EXTERNAL;
434

435 436
        ret = encode_nals(ctx, pkt, nal, nnal);
        if (ret < 0)
437
            return ret;
438
    } while (!ret && !frame && x264_encoder_delayed_frames(x4->enc));
439

440 441
    pkt->pts = pic_out.i_pts;
    pkt->dts = pic_out.i_dts;
442

443 444 445 446 447 448 449 450
    out_opaque = pic_out.opaque;
    if (out_opaque >= x4->reordered_opaque &&
        out_opaque < &x4->reordered_opaque[x4->nb_reordered_opaque]) {
        ctx->reordered_opaque = *out_opaque;
    } else {
        // Unexpected opaque pointer on picture output
        ctx->reordered_opaque = 0;
    }
451

452
    switch (pic_out.i_type) {
453 454
    case X264_TYPE_IDR:
    case X264_TYPE_I:
455
        pict_type = AV_PICTURE_TYPE_I;
456 457
        break;
    case X264_TYPE_P:
458
        pict_type = AV_PICTURE_TYPE_P;
459 460 461
        break;
    case X264_TYPE_B:
    case X264_TYPE_BREF:
462
        pict_type = AV_PICTURE_TYPE_B;
463
        break;
464 465
    default:
        pict_type = AV_PICTURE_TYPE_NONE;
466
    }
467 468 469
#if FF_API_CODED_FRAME
FF_DISABLE_DEPRECATION_WARNINGS
    ctx->coded_frame->pict_type = pict_type;
470 471
FF_ENABLE_DEPRECATION_WARNINGS
#endif
472

473
    pkt->flags |= AV_PKT_FLAG_KEY*pic_out.b_keyframe;
474
    if (ret) {
475
        ff_side_data_set_encoder_stats(pkt, (pic_out.i_qpplus1 - 1) * FF_QP2LAMBDA, NULL, 0, pict_type);
476

477 478
#if FF_API_CODED_FRAME
FF_DISABLE_DEPRECATION_WARNINGS
479
        ctx->coded_frame->quality = (pic_out.i_qpplus1 - 1) * FF_QP2LAMBDA;
480 481
FF_ENABLE_DEPRECATION_WARNINGS
#endif
482
    }
483

484 485
    *got_packet = ret;
    return 0;
486 487
}

488
/**
 * Tear down the encoder: frees the extradata, any pending SEI bytes and the
 * reordered_opaque ring, then closes the x264 handle if one is open.
 *
 * @param avctx codec context; priv_data must be an X264Context
 * @return always 0
 */
static av_cold int X264_close(AVCodecContext *avctx)
{
    X264Context *x4 = avctx->priv_data;

    av_freep(&avctx->extradata);
    av_freep(&x4->sei);
    av_freep(&x4->reordered_opaque);

    /* Nothing more to do when no encoder handle is open. */
    if (!x4->enc)
        return 0;

    x264_encoder_close(x4->enc);
    x4->enc = NULL;

    return 0;
}

504 505 506
/*
 * Pass one name/value pair to x264_param_parse(). On failure an error is
 * logged (distinguishing an unknown option name from a bad value) and the
 * ENCLOSING function returns AVERROR(EINVAL), matching PARSE_X264_OPT.
 * Requires `x4` (X264Context *) and `avctx` (logging context) in scope.
 * The result variable carries a macro-specific name so it cannot shadow a
 * caller variable that appears in `opt` or `param`.
 */
#define OPT_STR(opt, param)                                                   \
    do {                                                                      \
        int opt_str_err_;                                                     \
        if ((opt_str_err_ = x264_param_parse(&x4->params, opt, param)) < 0) { \
            if (opt_str_err_ == X264_PARAM_BAD_NAME)                          \
                av_log(avctx, AV_LOG_ERROR,                                   \
                        "bad option '%s': '%s'\n", opt, param);               \
            else                                                              \
                av_log(avctx, AV_LOG_ERROR,                                   \
                        "bad value for '%s': '%s'\n", opt, param);            \
            return AVERROR(EINVAL);                                           \
        }                                                                     \
    } while (0)
517

518
static int convert_pix_fmt(enum AVPixelFormat pix_fmt)
519 520
{
    switch (pix_fmt) {
521 522 523 524 525
    case AV_PIX_FMT_YUV420P:
    case AV_PIX_FMT_YUVJ420P:
    case AV_PIX_FMT_YUV420P9:
    case AV_PIX_FMT_YUV420P10: return X264_CSP_I420;
    case AV_PIX_FMT_YUV422P:
526
    case AV_PIX_FMT_YUVJ422P:
527 528
    case AV_PIX_FMT_YUV422P10: return X264_CSP_I422;
    case AV_PIX_FMT_YUV444P:
529
    case AV_PIX_FMT_YUVJ444P:
530 531
    case AV_PIX_FMT_YUV444P9:
    case AV_PIX_FMT_YUV444P10: return X264_CSP_I444;
532
#if CONFIG_LIBX264RGB_ENCODER
533 534
    case AV_PIX_FMT_BGR0:
        return X264_CSP_BGRA;
535
    case AV_PIX_FMT_BGR24:
536 537
        return X264_CSP_BGR;

538
    case AV_PIX_FMT_RGB24:
539 540
        return X264_CSP_RGB;
#endif
541 542 543
    case AV_PIX_FMT_NV12:      return X264_CSP_NV12;
    case AV_PIX_FMT_NV16:
    case AV_PIX_FMT_NV20:      return X264_CSP_NV16;
544 545
#ifdef X264_CSP_NV21
    case AV_PIX_FMT_NV21:      return X264_CSP_NV21;
546 547 548 549
#endif
#ifdef X264_CSP_I400
    case AV_PIX_FMT_GRAY8:
    case AV_PIX_FMT_GRAY10:    return X264_CSP_I400;
550
#endif
551 552 553 554
    };
    return 0;
}

555 556 557 558 559 560
/*
 * If the string option x4->var is set, hand it to x264_param_parse() under
 * the x264 option name `name`. On a parse error the failure is logged and
 * the ENCLOSING function returns AVERROR(EINVAL).
 * Requires `x4` (X264Context *) and `avctx` (logging context) in scope.
 * Wrapped in do { } while (0) so the macro behaves as a single statement
 * (safe inside unbraced if/else); invoke it with a trailing semicolon.
 */
#define PARSE_X264_OPT(name, var)\
    do {\
        if (x4->var && x264_param_parse(&x4->params, name, x4->var) < 0) {\
            av_log(avctx, AV_LOG_ERROR, "Error parsing option '%s' with value '%s'.\n", name, x4->var);\
            return AVERROR(EINVAL);\
        }\
    } while (0)

561
static av_cold int X264_init(AVCodecContext *avctx)
562 563
{
    X264Context *x4 = avctx->priv_data;
564
    AVCPBProperties *cpb_props;
565
    int sw,sh;
566

567 568 569
    if (avctx->global_quality > 0)
        av_log(avctx, AV_LOG_WARNING, "-qscale is ignored, -crf is recommended.\n");

570 571 572 573 574 575
#if CONFIG_LIBX262_ENCODER
    if (avctx->codec_id == AV_CODEC_ID_MPEG2VIDEO) {
        x4->params.b_mpeg2 = 1;
        x264_param_default_mpeg2(&x4->params);
    } else
#endif
576
    x264_param_default(&x4->params);
577

578
    x4->params.b_deblocking_filter         = avctx->flags & AV_CODEC_FLAG_LOOP_FILTER;
579

580 581
    if (x4->preset || x4->tune)
        if (x264_param_default_preset(&x4->params, x4->preset, x4->tune) < 0) {
582
            int i;
583
            av_log(avctx, AV_LOG_ERROR, "Error setting preset/tune %s/%s.\n", x4->preset, x4->tune);
584 585 586 587 588 589 590 591
            av_log(avctx, AV_LOG_INFO, "Possible presets:");
            for (i = 0; x264_preset_names[i]; i++)
                av_log(avctx, AV_LOG_INFO, " %s", x264_preset_names[i]);
            av_log(avctx, AV_LOG_INFO, "\n");
            av_log(avctx, AV_LOG_INFO, "Possible tunes:");
            for (i = 0; x264_tune_names[i]; i++)
                av_log(avctx, AV_LOG_INFO, " %s", x264_tune_names[i]);
            av_log(avctx, AV_LOG_INFO, "\n");
592 593 594
            return AVERROR(EINVAL);
        }

595 596
    if (avctx->level > 0)
        x4->params.i_level_idc = avctx->level;
597 598 599 600

    x4->params.pf_log               = X264_log;
    x4->params.p_log_private        = avctx;
    x4->params.i_log_level          = X264_LOG_DEBUG;
601
    x4->params.i_csp                = convert_pix_fmt(avctx->pix_fmt);
602 603 604
#if X264_BUILD >= 153
    x4->params.i_bitdepth           = av_pix_fmt_desc_get(avctx->pix_fmt)->comp[0].depth;
#endif
605

606
    PARSE_X264_OPT("weightp", wpredp);
607

608
    if (avctx->bit_rate) {
609 610 611 612
        if (avctx->bit_rate / 1000 > INT_MAX || avctx->rc_max_rate / 1000 > INT_MAX) {
            av_log(avctx, AV_LOG_ERROR, "bit_rate and rc_max_rate > %d000 not supported by libx264\n", INT_MAX);
            return AVERROR(EINVAL);
        }
613 614 615
        x4->params.rc.i_bitrate   = avctx->bit_rate / 1000;
        x4->params.rc.i_rc_method = X264_RC_ABR;
    }
616 617
    x4->params.rc.i_vbv_buffer_size = avctx->rc_buffer_size / 1000;
    x4->params.rc.i_vbv_max_bitrate = avctx->rc_max_rate    / 1000;
618 619
    x4->params.rc.b_stat_write      = avctx->flags & AV_CODEC_FLAG_PASS1;
    if (avctx->flags & AV_CODEC_FLAG_PASS2) {
620 621
        x4->params.rc.b_stat_read = 1;
    } else {
622 623 624
        if (x4->crf >= 0) {
            x4->params.rc.i_rc_method   = X264_RC_CRF;
            x4->params.rc.f_rf_constant = x4->crf;
625 626 627
        } else if (x4->cqp >= 0) {
            x4->params.rc.i_rc_method   = X264_RC_CQP;
            x4->params.rc.i_qp_constant = x4->cqp;
628
        }
629 630 631

        if (x4->crf_max >= 0)
            x4->params.rc.f_rf_constant_max = x4->crf_max;
632 633
    }

634
    if (avctx->rc_buffer_size && avctx->rc_initial_buffer_occupancy > 0 &&
635
        (avctx->rc_initial_buffer_occupancy <= avctx->rc_buffer_size)) {
Robert Swain's avatar
Robert Swain committed
636
        x4->params.rc.f_vbv_buffer_init =
637
            (float)avctx->rc_initial_buffer_occupancy / avctx->rc_buffer_size;
638
    }
Robert Swain's avatar
Robert Swain committed
639

640
    PARSE_X264_OPT("level", level);
641

642 643
    if (avctx->i_quant_factor > 0)
        x4->params.rc.f_ip_factor         = 1 / fabs(avctx->i_quant_factor);
644 645
    if (avctx->b_quant_factor > 0)
        x4->params.rc.f_pb_factor         = avctx->b_quant_factor;
646 647 648

#if FF_API_PRIVATE_OPT
FF_DISABLE_DEPRECATION_WARNINGS
649
    if (avctx->chromaoffset >= 0)
650 651 652
        x4->chroma_offset = avctx->chromaoffset;
FF_ENABLE_DEPRECATION_WARNINGS
#endif
653
    if (x4->chroma_offset >= 0)
654
        x4->params.analyse.i_chroma_qp_offset = x4->chroma_offset;
Robert Swain's avatar
Robert Swain committed
655

656 657 658 659
    if (avctx->gop_size >= 0)
        x4->params.i_keyint_max         = avctx->gop_size;
    if (avctx->max_b_frames >= 0)
        x4->params.i_bframe             = avctx->max_b_frames;
660 661 662

#if FF_API_PRIVATE_OPT
FF_DISABLE_DEPRECATION_WARNINGS
663
    if (avctx->scenechange_threshold >= 0)
664 665 666
        x4->scenechange_threshold = avctx->scenechange_threshold;
FF_ENABLE_DEPRECATION_WARNINGS
#endif
667 668
    if (x4->scenechange_threshold >= 0)
        x4->params.i_scenecut_threshold = x4->scenechange_threshold;
669

670 671 672 673 674 675 676 677 678 679 680 681
    if (avctx->qmin >= 0)
        x4->params.rc.i_qp_min          = avctx->qmin;
    if (avctx->qmax >= 0)
        x4->params.rc.i_qp_max          = avctx->qmax;
    if (avctx->max_qdiff >= 0)
        x4->params.rc.i_qp_step         = avctx->max_qdiff;
    if (avctx->qblur >= 0)
        x4->params.rc.f_qblur           = avctx->qblur;     /* temporally blur quants */
    if (avctx->qcompress >= 0)
        x4->params.rc.f_qcompress       = avctx->qcompress; /* 0.0 => cbr, 1.0 => constant qp */
    if (avctx->refs >= 0)
        x4->params.i_frame_reference    = avctx->refs;
682 683
    else if (x4->level) {
        int i;
684
        int mbn = AV_CEIL_RSHIFT(avctx->width, 4) * AV_CEIL_RSHIFT(avctx->height, 4);
685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703
        int level_id = -1;
        char *tail;
        int scale = X264_BUILD < 129 ? 384 : 1;

        if (!strcmp(x4->level, "1b")) {
            level_id = 9;
        } else if (strlen(x4->level) <= 3){
            level_id = av_strtod(x4->level, &tail) * 10 + 0.5;
            if (*tail)
                level_id = -1;
        }
        if (level_id <= 0)
            av_log(avctx, AV_LOG_WARNING, "Failed to parse level\n");

        for (i = 0; i<x264_levels[i].level_idc; i++)
            if (x264_levels[i].level_idc == level_id)
                x4->params.i_frame_reference = av_clip(x264_levels[i].dpb / mbn / scale, 1, x4->params.i_frame_reference);
    }

704 705 706 707
    if (avctx->trellis >= 0)
        x4->params.analyse.i_trellis    = avctx->trellis;
    if (avctx->me_range >= 0)
        x4->params.analyse.i_me_range   = avctx->me_range;
708 709
#if FF_API_PRIVATE_OPT
    FF_DISABLE_DEPRECATION_WARNINGS
710
    if (avctx->noise_reduction >= 0)
711 712 713
        x4->noise_reduction = avctx->noise_reduction;
    FF_ENABLE_DEPRECATION_WARNINGS
#endif
714 715
    if (x4->noise_reduction >= 0)
        x4->params.analyse.i_noise_reduction = x4->noise_reduction;
716 717
    if (avctx->me_subpel_quality >= 0)
        x4->params.analyse.i_subpel_refine   = avctx->me_subpel_quality;
718 719
#if FF_API_PRIVATE_OPT
FF_DISABLE_DEPRECATION_WARNINGS
720
    if (avctx->b_frame_strategy >= 0)
721 722 723
        x4->b_frame_strategy = avctx->b_frame_strategy;
FF_ENABLE_DEPRECATION_WARNINGS
#endif
724 725
    if (avctx->keyint_min >= 0)
        x4->params.i_keyint_min = avctx->keyint_min;
726 727
#if FF_API_CODER_TYPE
FF_DISABLE_DEPRECATION_WARNINGS
728
    if (avctx->coder_type >= 0)
729 730 731
        x4->coder = avctx->coder_type == FF_CODER_TYPE_AC;
FF_ENABLE_DEPRECATION_WARNINGS
#endif
732 733
    if (avctx->me_cmp >= 0)
        x4->params.analyse.b_chroma_me = avctx->me_cmp & FF_CMP_CHROMA;
734

735 736
    if (x4->aq_mode >= 0)
        x4->params.rc.i_aq_mode = x4->aq_mode;
737 738
    if (x4->aq_strength >= 0)
        x4->params.rc.f_aq_strength = x4->aq_strength;
739 740
    PARSE_X264_OPT("psy-rd", psy_rd);
    PARSE_X264_OPT("deblock", deblock);
741
    PARSE_X264_OPT("partitions", partitions);
742
    PARSE_X264_OPT("stats", stats);
743 744
    if (x4->psy >= 0)
        x4->params.analyse.b_psy  = x4->psy;
745 746
    if (x4->rc_lookahead >= 0)
        x4->params.rc.i_lookahead = x4->rc_lookahead;
747 748
    if (x4->weightp >= 0)
        x4->params.analyse.i_weighted_pred = x4->weightp;
749 750
    if (x4->weightb >= 0)
        x4->params.analyse.b_weighted_bipred = x4->weightb;
751 752
    if (x4->cplxblur >= 0)
        x4->params.rc.f_complexity_blur = x4->cplxblur;
753

754 755
    if (x4->ssim >= 0)
        x4->params.analyse.b_ssim = x4->ssim;
756 757
    if (x4->intra_refresh >= 0)
        x4->params.b_intra_refresh = x4->intra_refresh;
758 759 760 761
    if (x4->bluray_compat >= 0) {
        x4->params.b_bluray_compat = x4->bluray_compat;
        x4->params.b_vfr_input = 0;
    }
762
    if (x4->avcintra_class >= 0)
763
#if X264_BUILD >= 142
764
        x4->params.i_avcintra_class = x4->avcintra_class;
765 766 767 768
#else
        av_log(avctx, AV_LOG_ERROR,
               "x264 too old for AVC Intra, at least version 142 needed\n");
#endif
769 770
    if (x4->b_bias != INT_MIN)
        x4->params.i_bframe_bias              = x4->b_bias;
771 772
    if (x4->b_pyramid >= 0)
        x4->params.i_bframe_pyramid = x4->b_pyramid;
773 774
    if (x4->mixed_refs >= 0)
        x4->params.analyse.b_mixed_references = x4->mixed_refs;
775 776
    if (x4->dct8x8 >= 0)
        x4->params.analyse.b_transform_8x8    = x4->dct8x8;
777 778
    if (x4->fast_pskip >= 0)
        x4->params.analyse.b_fast_pskip       = x4->fast_pskip;
779 780
    if (x4->aud >= 0)
        x4->params.b_aud                      = x4->aud;
781 782
    if (x4->mbtree >= 0)
        x4->params.rc.b_mb_tree               = x4->mbtree;
783 784
    if (x4->direct_pred >= 0)
        x4->params.analyse.i_direct_mv_pred   = x4->direct_pred;
785

786 787 788
    if (x4->slice_max_size >= 0)
        x4->params.i_slice_max_size =  x4->slice_max_size;

789 790 791
    if (x4->fastfirstpass)
        x264_param_apply_fastfirstpass(&x4->params);

792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815
    /* Allow specifying the x264 profile through AVCodecContext. */
    if (!x4->profile)
        switch (avctx->profile) {
        case FF_PROFILE_H264_BASELINE:
            x4->profile = av_strdup("baseline");
            break;
        case FF_PROFILE_H264_HIGH:
            x4->profile = av_strdup("high");
            break;
        case FF_PROFILE_H264_HIGH_10:
            x4->profile = av_strdup("high10");
            break;
        case FF_PROFILE_H264_HIGH_422:
            x4->profile = av_strdup("high422");
            break;
        case FF_PROFILE_H264_HIGH_444:
            x4->profile = av_strdup("high444");
            break;
        case FF_PROFILE_H264_MAIN:
            x4->profile = av_strdup("main");
            break;
        default:
            break;
        }
816

817 818 819
    if (x4->nal_hrd >= 0)
        x4->params.i_nal_hrd = x4->nal_hrd;

820
    if (x4->motion_est >= 0)
821 822
        x4->params.analyse.i_me_method = x4->motion_est;

823 824 825
    if (x4->coder >= 0)
        x4->params.b_cabac = x4->coder;

826 827 828
    if (x4->b_frame_strategy >= 0)
        x4->params.i_bframe_adaptive = x4->b_frame_strategy;

829
    if (x4->profile)
830
        if (x264_param_apply_profile(&x4->params, x4->profile) < 0) {
831
            int i;
832
            av_log(avctx, AV_LOG_ERROR, "Error setting profile %s.\n", x4->profile);
833 834
            av_log(avctx, AV_LOG_INFO, "Possible profiles:");
            for (i = 0; x264_profile_names[i]; i++)
Mahendra M's avatar
Mahendra M committed
835
                av_log(avctx, AV_LOG_INFO, " %s", x264_profile_names[i]);
836
            av_log(avctx, AV_LOG_INFO, "\n");
837 838
            return AVERROR(EINVAL);
        }
839

840 841
    x4->params.i_width          = avctx->width;
    x4->params.i_height         = avctx->height;
842 843 844
    av_reduce(&sw, &sh, avctx->sample_aspect_ratio.num, avctx->sample_aspect_ratio.den, 4096);
    x4->params.vui.i_sar_width  = sw;
    x4->params.vui.i_sar_height = sh;
845 846
    x4->params.i_timebase_den = avctx->time_base.den;
    x4->params.i_timebase_num = avctx->time_base.num;
847 848 849 850 851 852 853
    if (avctx->framerate.num > 0 && avctx->framerate.den > 0) {
        x4->params.i_fps_num = avctx->framerate.num;
        x4->params.i_fps_den = avctx->framerate.den;
    } else {
        x4->params.i_fps_num = avctx->time_base.den;
        x4->params.i_fps_den = avctx->time_base.num * avctx->ticks_per_frame;
    }
Robert Swain's avatar
Robert Swain committed
854

855
    x4->params.analyse.b_psnr = avctx->flags & AV_CODEC_FLAG_PSNR;
Robert Swain's avatar
Robert Swain committed
856

857
    x4->params.i_threads      = avctx->thread_count;
858 859
    if (avctx->thread_type)
        x4->params.b_sliced_threads = avctx->thread_type == FF_THREAD_SLICE;
860

861
    x4->params.b_interlaced   = avctx->flags & AV_CODEC_FLAG_INTERLACED_DCT;
862

863
    x4->params.b_open_gop     = !(avctx->flags & AV_CODEC_FLAG_CLOSED_GOP);
864

865 866
    x4->params.i_slice_count  = avctx->slices;

867 868
    x4->params.vui.b_fullrange = avctx->pix_fmt == AV_PIX_FMT_YUVJ420P ||
                                 avctx->pix_fmt == AV_PIX_FMT_YUVJ422P ||
869 870 871 872 873 874 875 876 877
                                 avctx->pix_fmt == AV_PIX_FMT_YUVJ444P ||
                                 avctx->color_range == AVCOL_RANGE_JPEG;

    if (avctx->colorspace != AVCOL_SPC_UNSPECIFIED)
        x4->params.vui.i_colmatrix = avctx->colorspace;
    if (avctx->color_primaries != AVCOL_PRI_UNSPECIFIED)
        x4->params.vui.i_colorprim = avctx->color_primaries;
    if (avctx->color_trc != AVCOL_TRC_UNSPECIFIED)
        x4->params.vui.i_transfer  = avctx->color_trc;
878

879
    if (avctx->flags & AV_CODEC_FLAG_GLOBAL_HEADER)
880 881
        x4->params.b_repeat_headers = 0;

882 883 884
    if(x4->x264opts){
        const char *p= x4->x264opts;
        while(p){
885 886
            char param[4096]={0}, val[4096]={0};
            if(sscanf(p, "%4095[^:=]=%4095[^:]", param, val) == 1){
887 888 889 890 891 892 893 894
                OPT_STR(param, "1");
            }else
                OPT_STR(param, val);
            p= strchr(p, ':');
            p+=!!p;
        }
    }

895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910
    if (x4->x264_params) {
        AVDictionary *dict    = NULL;
        AVDictionaryEntry *en = NULL;

        if (!av_dict_parse_string(&dict, x4->x264_params, "=", ":", 0)) {
            while ((en = av_dict_get(dict, "", en, AV_DICT_IGNORE_SUFFIX))) {
                if (x264_param_parse(&x4->params, en->key, en->value) < 0)
                    av_log(avctx, AV_LOG_WARNING,
                           "Error parsing option '%s = %s'.\n",
                            en->key, en->value);
            }

            av_dict_free(&dict);
        }
    }

911
    // update AVCodecContext with x264 parameters
912 913
    avctx->has_b_frames = x4->params.i_bframe ?
        x4->params.i_bframe_pyramid ? 2 : 1 : 0;
914 915 916
    if (avctx->max_b_frames < 0)
        avctx->max_b_frames = 0;

917
    avctx->bit_rate = x4->params.rc.i_bitrate*1000LL;
918

919
    x4->enc = x264_encoder_open(&x4->params);
920
    if (!x4->enc)
921
        return AVERROR_EXTERNAL;
922

923
    if (avctx->flags & AV_CODEC_FLAG_GLOBAL_HEADER) {
924
        x264_nal_t *nal;
925
        uint8_t *p;
926
        int nnal, s, i;
927

928
        s = x264_encoder_headers(x4->enc, &nal, &nnal);
929
        avctx->extradata = p = av_mallocz(s + AV_INPUT_BUFFER_PADDING_SIZE);
930
        if (!p)
931
            return AVERROR(ENOMEM);
932

933 934 935
        for (i = 0; i < nnal; i++) {
            /* Don't put the SEI in extradata. */
            if (nal[i].i_type == NAL_SEI) {
936
                av_log(avctx, AV_LOG_INFO, "%s\n", nal[i].p_payload+25);
937 938
                x4->sei_size = nal[i].i_payload;
                x4->sei      = av_malloc(x4->sei_size);
939
                if (!x4->sei)
940
                    return AVERROR(ENOMEM);
941 942 943 944 945 946 947
                memcpy(x4->sei, nal[i].p_payload, nal[i].i_payload);
                continue;
            }
            memcpy(p, nal[i].p_payload, nal[i].i_payload);
            p += nal[i].i_payload;
        }
        avctx->extradata_size = p - avctx->extradata;
948 949
    }

950 951 952 953
    cpb_props = ff_add_cpb_side_data(avctx);
    if (!cpb_props)
        return AVERROR(ENOMEM);
    cpb_props->buffer_size = x4->params.rc.i_vbv_buffer_size * 1000;
954 955
    cpb_props->max_bitrate = x4->params.rc.i_vbv_max_bitrate * 1000LL;
    cpb_props->avg_bitrate = x4->params.rc.i_bitrate         * 1000LL;
956

957 958 959 960 961 962 963 964
    // Overestimate the reordered opaque buffer size, in case a runtime
    // reconfigure would increase the delay (which it shouldn't).
    x4->nb_reordered_opaque = x264_encoder_maximum_delayed_frames(x4->enc) + 17;
    x4->reordered_opaque    = av_malloc_array(x4->nb_reordered_opaque,
                                              sizeof(*x4->reordered_opaque));
    if (!x4->reordered_opaque)
        return AVERROR(ENOMEM);

965 966 967
    return 0;
}

968
static const enum AVPixelFormat pix_fmts_8bit[] = {
969 970 971 972 973 974 975 976 977 978 979 980 981
    AV_PIX_FMT_YUV420P,
    AV_PIX_FMT_YUVJ420P,
    AV_PIX_FMT_YUV422P,
    AV_PIX_FMT_YUVJ422P,
    AV_PIX_FMT_YUV444P,
    AV_PIX_FMT_YUVJ444P,
    AV_PIX_FMT_NV12,
    AV_PIX_FMT_NV16,
#ifdef X264_CSP_NV21
    AV_PIX_FMT_NV21,
#endif
    AV_PIX_FMT_NONE
};
982 983 984 985
/**
 * Pixel formats offered for 9-bit encoding, terminated by AV_PIX_FMT_NONE.
 *
 * Selected by X264_init_static() when x264_bit_depth == 9 (X264_BUILD < 153).
 */
static const enum AVPixelFormat pix_fmts_9bit[] = {
    AV_PIX_FMT_YUV420P9,
    AV_PIX_FMT_YUV444P9,
    AV_PIX_FMT_NONE
};
987 988 989 990
static const enum AVPixelFormat pix_fmts_10bit[] = {
    AV_PIX_FMT_YUV420P10,
    AV_PIX_FMT_YUV422P10,
    AV_PIX_FMT_YUV444P10,
991
    AV_PIX_FMT_NV20,
992
    AV_PIX_FMT_NONE
993
};
994
static const enum AVPixelFormat pix_fmts_all[] = {
995 996 997
    AV_PIX_FMT_YUV420P,
    AV_PIX_FMT_YUVJ420P,
    AV_PIX_FMT_YUV422P,
998
    AV_PIX_FMT_YUVJ422P,
999
    AV_PIX_FMT_YUV444P,
1000
    AV_PIX_FMT_YUVJ444P,
1001 1002
    AV_PIX_FMT_NV12,
    AV_PIX_FMT_NV16,
1003 1004 1005
#ifdef X264_CSP_NV21
    AV_PIX_FMT_NV21,
#endif
1006 1007 1008
    AV_PIX_FMT_YUV420P10,
    AV_PIX_FMT_YUV422P10,
    AV_PIX_FMT_YUV444P10,
1009
    AV_PIX_FMT_NV20,
1010 1011 1012 1013
#ifdef X264_CSP_I400
    AV_PIX_FMT_GRAY8,
    AV_PIX_FMT_GRAY10,
#endif
1014
    AV_PIX_FMT_NONE
1015
};
1016
#if CONFIG_LIBX264RGB_ENCODER
/**
 * Packed RGB pixel formats used by the libx264rgb encoder definition,
 * terminated by AV_PIX_FMT_NONE.
 */
static const enum AVPixelFormat pix_fmts_8bit_rgb[] = {
    AV_PIX_FMT_BGR0,
    AV_PIX_FMT_BGR24,
    AV_PIX_FMT_RGB24,
    AV_PIX_FMT_NONE
};
#endif
1024 1025 1026

/**
 * Fill in codec->pix_fmts for the libx264 encoder.
 *
 * Hooked up as the init_static_data callback of ff_libx264_encoder.
 *
 * With X264_BUILD < 153 the list is picked from the x264_bit_depth global
 * (8, 9 or 10); for any other value codec->pix_fmts is left untouched.
 * With newer builds the combined pix_fmts_all list is always used.
 *
 * @param codec codec descriptor whose pix_fmts field is set
 */
static av_cold void X264_init_static(AVCodec *codec)
{
#if X264_BUILD < 153
    if (x264_bit_depth == 8)
        codec->pix_fmts = pix_fmts_8bit;
    else if (x264_bit_depth == 9)
        codec->pix_fmts = pix_fmts_9bit;
    else if (x264_bit_depth == 10)
        codec->pix_fmts = pix_fmts_10bit;
#else
    codec->pix_fmts = pix_fmts_all;
#endif
}

1039
#define OFFSET(x) offsetof(X264Context, x)
1040 1041
#define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
static const AVOption options[] = {
1042 1043 1044
    { "preset",        "Set the encoding preset (cf. x264 --fullhelp)",   OFFSET(preset),        AV_OPT_TYPE_STRING, { .str = "medium" }, 0, 0, VE},
    { "tune",          "Tune the encoding params (cf. x264 --fullhelp)",  OFFSET(tune),          AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
    { "profile",       "Set profile restrictions (cf. x264 --fullhelp) ", OFFSET(profile),       AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
1045
    { "fastfirstpass", "Use fast settings when encoding first pass",      OFFSET(fastfirstpass), AV_OPT_TYPE_BOOL, { .i64 = 1 }, 0, 1, VE},
1046 1047 1048
    {"level", "Specify level (as defined by Annex A)", OFFSET(level), AV_OPT_TYPE_STRING, {.str=NULL}, 0, 0, VE},
    {"passlogfile", "Filename for 2 pass stats", OFFSET(stats), AV_OPT_TYPE_STRING, {.str=NULL}, 0, 0, VE},
    {"wpredp", "Weighted prediction for P-frames", OFFSET(wpredp), AV_OPT_TYPE_STRING, {.str=NULL}, 0, 0, VE},
1049
    {"a53cc",          "Use A53 Closed Captions (if available)",          OFFSET(a53_cc),        AV_OPT_TYPE_BOOL,   {.i64 = 1}, 0, 1, VE},
1050
    {"x264opts", "x264 options", OFFSET(x264opts), AV_OPT_TYPE_STRING, {.str=NULL}, 0, 0, VE},
1051 1052
    { "crf",           "Select the quality for constant quality mode",    OFFSET(crf),           AV_OPT_TYPE_FLOAT,  {.dbl = -1 }, -1, FLT_MAX, VE },
    { "crf_max",       "In CRF mode, prevents VBV from lowering quality beyond this point.",OFFSET(crf_max), AV_OPT_TYPE_FLOAT, {.dbl = -1 }, -1, FLT_MAX, VE },
1053 1054
    { "qp",            "Constant quantization parameter rate control method",OFFSET(cqp),        AV_OPT_TYPE_INT,    { .i64 = -1 }, -1, INT_MAX, VE },
    { "aq-mode",       "AQ method",                                       OFFSET(aq_mode),       AV_OPT_TYPE_INT,    { .i64 = -1 }, -1, INT_MAX, VE, "aq_mode"},
1055 1056
    { "none",          NULL,                              0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_NONE},         INT_MIN, INT_MAX, VE, "aq_mode" },
    { "variance",      "Variance AQ (complexity mask)",   0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_VARIANCE},     INT_MIN, INT_MAX, VE, "aq_mode" },
1057 1058 1059 1060
    { "autovariance",  "Auto-variance AQ",                0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_AUTOVARIANCE}, INT_MIN, INT_MAX, VE, "aq_mode" },
#if X264_BUILD >= 144
    { "autovariance-biased", "Auto-variance AQ with bias to dark scenes", 0, AV_OPT_TYPE_CONST, {.i64 = X264_AQ_AUTOVARIANCE_BIASED}, INT_MIN, INT_MAX, VE, "aq_mode" },
#endif
1061
    { "aq-strength",   "AQ strength. Reduces blocking and blurring in flat and textured areas.", OFFSET(aq_strength), AV_OPT_TYPE_FLOAT, {.dbl = -1}, -1, FLT_MAX, VE},
1062
    { "psy",           "Use psychovisual optimizations.",                 OFFSET(psy),           AV_OPT_TYPE_BOOL,   { .i64 = -1 }, -1, 1, VE },
1063
    { "psy-rd",        "Strength of psychovisual optimization, in <psy-rd>:<psy-trellis> format.", OFFSET(psy_rd), AV_OPT_TYPE_STRING,  {0 }, 0, 0, VE},
1064
    { "rc-lookahead",  "Number of frames to look ahead for frametype and ratecontrol", OFFSET(rc_lookahead), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, VE },
1065
    { "weightb",       "Weighted prediction for B-frames.",               OFFSET(weightb),       AV_OPT_TYPE_BOOL,   { .i64 = -1 }, -1, 1, VE },
1066
    { "weightp",       "Weighted prediction analysis method.",            OFFSET(weightp),       AV_OPT_TYPE_INT,    { .i64 = -1 }, -1, INT_MAX, VE, "weightp" },
1067 1068 1069
    { "none",          NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_WEIGHTP_NONE},   INT_MIN, INT_MAX, VE, "weightp" },
    { "simple",        NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_WEIGHTP_SIMPLE}, INT_MIN, INT_MAX, VE, "weightp" },
    { "smart",         NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_WEIGHTP_SMART},  INT_MIN, INT_MAX, VE, "weightp" },
1070 1071 1072
    { "ssim",          "Calculate and print SSIM stats.",                 OFFSET(ssim),          AV_OPT_TYPE_BOOL,   { .i64 = -1 }, -1, 1, VE },
    { "intra-refresh", "Use Periodic Intra Refresh instead of IDR frames.",OFFSET(intra_refresh),AV_OPT_TYPE_BOOL,   { .i64 = -1 }, -1, 1, VE },
    { "bluray-compat", "Bluray compatibility workarounds.",               OFFSET(bluray_compat) ,AV_OPT_TYPE_BOOL,   { .i64 = -1 }, -1, 1, VE },
1073 1074
    { "b-bias",        "Influences how often B-frames are used",          OFFSET(b_bias),        AV_OPT_TYPE_INT,    { .i64 = INT_MIN}, INT_MIN, INT_MAX, VE },
    { "b-pyramid",     "Keep some B-frames as references.",               OFFSET(b_pyramid),     AV_OPT_TYPE_INT,    { .i64 = -1 }, -1, INT_MAX, VE, "b_pyramid" },
1075 1076 1077
    { "none",          NULL,                                  0, AV_OPT_TYPE_CONST, {.i64 = X264_B_PYRAMID_NONE},   INT_MIN, INT_MAX, VE, "b_pyramid" },
    { "strict",        "Strictly hierarchical pyramid",       0, AV_OPT_TYPE_CONST, {.i64 = X264_B_PYRAMID_STRICT}, INT_MIN, INT_MAX, VE, "b_pyramid" },
    { "normal",        "Non-strict (not Blu-ray compatible)", 0, AV_OPT_TYPE_CONST, {.i64 = X264_B_PYRAMID_NORMAL}, INT_MIN, INT_MAX, VE, "b_pyramid" },
1078 1079 1080 1081 1082
    { "mixed-refs",    "One reference per partition, as opposed to one reference per macroblock", OFFSET(mixed_refs), AV_OPT_TYPE_BOOL, { .i64 = -1}, -1, 1, VE },
    { "8x8dct",        "High profile 8x8 transform.",                     OFFSET(dct8x8),        AV_OPT_TYPE_BOOL,   { .i64 = -1 }, -1, 1, VE},
    { "fast-pskip",    NULL,                                              OFFSET(fast_pskip),    AV_OPT_TYPE_BOOL,   { .i64 = -1 }, -1, 1, VE},
    { "aud",           "Use access unit delimiters.",                     OFFSET(aud),           AV_OPT_TYPE_BOOL,   { .i64 = -1 }, -1, 1, VE},
    { "mbtree",        "Use macroblock tree ratecontrol.",                OFFSET(mbtree),        AV_OPT_TYPE_BOOL,   { .i64 = -1 }, -1, 1, VE},
1083
    { "deblock",       "Loop filter parameters, in <alpha:beta> form.",   OFFSET(deblock),       AV_OPT_TYPE_STRING, { 0 },  0, 0, VE},
1084
    { "cplxblur",      "Reduce fluctuations in QP (before curve compression)", OFFSET(cplxblur), AV_OPT_TYPE_FLOAT,  {.dbl = -1 }, -1, FLT_MAX, VE},
1085
    { "partitions",    "A comma-separated list of partitions to consider. "
1086
                       "Possible values: p8x8, p4x4, b8x8, i8x8, i4x4, none, all", OFFSET(partitions), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE},
1087
    { "direct-pred",   "Direct MV prediction mode",                       OFFSET(direct_pred),   AV_OPT_TYPE_INT,    { .i64 = -1 }, -1, INT_MAX, VE, "direct-pred" },
1088 1089 1090 1091
    { "none",          NULL,      0,    AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_NONE },     0, 0, VE, "direct-pred" },
    { "spatial",       NULL,      0,    AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_SPATIAL },  0, 0, VE, "direct-pred" },
    { "temporal",      NULL,      0,    AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_TEMPORAL }, 0, 0, VE, "direct-pred" },
    { "auto",          NULL,      0,    AV_OPT_TYPE_CONST, { .i64 = X264_DIRECT_PRED_AUTO },     0, 0, VE, "direct-pred" },
1092
    { "slice-max-size","Limit the size of each slice in bytes",           OFFSET(slice_max_size),AV_OPT_TYPE_INT,    { .i64 = -1 }, -1, INT_MAX, VE },
1093
    { "stats",         "Filename for 2 pass stats",                       OFFSET(stats),         AV_OPT_TYPE_STRING, { 0 },  0,       0, VE },
1094 1095 1096 1097 1098
    { "nal-hrd",       "Signal HRD information (requires vbv-bufsize; "
                       "cbr not allowed in .mp4)",                        OFFSET(nal_hrd),       AV_OPT_TYPE_INT,    { .i64 = -1 }, -1, INT_MAX, VE, "nal-hrd" },
    { "none",          NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_NAL_HRD_NONE}, INT_MIN, INT_MAX, VE, "nal-hrd" },
    { "vbr",           NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_NAL_HRD_VBR},  INT_MIN, INT_MAX, VE, "nal-hrd" },
    { "cbr",           NULL, 0, AV_OPT_TYPE_CONST, {.i64 = X264_NAL_HRD_CBR},  INT_MIN, INT_MAX, VE, "nal-hrd" },
1099
    { "avcintra-class","AVC-Intra class 50/100/200",                      OFFSET(avcintra_class),AV_OPT_TYPE_INT,     { .i64 = -1 }, -1, 200   , VE},
1100
    { "me_method",    "Set motion estimation method",                     OFFSET(motion_est),    AV_OPT_TYPE_INT,    { .i64 = -1 }, -1, X264_ME_TESA, VE, "motion-est"},
1101 1102 1103 1104 1105 1106
    { "motion-est",   "Set motion estimation method",                     OFFSET(motion_est),    AV_OPT_TYPE_INT,    { .i64 = -1 }, -1, X264_ME_TESA, VE, "motion-est"},
    { "dia",           NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_ME_DIA },  INT_MIN, INT_MAX, VE, "motion-est" },
    { "hex",           NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_ME_HEX },  INT_MIN, INT_MAX, VE, "motion-est" },
    { "umh",           NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_ME_UMH },  INT_MIN, INT_MAX, VE, "motion-est" },
    { "esa",           NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_ME_ESA },  INT_MIN, INT_MAX, VE, "motion-est" },
    { "tesa",          NULL, 0, AV_OPT_TYPE_CONST, { .i64 = X264_ME_TESA }, INT_MIN, INT_MAX, VE, "motion-est" },
1107
    { "forced-idr",   "If forcing keyframes, force them as IDR frames.",                                  OFFSET(forced_idr),  AV_OPT_TYPE_BOOL,   { .i64 = 0 }, -1, 1, VE },
1108 1109 1110 1111
    { "coder",    "Coder type",                                           OFFSET(coder), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE, "coder" },
    { "default",          NULL, 0, AV_OPT_TYPE_CONST, { .i64 = -1 }, INT_MIN, INT_MAX, VE, "coder" },
    { "cavlc",            NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 0 },  INT_MIN, INT_MAX, VE, "coder" },
    { "cabac",            NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 1 },  INT_MIN, INT_MAX, VE, "coder" },
1112 1113
    { "vlc",              NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 0 },  INT_MIN, INT_MAX, VE, "coder" },
    { "ac",               NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 1 },  INT_MIN, INT_MAX, VE, "coder" },
1114
    { "b_strategy",   "Strategy to choose between I/P/B-frames",          OFFSET(b_frame_strategy), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 2, VE },
1115 1116 1117
    { "chromaoffset", "QP difference between chroma and luma",            OFFSET(chroma_offset), AV_OPT_TYPE_INT, { .i64 = -1 }, INT_MIN, INT_MAX, VE },
    { "sc_threshold", "Scene change threshold",                           OFFSET(scenechange_threshold), AV_OPT_TYPE_INT, { .i64 = -1 }, INT_MIN, INT_MAX, VE },
    { "noise_reduction", "Noise reduction",                               OFFSET(noise_reduction), AV_OPT_TYPE_INT, { .i64 = -1 }, INT_MIN, INT_MAX, VE },
1118

1119
    { "x264-params",  "Override the x264 configuration using a :-separated list of key=value parameters", OFFSET(x264_params), AV_OPT_TYPE_STRING, { 0 }, 0, 0, VE },
1120 1121 1122
    { NULL },
};

1123 1124
/**
 * Default values for generic (non-private) codec options, attached to all
 * three encoder definitions in this file through their .defaults field.
 *
 * Most entries are "-1"; X264_init() forwards values such as keyint_min to
 * x264 only when they are >= 0. Entries wrapped in FF_API_* guards exist
 * only while the corresponding deprecated option is still compiled in.
 */
static const AVCodecDefault x264_defaults[] = {
    { "b",                "0" },
    { "bf",               "-1" },
    { "flags2",           "0" },
    { "g",                "-1" },
    { "i_qfactor",        "-1" },
    { "b_qfactor",        "-1" },
    { "qmin",             "-1" },
    { "qmax",             "-1" },
    { "qdiff",            "-1" },
    { "qblur",            "-1" },
    { "qcomp",            "-1" },
//     { "rc_lookahead",     "-1" },
    { "refs",             "-1" },
#if FF_API_PRIVATE_OPT
    { "sc_threshold",     "-1" },
#endif
    { "trellis",          "-1" },
#if FF_API_PRIVATE_OPT
    { "nr",               "-1" },
#endif
    { "me_range",         "-1" },
    { "subq",             "-1" },
#if FF_API_PRIVATE_OPT
    { "b_strategy",       "-1" },
#endif
    { "keyint_min",       "-1" },
#if FF_API_CODER_TYPE
    { "coder",            "-1" },
#endif
    { "cmp",              "-1" },
    { "threads",          AV_STRINGIFY(X264_THREADS_AUTO) },
    { "thread_type",      "0" },
    { "flags",            "+cgop" },
    { "rc_init_occupancy","-1" },
    { NULL },
};

1161
#if CONFIG_LIBX264_ENCODER
/* AVClass exposing the shared private option table under the name "libx264". */
static const AVClass x264_class = {
    .class_name = "libx264",
    .item_name  = av_default_item_name,
    .option     = options,
    .version    = LIBAVUTIL_VERSION_INT,
};

/**
 * libx264 H.264 encoder definition.
 *
 * pix_fmts is not set here; it is filled in by X264_init_static() through
 * the init_static_data hook.
 */
AVCodec ff_libx264_encoder = {
    .name             = "libx264",
    .long_name        = NULL_IF_CONFIG_SMALL("libx264 H.264 / AVC / MPEG-4 AVC / MPEG-4 part 10"),
    .type             = AVMEDIA_TYPE_VIDEO,
    .id               = AV_CODEC_ID_H264,
    .priv_data_size   = sizeof(X264Context),
    .init             = X264_init,
    .encode2          = X264_frame,
    .close            = X264_close,
    .capabilities     = AV_CODEC_CAP_DELAY | AV_CODEC_CAP_AUTO_THREADS |
                        AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE,
    .priv_class       = &x264_class,
    .defaults         = x264_defaults,
    .init_static_data = X264_init_static,
    /* INIT_THREADSAFE is only advertised for X264_BUILD >= 158. */
#if X264_BUILD >= 158
    .caps_internal    = FF_CODEC_CAP_INIT_CLEANUP | FF_CODEC_CAP_INIT_THREADSAFE,
#else
    .caps_internal    = FF_CODEC_CAP_INIT_CLEANUP,
#endif
    .wrapper_name     = "libx264",
};
#endif

#if CONFIG_LIBX264RGB_ENCODER
/* AVClass exposing the shared private option table under the name "libx264rgb". */
static const AVClass rgbclass = {
    .class_name = "libx264rgb",
    .item_name  = av_default_item_name,
    .option     = options,
    .version    = LIBAVUTIL_VERSION_INT,
};

/**
 * libx264 H.264 encoder definition for packed RGB input.
 *
 * Uses the same init/encode/close callbacks as libx264, but with a fixed
 * pixel format list (pix_fmts_8bit_rgb) and no init_static_data hook.
 */
AVCodec ff_libx264rgb_encoder = {
    .name           = "libx264rgb",
    .long_name      = NULL_IF_CONFIG_SMALL("libx264 H.264 / AVC / MPEG-4 AVC / MPEG-4 part 10 RGB"),
    .type           = AVMEDIA_TYPE_VIDEO,
    .id             = AV_CODEC_ID_H264,
    .priv_data_size = sizeof(X264Context),
    .init           = X264_init,
    .encode2        = X264_frame,
    .close          = X264_close,
    .capabilities   = AV_CODEC_CAP_DELAY | AV_CODEC_CAP_AUTO_THREADS |
                      AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE,
    .priv_class     = &rgbclass,
    .defaults       = x264_defaults,
    .pix_fmts       = pix_fmts_8bit_rgb,
    /* INIT_THREADSAFE is only advertised for X264_BUILD >= 158. */
#if X264_BUILD >= 158
    .caps_internal  = FF_CODEC_CAP_INIT_CLEANUP | FF_CODEC_CAP_INIT_THREADSAFE,
#else
    .caps_internal  = FF_CODEC_CAP_INIT_CLEANUP,
#endif
    .wrapper_name   = "libx264",
};
#endif

#if CONFIG_LIBX262_ENCODER
/* AVClass exposing the shared private option table under the name "libx262". */
static const AVClass X262_class = {
    .class_name = "libx262",
    .item_name  = av_default_item_name,
    .option     = options,
    .version    = LIBAVUTIL_VERSION_INT,
};

/**
 * libx262 MPEG-2 video encoder definition.
 *
 * Uses the same init/encode/close callbacks and option table as libx264,
 * with a fixed 8-bit pixel format list. Unlike the H.264 definitions it
 * never advertises FF_CODEC_CAP_INIT_THREADSAFE, and its wrapper_name is
 * "libx264".
 */
AVCodec ff_libx262_encoder = {
    .name             = "libx262",
    .long_name        = NULL_IF_CONFIG_SMALL("libx262 MPEG2VIDEO"),
    .type             = AVMEDIA_TYPE_VIDEO,
    .id               = AV_CODEC_ID_MPEG2VIDEO,
    .priv_data_size   = sizeof(X264Context),
    .init             = X264_init,
    .encode2          = X264_frame,
    .close            = X264_close,
    .capabilities     = AV_CODEC_CAP_DELAY | AV_CODEC_CAP_AUTO_THREADS |
                        AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE,
    .priv_class       = &X262_class,
    .defaults         = x264_defaults,
    .pix_fmts         = pix_fmts_8bit,
    .caps_internal    = FF_CODEC_CAP_INIT_CLEANUP,
    .wrapper_name     = "libx264",
};
#endif