libschroedingerenc.c 15.7 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22
/*
 * Dirac encoder support via Schroedinger libraries
 * Copyright (c) 2008 BBC, Anuradha Suraparaju <asuraparaju at gmail dot com >
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
* @file
* Dirac encoder support via libschroedinger-1.0 libraries. More details about
* the Schroedinger project can be found at http://www.diracvideo.org/.
* The library implements Dirac Specification Version 2.2
* (http://dirac.sourceforge.net/specification.html).
*/

#include <schroedinger/schro.h>
#include <schroedinger/schrodebug.h>
#include <schroedinger/schrovideoformat.h>

34
#include "libavutil/attributes.h"
35
#include "libavutil/avassert.h"
36
#include "avcodec.h"
37
#include "internal.h"
38
#include "libschroedinger.h"
David Conrad's avatar
David Conrad committed
39
#include "bytestream.h"
40 41 42


/** libschroedinger encoder private data */
43
typedef struct SchroEncoderParams {
44 45 46 47 48 49 50 51 52 53 54 55
    /** Schroedinger video format */
    SchroVideoFormat *format;

    /** Schroedinger frame format */
    SchroFrameFormat frame_format;

    /** frame size */
    int frame_size;

    /** Schroedinger encoder handle*/
    SchroEncoder* encoder;

56 57 58 59 60 61
    /** buffer to store encoder output before writing it to the frame queue*/
    unsigned char *enc_buf;

    /** Size of encoder buffer*/
    int enc_buf_size;

62
    /** queue storing encoded frames */
63
    FFSchroQueue enc_frame_queue;
64 65 66 67 68 69

    /** end of sequence signalled */
    int eos_signalled;

    /** end of sequence pulled */
    int eos_pulled;
70 71 72

    /* counter for frames submitted to encoder, used as dts */
    int64_t dts;
73
} SchroEncoderParams;
74 75 76 77

/**
* Works out Schro-compatible chroma format.
*/
78
static int set_chroma_format(AVCodecContext *avctx)
79
{
80 81
    int num_formats = sizeof(schro_pixel_format_map) /
                      sizeof(schro_pixel_format_map[0]);
82 83
    int idx;

84
    SchroEncoderParams *p_schro_params = avctx->priv_data;
85 86

    for (idx = 0; idx < num_formats; ++idx) {
87
        if (schro_pixel_format_map[idx].ff_pix_fmt == avctx->pix_fmt) {
88
            p_schro_params->format->chroma_format =
89
                            schro_pixel_format_map[idx].schro_pix_fmt;
90 91 92 93
            return 0;
        }
    }

94
    av_log(avctx, AV_LOG_ERROR,
95 96
           "This codec currently only supports planar YUV 4:2:0, 4:2:2"
           " and 4:4:4 formats.\n");
97 98 99 100

    return -1;
}

101
/**
 * Create the Schroedinger encoder and configure it from the codec context.
 *
 * Sets up the video format (dimensions, chroma format, colour description,
 * frame rate, 8-bit signal range), the GOP structure, the rate-control mode
 * and the interlaced/open-GOP settings, then starts the encoder and
 * initializes the encoded-frame queue.
 *
 * @param avctx codec context; priv_data holds the SchroEncoderParams
 * @return 0 on success, a negative value on failure. On failure the encoder
 *         handle and the video format copy created here are released again.
 */
static av_cold int libschroedinger_encode_init(AVCodecContext *avctx)
{
    SchroEncoderParams *p_schro_params = avctx->priv_data;
    SchroVideoFormatEnum preset;
    int ret;

    /* Initialize the libraries that libschroedinger depends on. */
    schro_init();

    /* Create an encoder object. */
    p_schro_params->encoder = schro_encoder_new();

    if (!p_schro_params->encoder) {
        av_log(avctx, AV_LOG_ERROR,
               "Unrecoverable Error: schro_encoder_new failed.\n");
        return -1;
    }

    /* Initialize the format. */
    preset = ff_get_schro_video_format_preset(avctx);
    p_schro_params->format =
                    schro_encoder_get_video_format(p_schro_params->encoder);
    schro_video_format_set_std_video_format(p_schro_params->format, preset);
    p_schro_params->format->width  = avctx->width;
    p_schro_params->format->height = avctx->height;

    if (set_chroma_format(avctx) == -1) {
        ret = -1;
        goto fail;
    }

    /* Only the colour descriptions listed here are mapped; any other value
     * leaves the setting chosen by the preset untouched. */
    if (avctx->color_primaries == AVCOL_PRI_BT709) {
        p_schro_params->format->colour_primaries = SCHRO_COLOUR_PRIMARY_HDTV;
    } else if (avctx->color_primaries == AVCOL_PRI_BT470BG) {
        p_schro_params->format->colour_primaries = SCHRO_COLOUR_PRIMARY_SDTV_625;
    } else if (avctx->color_primaries == AVCOL_PRI_SMPTE170M) {
        p_schro_params->format->colour_primaries = SCHRO_COLOUR_PRIMARY_SDTV_525;
    }

    if (avctx->colorspace == AVCOL_SPC_BT709) {
        p_schro_params->format->colour_matrix = SCHRO_COLOUR_MATRIX_HDTV;
    } else if (avctx->colorspace == AVCOL_SPC_BT470BG) {
        p_schro_params->format->colour_matrix = SCHRO_COLOUR_MATRIX_SDTV;
    }

    if (avctx->color_trc == AVCOL_TRC_BT709) {
        p_schro_params->format->transfer_function = SCHRO_TRANSFER_CHAR_TV_GAMMA;
    }

    if (ff_get_schro_frame_format(p_schro_params->format->chroma_format,
                                  &p_schro_params->frame_format) == -1) {
        av_log(avctx, AV_LOG_ERROR,
               "This codec currently supports only planar YUV 4:2:0, 4:2:2"
               " and 4:4:4 formats.\n");
        ret = -1;
        goto fail;
    }

    /* The frame rate is the inverse of the time base. */
    p_schro_params->format->frame_rate_numerator   = avctx->time_base.den;
    p_schro_params->format->frame_rate_denominator = avctx->time_base.num;

    p_schro_params->frame_size = avpicture_get_size(avctx->pix_fmt,
                                                    avctx->width,
                                                    avctx->height);

    avctx->coded_frame = av_frame_alloc();
    if (!avctx->coded_frame) {
        ret = AVERROR(ENOMEM);
        goto fail;
    }

    if (!avctx->gop_size) {
        schro_encoder_setting_set_double(p_schro_params->encoder,
                                         "gop_structure",
                                         SCHRO_ENCODER_GOP_INTRA_ONLY);

        if (avctx->coder_type == FF_CODER_TYPE_VLC)
            schro_encoder_setting_set_double(p_schro_params->encoder,
                                             "enable_noarith", 1);
    } else {
        schro_encoder_setting_set_double(p_schro_params->encoder,
                                         "au_distance", avctx->gop_size);
        avctx->has_b_frames = 1;
        /* With reordering the dts counter starts one step before the pts. */
        p_schro_params->dts = -1;
    }

    /* FIXME - Need to handle SCHRO_ENCODER_RATE_CONTROL_LOW_DELAY. */
    if (avctx->flags & CODEC_FLAG_QSCALE) {
        if (!avctx->global_quality) {
            /* lossless coding */
            schro_encoder_setting_set_double(p_schro_params->encoder,
                                             "rate_control",
                                             SCHRO_ENCODER_RATE_CONTROL_LOSSLESS);
        } else {
            int quality;
            schro_encoder_setting_set_double(p_schro_params->encoder,
                                             "rate_control",
                                             SCHRO_ENCODER_RATE_CONTROL_CONSTANT_QUALITY);

            /* The value passed as "quality" is capped at 10. */
            quality = avctx->global_quality / FF_QP2LAMBDA;
            if (quality > 10)
                quality = 10;
            schro_encoder_setting_set_double(p_schro_params->encoder,
                                             "quality", quality);
        }
    } else {
        schro_encoder_setting_set_double(p_schro_params->encoder,
                                         "rate_control",
                                         SCHRO_ENCODER_RATE_CONTROL_CONSTANT_BITRATE);

        schro_encoder_setting_set_double(p_schro_params->encoder,
                                         "bitrate", avctx->bit_rate);
    }

    if (avctx->flags & CODEC_FLAG_INTERLACED_ME)
        /* All material can be coded as interlaced or progressive
           irrespective of the type of source material. */
        schro_encoder_setting_set_double(p_schro_params->encoder,
                                         "interlaced_coding", 1);

    schro_encoder_setting_set_double(p_schro_params->encoder, "open_gop",
                                     !(avctx->flags & CODEC_FLAG_CLOSED_GOP));

    /* FIXME: Signal range hardcoded to 8-bit data until both libschroedinger
     * and libdirac support other bit-depth data. */
    schro_video_format_set_std_signal_range(p_schro_params->format,
                                            SCHRO_SIGNAL_RANGE_8BIT_VIDEO);

    /* Set the encoder format. */
    schro_encoder_set_video_format(p_schro_params->encoder,
                                   p_schro_params->format);

    /* Set the debug level. */
    schro_debug_set_level(avctx->debug);

    schro_encoder_start(p_schro_params->encoder);

    /* Initialize the encoded frame queue. */
    ff_schro_queue_init(&p_schro_params->enc_frame_queue);
    return 0;

fail:
    /* Release what was created above so a failed init does not leak it.
     * NOTE(review): assumes the close callback is not invoked after a failed
     * init; confirm against the avcodec_open2() error path in use. */
    av_freep(&p_schro_params->format);
    schro_encoder_free(p_schro_params->encoder);
    p_schro_params->encoder = NULL;
    return ret;
}

237
static SchroFrame *libschroedinger_frame_from_data(AVCodecContext *avctx,
238
                                                   const AVFrame *frame)
239
{
240
    SchroEncoderParams *p_schro_params = avctx->priv_data;
241 242 243 244
    SchroFrame *in_frame;
    /* Input line size may differ from what the codec supports. Especially
     * when transcoding from one format to another. So use avpicture_layout
     * to copy the frame. */
245
    in_frame = ff_create_schro_frame(avctx, p_schro_params->frame_format);
246 247

    if (in_frame)
248 249
        avpicture_layout((const AVPicture *)frame, avctx->pix_fmt,
                          avctx->width, avctx->height,
250 251
                          in_frame->components[0].data,
                          p_schro_params->frame_size);
252 253 254 255

    return in_frame;
}

256
static void libschroedinger_free_frame(void *data)
257
{
258
    FFSchroEncodedFrame *enc_frame = data;
259

260
    av_freep(&enc_frame->p_encbuf);
261 262 263
    av_free(enc_frame);
}

264
static int libschroedinger_encode_frame(AVCodecContext *avctx, AVPacket *pkt,
265
                                        const AVFrame *frame, int *got_packet)
266 267
{
    int enc_size = 0;
268
    SchroEncoderParams *p_schro_params = avctx->priv_data;
269
    SchroEncoder *encoder = p_schro_params->encoder;
270
    struct FFSchroEncodedFrame *p_frame_output = NULL;
271 272 273 274
    int go = 1;
    SchroBuffer *enc_buf;
    int presentation_frame;
    int parse_code;
275
    int last_frame_in_sequence = 0;
276
    int pkt_size, ret;
277

278
    if (!frame) {
279 280 281 282 283 284 285
        /* Push end of sequence if not already signalled. */
        if (!p_schro_params->eos_signalled) {
            schro_encoder_end_of_stream(encoder);
            p_schro_params->eos_signalled = 1;
        }
    } else {
        /* Allocate frame data to schro input buffer. */
286
        SchroFrame *in_frame = libschroedinger_frame_from_data(avctx, frame);
287 288 289 290 291 292 293 294 295
        /* Load next frame. */
        schro_encoder_push_frame(encoder, in_frame);
    }

    if (p_schro_params->eos_pulled)
        go = 0;

    /* Now check to see if we have any output from the encoder. */
    while (go) {
296
        int err;
297
        SchroStateEnum state;
298
        state = schro_encoder_wait(encoder);
299
        switch (state) {
300 301
        case SCHRO_STATE_HAVE_BUFFER:
        case SCHRO_STATE_END_OF_STREAM:
302
            enc_buf = schro_encoder_pull(encoder, &presentation_frame);
303 304
            if (enc_buf->length <= 0)
                return AVERROR_BUG;
305 306 307 308 309 310
            parse_code = enc_buf->data[4];

            /* All non-frame data is prepended to actual frame data to
             * be able to set the pts correctly. So we don't write data
             * to the frame output queue until we actually have a frame
             */
311 312 313 314 315 316
            if ((err = av_reallocp(&p_schro_params->enc_buf,
                                   p_schro_params->enc_buf_size +
                                   enc_buf->length)) < 0) {
                p_schro_params->enc_buf_size = 0;
                return err;
            }
317

318
            memcpy(p_schro_params->enc_buf + p_schro_params->enc_buf_size,
319 320 321 322 323 324 325 326 327 328
                   enc_buf->data, enc_buf->length);
            p_schro_params->enc_buf_size += enc_buf->length;


            if (state == SCHRO_STATE_END_OF_STREAM) {
                p_schro_params->eos_pulled = 1;
                go = 0;
            }

            if (!SCHRO_PARSE_CODE_IS_PICTURE(parse_code)) {
329
                schro_buffer_unref(enc_buf);
330 331
                break;
            }
332 333

            /* Create output frame. */
334
            p_frame_output = av_mallocz(sizeof(FFSchroEncodedFrame));
335
            /* Set output data. */
336 337
            p_frame_output->size     = p_schro_params->enc_buf_size;
            p_frame_output->p_encbuf = p_schro_params->enc_buf;
338
            if (SCHRO_PARSE_CODE_IS_INTRA(parse_code) &&
339
                SCHRO_PARSE_CODE_IS_REFERENCE(parse_code))
340 341 342 343
                p_frame_output->key_frame = 1;

            /* Parse the coded frame number from the bitstream. Bytes 14
             * through 17 represesent the frame number. */
David Conrad's avatar
David Conrad committed
344
            p_frame_output->frame_num = AV_RB32(enc_buf->data + 13);
345

346 347
            ff_schro_queue_push_back(&p_schro_params->enc_frame_queue,
                                     p_frame_output);
348 349 350
            p_schro_params->enc_buf_size = 0;
            p_schro_params->enc_buf      = NULL;

351
            schro_buffer_unref(enc_buf);
352 353 354 355 356 357 358 359 360 361 362

            break;

        case SCHRO_STATE_NEED_FRAME:
            go = 0;
            break;

        case SCHRO_STATE_AGAIN:
            break;

        default:
363
            av_log(avctx, AV_LOG_ERROR, "Unknown Schro Encoder state\n");
364 365 366 367 368
            return -1;
        }
    }

    /* Copy 'next' frame in queue. */
369 370 371 372 373

    if (p_schro_params->enc_frame_queue.size == 1 &&
        p_schro_params->eos_pulled)
        last_frame_in_sequence = 1;

374
    p_frame_output = ff_schro_queue_pop(&p_schro_params->enc_frame_queue);
375

376
    if (!p_frame_output)
377 378
        return 0;

379 380 381
    pkt_size = p_frame_output->size;
    if (last_frame_in_sequence && p_schro_params->enc_buf_size > 0)
        pkt_size += p_schro_params->enc_buf_size;
382
    if ((ret = ff_alloc_packet2(avctx, pkt, pkt_size)) < 0)
383 384 385
        goto error;

    memcpy(pkt->data, p_frame_output->p_encbuf, p_frame_output->size);
386
    avctx->coded_frame->key_frame = p_frame_output->key_frame;
387 388 389
    /* Use the frame number of the encoded frame as the pts. It is OK to
     * do so since Dirac is a constant frame rate codec. It expects input
     * to be of constant frame rate. */
390
    pkt->pts =
391
    avctx->coded_frame->pts = p_frame_output->frame_num;
392
    pkt->dts = p_schro_params->dts++;
393 394
    enc_size = p_frame_output->size;

395 396
    /* Append the end of sequence information to the last frame in the
     * sequence. */
397
    if (last_frame_in_sequence && p_schro_params->enc_buf_size > 0) {
398
        memcpy(pkt->data + enc_size, p_schro_params->enc_buf,
399
               p_schro_params->enc_buf_size);
400
        enc_size += p_schro_params->enc_buf_size;
401
        av_freep(&p_schro_params->enc_buf);
402 403 404
        p_schro_params->enc_buf_size = 0;
    }

405 406 407 408 409
    if (p_frame_output->key_frame)
        pkt->flags |= AV_PKT_FLAG_KEY;
    *got_packet = 1;

error:
410
    /* free frame */
411
    libschroedinger_free_frame(p_frame_output);
412
    return ret;
413 414 415
}


416
/**
 * Tear down the encoder and release everything held in the private context.
 *
 * @param avctx codec context; priv_data holds the SchroEncoderParams
 * @return always 0
 */
static int libschroedinger_encode_close(AVCodecContext *avctx)
{
    SchroEncoderParams *ctx = avctx->priv_data;

    /* Shut down the Schroedinger encoder instance. */
    schro_encoder_free(ctx->encoder);

    /* Drop any encoded frames that were never returned as packets. */
    ff_schro_queue_free(&ctx->enc_frame_queue, libschroedinger_free_frame);

    /* Release pending encoder output, if any bytes are accumulated. */
    if (ctx->enc_buf_size != 0)
        av_freep(&ctx->enc_buf);

    /* Release the video format structure. */
    av_freep(&ctx->format);

    av_frame_free(&avctx->coded_frame);

    return 0;
}


441
AVCodec ff_libschroedinger_encoder = {
442
    .name           = "libschroedinger",
443
    .long_name      = NULL_IF_CONFIG_SMALL("libschroedinger Dirac 2.2"),
444
    .type           = AVMEDIA_TYPE_VIDEO,
445
    .id             = AV_CODEC_ID_DIRAC,
446
    .priv_data_size = sizeof(SchroEncoderParams),
447
    .init           = libschroedinger_encode_init,
448
    .encode2        = libschroedinger_encode_frame,
449
    .close          = libschroedinger_encode_close,
450
    .capabilities   = CODEC_CAP_DELAY,
451 452
    .pix_fmts       = (const enum AVPixelFormat[]){
        AV_PIX_FMT_YUV420P, AV_PIX_FMT_YUV422P, AV_PIX_FMT_YUV444P, AV_PIX_FMT_NONE
453
    },
454
};