h264_mp4toannexb_bsf.c 9.93 KB
Newer Older
1
/*
2
 * H.264 MP4 to Annex B byte stream format filter
3
 * Copyright (c) 2007 Benoit Fouet <benoit.fouet@free.fr>
4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

22 23
#include <string.h>

24
#include "libavutil/avassert.h"
25
#include "libavutil/intreadwrite.h"
26
#include "libavutil/mem.h"
27

28
#include "avcodec.h"
29
#include "bsf.h"
30
#include "h264.h"
31 32

typedef struct H264BSFContext {
33 34
    int32_t  sps_offset;
    int32_t  pps_offset;
35
    uint8_t  length_size;
36
    uint8_t  new_idr;
37 38
    uint8_t  idr_sps_seen;
    uint8_t  idr_pps_seen;
39
    int      extradata_parsed;
40 41
} H264BSFContext;

42
static int alloc_and_copy(AVPacket *out,
43
                          const uint8_t *sps_pps, uint32_t sps_pps_size,
44
                          const uint8_t *in, uint32_t in_size, int ps)
45
{
46
    uint32_t offset         = out->size;
47
    uint8_t start_code_size = offset == 0 || ps ? 4 : 3;
48
    int err;
49

50
    err = av_grow_packet(out, sps_pps_size + in_size + start_code_size);
51
    if (err < 0)
52
        return err;
53

54
    if (sps_pps)
55
        memcpy(out->data + offset, sps_pps, sps_pps_size);
56 57 58
    memcpy(out->data + sps_pps_size + start_code_size + offset, in, in_size);
    if (start_code_size == 4) {
        AV_WB32(out->data + offset + sps_pps_size, 1);
59
    } else {
60 61 62
        (out->data + offset + sps_pps_size)[0] =
        (out->data + offset + sps_pps_size)[1] = 0;
        (out->data + offset + sps_pps_size)[2] = 1;
63
    }
64 65

    return 0;
66 67
}

68
static int h264_extradata_to_annexb(AVBSFContext *ctx, const int padding)
69
{
70
    H264BSFContext *s = ctx->priv_data;
71
    uint16_t unit_size;
72
    uint32_t total_size                 = 0;
73 74
    uint8_t *out                        = NULL, unit_nb, sps_done = 0,
             sps_seen                   = 0, pps_seen = 0;
75
    const uint8_t *extradata            = ctx->par_in->extradata + 4;
76 77 78
    static const uint8_t nalu_header[4] = { 0, 0, 0, 1 };
    int length_size = (*extradata++ & 0x3) + 1; // retrieve length coded size

79
    s->sps_offset = s->pps_offset = -1;
80

81 82 83
    /* retrieve sps and pps unit(s) */
    unit_nb = *extradata++ & 0x1f; /* number of sps unit(s) */
    if (!unit_nb) {
84
        goto pps;
85
    } else {
86
        s->sps_offset = 0;
87 88 89 90
        sps_seen = 1;
    }

    while (unit_nb--) {
91
        int err;
92 93 94

        unit_size   = AV_RB16(extradata);
        total_size += unit_size + 4;
95
        av_assert1(total_size <= INT_MAX - padding);
96 97
        if (extradata + 2 + unit_size > ctx->par_in->extradata + ctx->par_in->extradata_size) {
            av_log(ctx, AV_LOG_ERROR, "Packet header is not contained in global extradata, "
98
                   "corrupted stream or invalid MP4/AVCC bitstream\n");
99 100 101
            av_free(out);
            return AVERROR(EINVAL);
        }
102 103
        if ((err = av_reallocp(&out, total_size + padding)) < 0)
            return err;
104 105 106
        memcpy(out + total_size - unit_size - 4, nalu_header, 4);
        memcpy(out + total_size - unit_size, extradata + 2, unit_size);
        extradata += 2 + unit_size;
107
pps:
108 109
        if (!unit_nb && !sps_done++) {
            unit_nb = *extradata++; /* number of pps unit(s) */
110
            if (unit_nb) {
111
                s->pps_offset = total_size;
112
                pps_seen = 1;
113
            }
114 115 116 117
        }
    }

    if (out)
118
        memset(out + total_size, 0, padding);
119 120

    if (!sps_seen)
121
        av_log(ctx, AV_LOG_WARNING,
122 123 124 125
               "Warning: SPS NALU missing or invalid. "
               "The resulting stream may not play.\n");

    if (!pps_seen)
126
        av_log(ctx, AV_LOG_WARNING,
127 128 129
               "Warning: PPS NALU missing or invalid. "
               "The resulting stream may not play.\n");

130 131 132
    av_freep(&ctx->par_out->extradata);
    ctx->par_out->extradata      = out;
    ctx->par_out->extradata_size = total_size;
133 134 135 136

    return length_size;
}

137
static int h264_mp4toannexb_init(AVBSFContext *ctx)
138
{
139
    H264BSFContext *s = ctx->priv_data;
140
    int extra_size = ctx->par_in->extradata_size;
141 142 143
    int ret;

    /* retrieve sps and pps NAL units from extradata */
144 145 146 147 148 149
    if (!extra_size                                               ||
        (extra_size >= 3 && AV_RB24(ctx->par_in->extradata) == 1) ||
        (extra_size >= 4 && AV_RB32(ctx->par_in->extradata) == 1)) {
        av_log(ctx, AV_LOG_VERBOSE,
               "The input looks like it is Annex B already\n");
    } else if (extra_size >= 6) {
150 151 152 153 154
        ret = h264_extradata_to_annexb(ctx, AV_INPUT_BUFFER_PADDING_SIZE);
        if (ret < 0)
            return ret;

        s->length_size      = ret;
155 156 157
        s->new_idr          = 1;
        s->idr_sps_seen     = 0;
        s->idr_pps_seen     = 0;
158
        s->extradata_parsed = 1;
159 160 161
    } else {
        av_log(ctx, AV_LOG_ERROR, "Invalid extradata size: %d\n", extra_size);
        return AVERROR_INVALIDDATA;
162 163 164 165 166 167 168 169 170 171
    }

    return 0;
}

static int h264_mp4toannexb_filter(AVBSFContext *ctx, AVPacket *out)
{
    H264BSFContext *s = ctx->priv_data;

    AVPacket *in;
172
    uint8_t unit_type;
173
    int32_t nal_size;
174
    uint32_t cumul_size    = 0;
175 176 177
    const uint8_t *buf;
    const uint8_t *buf_end;
    int            buf_size;
178
    int ret = 0, i;
179

180 181 182
    ret = ff_bsf_get_packet(ctx, &in);
    if (ret < 0)
        return ret;
183 184

    /* nothing to filter */
185 186 187
    if (!s->extradata_parsed) {
        av_packet_move_ref(out, in);
        av_packet_free(&in);
188 189 190
        return 0;
    }

191 192 193
    buf      = in->data;
    buf_size = in->size;
    buf_end  = in->data + in->size;
194

195
    do {
196
        ret= AVERROR(EINVAL);
197
        if (buf + s->length_size > buf_end)
198 199
            goto fail;

200
        for (nal_size = 0, i = 0; i<s->length_size; i++)
201
            nal_size = (nal_size << 8) | buf[i];
202

203
        buf += s->length_size;
204 205
        unit_type = *buf & 0x1f;

206
        if (nal_size > buf_end - buf || nal_size < 0)
207 208
            goto fail;

209
        if (unit_type == H264_NAL_SPS)
210
            s->idr_sps_seen = s->new_idr = 1;
211
        else if (unit_type == H264_NAL_PPS) {
212
            s->idr_pps_seen = s->new_idr = 1;
213
            /* if SPS has not been seen yet, prepend the AVCC one to PPS */
214 215 216
            if (!s->idr_sps_seen) {
                if (s->sps_offset == -1)
                    av_log(ctx, AV_LOG_WARNING, "SPS not present in the stream, nor in AVCC, stream may be unreadable\n");
217
                else {
218 219 220
                    if ((ret = alloc_and_copy(out,
                                         ctx->par_out->extradata + s->sps_offset,
                                         s->pps_offset != -1 ? s->pps_offset : ctx->par_out->extradata_size - s->sps_offset,
221
                                         buf, nal_size, 1)) < 0)
222
                        goto fail;
223
                    s->idr_sps_seen = 1;
224 225 226 227
                    goto next_nal;
                }
            }
        }
228

229 230 231
        /* if this is a new IDR picture following an IDR picture, reset the idr flag.
         * Just check first_mb_in_slice to be 0 as this is the simplest solution.
         * This could be checking idr_pic_id instead, but would complexify the parsing. */
232
        if (!s->new_idr && unit_type == H264_NAL_IDR_SLICE && (buf[1] & 0x80))
233
            s->new_idr = 1;
234 235

        /* prepend only to the first type 5 NAL unit of an IDR picture, if no sps/pps are already present */
236
        if (s->new_idr && unit_type == H264_NAL_IDR_SLICE && !s->idr_sps_seen && !s->idr_pps_seen) {
237
            if ((ret=alloc_and_copy(out,
238
                               ctx->par_out->extradata, ctx->par_out->extradata_size,
239
                               buf, nal_size, 1)) < 0)
240
                goto fail;
241
            s->new_idr = 0;
242
        /* if only SPS has been seen, also insert PPS */
243
        } else if (s->new_idr && unit_type == H264_NAL_IDR_SLICE && s->idr_sps_seen && !s->idr_pps_seen) {
244 245
            if (s->pps_offset == -1) {
                av_log(ctx, AV_LOG_WARNING, "PPS not present in the stream, nor in AVCC, stream may be unreadable\n");
246
                if ((ret = alloc_and_copy(out, NULL, 0, buf, nal_size, 0)) < 0)
247
                    goto fail;
248 249
            } else if ((ret = alloc_and_copy(out,
                                        ctx->par_out->extradata + s->pps_offset, ctx->par_out->extradata_size - s->pps_offset,
250
                                        buf, nal_size, 1)) < 0)
251
                goto fail;
252
        } else {
253
            if ((ret=alloc_and_copy(out, NULL, 0, buf, nal_size, unit_type == H264_NAL_SPS || unit_type == H264_NAL_PPS)) < 0)
254
                goto fail;
255
            if (!s->new_idr && unit_type == H264_NAL_SLICE) {
256 257 258
                s->new_idr = 1;
                s->idr_sps_seen = 0;
                s->idr_pps_seen = 0;
259
            }
260 261
        }

262
next_nal:
263
        buf        += nal_size;
264
        cumul_size += nal_size + s->length_size;
265 266
    } while (cumul_size < buf_size);

267 268 269
    ret = av_packet_copy_props(out, in);
    if (ret < 0)
        goto fail;
270 271

fail:
272 273 274 275
    if (ret < 0)
        av_packet_unref(out);
    av_packet_free(&in);

276
    return ret;
277 278
}

279 280 281 282 283 284 285 286 287
static void h264_mp4toannexb_flush(AVBSFContext *ctx)
{
    H264BSFContext *s = ctx->priv_data;

    s->idr_sps_seen = 0;
    s->idr_pps_seen = 0;
    s->new_idr      = s->extradata_parsed;
}

288 289 290
static const enum AVCodecID codec_ids[] = {
    AV_CODEC_ID_H264, AV_CODEC_ID_NONE,
};
291

292
const AVBitStreamFilter ff_h264_mp4toannexb_bsf = {
293 294
    .name           = "h264_mp4toannexb",
    .priv_data_size = sizeof(H264BSFContext),
295
    .init           = h264_mp4toannexb_init,
296
    .filter         = h264_mp4toannexb_filter,
297
    .flush          = h264_mp4toannexb_flush,
298
    .codec_ids      = codec_ids,
299
};