/*
 * HEVC Supplementary Enhancement Information messages
 *
 * Copyright (C) 2012 - 2013 Guillaume Martres
 * Copyright (C) 2012 - 2013 Gildas Cocherel
 * Copyright (C) 2013 Vittorio Giovara
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include "golomb.h"
#include "hevc_ps.h"
#include "hevc_sei.h"

29
static int decode_nal_sei_decoded_picture_hash(HEVCSEIPictureHash *s, GetBitContext *gb)
30 31 32 33 34 35 36
{
    int cIdx, i;
    uint8_t hash_type;
    //uint16_t picture_crc;
    //uint32_t picture_checksum;
    hash_type = get_bits(gb, 8);

37 38
    for (cIdx = 0; cIdx < 3/*((s->sps->chroma_format_idc == 0) ? 1 : 3)*/; cIdx++) {
        if (hash_type == 0) {
39
            s->is_md5 = 1;
40
            for (i = 0; i < 16; i++)
41
                s->md5[cIdx][i] = get_bits(gb, 8);
42
        } else if (hash_type == 1) {
43 44
            // picture_crc = get_bits(gb, 16);
            skip_bits(gb, 16);
45
        } else if (hash_type == 2) {
46
            // picture_checksum = get_bits_long(gb, 32);
47 48 49
            skip_bits(gb, 32);
        }
    }
50
    return 0;
51 52
}

53
static int decode_nal_sei_mastering_display_info(HEVCSEIMasteringDisplay *s, GetBitContext *gb)
54 55 56 57 58 59 60 61 62 63 64 65
{
    int i;
    // Mastering primaries
    for (i = 0; i < 3; i++) {
        s->display_primaries[i][0] = get_bits(gb, 16);
        s->display_primaries[i][1] = get_bits(gb, 16);
    }
    // White point (x, y)
    s->white_point[0] = get_bits(gb, 16);
    s->white_point[1] = get_bits(gb, 16);

    // Max and min luminance of mastering display
66 67
    s->max_luminance = get_bits_long(gb, 32);
    s->min_luminance = get_bits_long(gb, 32);
68 69 70 71

    // As this SEI message comes before the first frame that references it,
    // initialize the flag to 2 and decrement on IRAP access unit so it
    // persists for the coded video sequence (e.g., between two IRAPs)
72
    s->present = 2;
73 74 75
    return 0;
}

76
static int decode_nal_sei_content_light_info(HEVCSEIContentLight *s, GetBitContext *gb)
77 78 79 80 81 82 83
{
    // Max and average light levels
    s->max_content_light_level     = get_bits_long(gb, 16);
    s->max_pic_average_light_level = get_bits_long(gb, 16);
    // As this SEI message comes before the first frame that references it,
    // initialize the flag to 2 and decrement on IRAP access unit so it
    // persists for the coded video sequence (e.g., between two IRAPs)
84
    s->present = 2;
85 86 87
    return  0;
}

88
static int decode_nal_sei_frame_packing_arrangement(HEVCSEIFramePacking *s, GetBitContext *gb)
89
{
90
    get_ue_golomb_long(gb);             // frame_packing_arrangement_id
91
    s->present = !get_bits1(gb);
92

93 94
    if (s->present) {
        s->arrangement_type               = get_bits(gb, 7);
95 96
        s->quincunx_subsampling           = get_bits1(gb);
        s->content_interpretation_type    = get_bits(gb, 6);
97

98 99 100 101 102
        // spatial_flipping_flag, frame0_flipped_flag, field_views_flag
        skip_bits(gb, 3);
        s->current_frame_is_frame0_flag = get_bits1(gb);
        // frame0_self_contained_flag, frame1_self_contained_flag
        skip_bits(gb, 2);
103

104
        if (!s->quincunx_subsampling && s->arrangement_type != 5)
105 106
            skip_bits(gb, 16);  // frame[01]_grid_position_[xy]
        skip_bits(gb, 8);       // frame_packing_arrangement_reserved_byte
107
        skip_bits1(gb);         // frame_packing_arrangement_persistence_flag
108
    }
109
    skip_bits1(gb);             // upsampled_aspect_ratio_flag
110
    return 0;
111 112
}

113
static int decode_nal_sei_display_orientation(HEVCSEIDisplayOrientation *s, GetBitContext *gb)
114
{
115
    s->present = !get_bits1(gb);
116

117 118 119
    if (s->present) {
        s->hflip = get_bits1(gb);     // hor_flip
        s->vflip = get_bits1(gb);     // ver_flip
120

121
        s->anticlockwise_rotation = get_bits(gb, 16);
122 123
        skip_bits1(gb);     // display_orientation_persistence_flag
    }
124 125

    return 0;
126 127
}

128
static int decode_nal_sei_pic_timing(HEVCSEI *s, GetBitContext *gb, const HEVCParamSets *ps,
129
                                     void *logctx, int size)
130
{
131
    HEVCSEIPictureTiming *h = &s->picture_timing;
132
    HEVCSPS *sps;
133

134
    if (!ps->sps_list[s->active_seq_parameter_set_id])
135
        return(AVERROR(ENOMEM));
136
    sps = (HEVCSPS*)ps->sps_list[s->active_seq_parameter_set_id]->data;
137 138 139

    if (sps->vui.frame_field_info_present_flag) {
        int pic_struct = get_bits(gb, 4);
140
        h->picture_struct = AV_PICTURE_STRUCTURE_UNKNOWN;
141
        if (pic_struct == 2 || pic_struct == 10 || pic_struct == 12) {
142 143
            av_log(logctx, AV_LOG_DEBUG, "BOTTOM Field\n");
            h->picture_struct = AV_PICTURE_STRUCTURE_BOTTOM_FIELD;
144
        } else if (pic_struct == 1 || pic_struct == 9 || pic_struct == 11) {
145 146
            av_log(logctx, AV_LOG_DEBUG, "TOP Field\n");
            h->picture_struct = AV_PICTURE_STRUCTURE_TOP_FIELD;
147 148 149
        }
        get_bits(gb, 2);                   // source_scan_type
        get_bits(gb, 1);                   // duplicate_flag
150 151
        skip_bits1(gb);
        size--;
152
    }
153 154 155
    skip_bits_long(gb, 8 * size);

    return 0;
156 157
}

158 159
static int decode_registered_user_data_closed_caption(HEVCSEIA53Caption *s, GetBitContext *gb,
                                                      int size)
160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179
{
    int flag;
    int user_data_type_code;
    int cc_count;

    if (size < 3)
       return AVERROR(EINVAL);

    user_data_type_code = get_bits(gb, 8);
    if (user_data_type_code == 0x3) {
        skip_bits(gb, 1); // reserved

        flag = get_bits(gb, 1); // process_cc_data_flag
        if (flag) {
            skip_bits(gb, 1);
            cc_count = get_bits(gb, 5);
            skip_bits(gb, 8); // reserved
            size -= 2;

            if (cc_count && size >= cc_count * 3) {
180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195
                const uint64_t new_size = (s->a53_caption_size + cc_count
                                           * UINT64_C(3));
                int i, ret;

                if (new_size > INT_MAX)
                    return AVERROR(EINVAL);

                /* Allow merging of the cc data from two fields. */
                ret = av_reallocp(&s->a53_caption, new_size);
                if (ret < 0)
                    return ret;

                for (i = 0; i < cc_count; i++) {
                    s->a53_caption[s->a53_caption_size++] = get_bits(gb, 8);
                    s->a53_caption[s->a53_caption_size++] = get_bits(gb, 8);
                    s->a53_caption[s->a53_caption_size++] = get_bits(gb, 8);
196 197 198 199 200
                }
                skip_bits(gb, 8); // marker_bits
            }
        }
    } else {
201
        int i;
202 203 204 205 206 207 208
        for (i = 0; i < size - 1; i++)
            skip_bits(gb, 8);
    }

    return 0;
}

209
static int decode_nal_sei_user_data_registered_itu_t_t35(HEVCSEI *s, GetBitContext *gb,
210
                                                         int size)
211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231
{
    uint32_t country_code;
    uint32_t user_identifier;

    if (size < 7)
        return AVERROR(EINVAL);
    size -= 7;

    country_code = get_bits(gb, 8);
    if (country_code == 0xFF) {
        skip_bits(gb, 8);
        size--;
    }

    skip_bits(gb, 8);
    skip_bits(gb, 8);

    user_identifier = get_bits_long(gb, 32);

    switch (user_identifier) {
        case MKBETAG('G', 'A', '9', '4'):
232
            return decode_registered_user_data_closed_caption(&s->a53_caption, gb, size);
233 234 235 236 237 238 239
        default:
            skip_bits_long(gb, size * 8);
            break;
    }
    return 0;
}

240
static int decode_nal_sei_active_parameter_sets(HEVCSEI *s, GetBitContext *gb, void *logctx)
241
{
242 243
    int num_sps_ids_minus1;
    int i;
244
    unsigned active_seq_parameter_set_id;
245 246 247 248 249 250

    get_bits(gb, 4); // active_video_parameter_set_id
    get_bits(gb, 1); // self_contained_cvs_flag
    get_bits(gb, 1); // num_sps_ids_minus1
    num_sps_ids_minus1 = get_ue_golomb_long(gb); // num_sps_ids_minus1

251
    if (num_sps_ids_minus1 < 0 || num_sps_ids_minus1 > 15) {
252
        av_log(logctx, AV_LOG_ERROR, "num_sps_ids_minus1 %d invalid\n", num_sps_ids_minus1);
253 254 255
        return AVERROR_INVALIDDATA;
    }

256
    active_seq_parameter_set_id = get_ue_golomb_long(gb);
James Almer's avatar
James Almer committed
257
    if (active_seq_parameter_set_id >= HEVC_MAX_SPS_COUNT) {
258
        av_log(logctx, AV_LOG_ERROR, "active_parameter_set_id %d invalid\n", active_seq_parameter_set_id);
259 260 261
        return AVERROR_INVALIDDATA;
    }
    s->active_seq_parameter_set_id = active_seq_parameter_set_id;
262 263 264

    for (i = 1; i <= num_sps_ids_minus1; i++)
        get_ue_golomb_long(gb); // active_seq_parameter_set_id[i]
265 266

    return 0;
267 268
}

269 270 271 272 273 274 275
static int decode_nal_sei_alternative_transfer(HEVCSEIAlternativeTransfer *s, GetBitContext *gb)
{
    s->present = 1;
    s->preferred_transfer_characteristics = get_bits(gb, 8);
    return 0;
}

276 277
static int decode_nal_sei_prefix(GetBitContext *gb, void *logctx, HEVCSEI *s,
                                 const HEVCParamSets *ps, int type, int size)
278 279 280
{
    switch (type) {
    case 256:  // Mismatched value from HM 8.1
281
        return decode_nal_sei_decoded_picture_hash(&s->picture_hash, gb);
282
    case HEVC_SEI_TYPE_FRAME_PACKING:
283
        return decode_nal_sei_frame_packing_arrangement(&s->frame_packing, gb);
284
    case HEVC_SEI_TYPE_DISPLAY_ORIENTATION:
285
        return decode_nal_sei_display_orientation(&s->display_orientation, gb);
286
    case HEVC_SEI_TYPE_PICTURE_TIMING:
287
        return decode_nal_sei_pic_timing(s, gb, ps, logctx, size);
288
    case HEVC_SEI_TYPE_MASTERING_DISPLAY_INFO:
289
        return decode_nal_sei_mastering_display_info(&s->mastering_display, gb);
290
    case HEVC_SEI_TYPE_CONTENT_LIGHT_LEVEL_INFO:
291
        return decode_nal_sei_content_light_info(&s->content_light, gb);
292
    case HEVC_SEI_TYPE_ACTIVE_PARAMETER_SETS:
293
        return decode_nal_sei_active_parameter_sets(s, gb, logctx);
294
    case HEVC_SEI_TYPE_USER_DATA_REGISTERED_ITU_T_T35:
295
        return decode_nal_sei_user_data_registered_itu_t_t35(s, gb, size);
296 297
    case HEVC_SEI_TYPE_ALTERNATIVE_TRANSFER_CHARACTERISTICS:
        return decode_nal_sei_alternative_transfer(&s->alternative_transfer, gb);
298
    default:
299
        av_log(logctx, AV_LOG_DEBUG, "Skipped PREFIX SEI %d\n", type);
300 301 302 303 304
        skip_bits_long(gb, 8 * size);
        return 0;
    }
}

305 306
static int decode_nal_sei_suffix(GetBitContext *gb, void *logctx, HEVCSEI *s,
                                 int type, int size)
307 308
{
    switch (type) {
309
    case HEVC_SEI_TYPE_DECODED_PICTURE_HASH:
310
        return decode_nal_sei_decoded_picture_hash(&s->picture_hash, gb);
311
    default:
312
        av_log(logctx, AV_LOG_DEBUG, "Skipped SUFFIX SEI %d\n", type);
313 314 315 316 317
        skip_bits_long(gb, 8 * size);
        return 0;
    }
}

318 319
static int decode_nal_sei_message(GetBitContext *gb, void *logctx, HEVCSEI *s,
                                  const HEVCParamSets *ps, int nal_unit_type)
320 321 322 323
{
    int payload_type = 0;
    int payload_size = 0;
    int byte = 0xFF;
324
    av_log(logctx, AV_LOG_DEBUG, "Decoding SEI\n");
325 326

    while (byte == 0xFF) {
327 328
        if (get_bits_left(gb) < 16 || payload_type > INT_MAX - 255)
            return AVERROR_INVALIDDATA;
329
        byte          = get_bits(gb, 8);
330 331 332 333
        payload_type += byte;
    }
    byte = 0xFF;
    while (byte == 0xFF) {
334 335
        if (get_bits_left(gb) < 8 + 8LL*payload_size)
            return AVERROR_INVALIDDATA;
336
        byte          = get_bits(gb, 8);
337 338
        payload_size += byte;
    }
339
    if (nal_unit_type == HEVC_NAL_SEI_PREFIX) {
340
        return decode_nal_sei_prefix(gb, logctx, s, ps, payload_type, payload_size);
341
    } else { /* nal_unit_type == NAL_SEI_SUFFIX */
342
        return decode_nal_sei_suffix(gb, logctx, s, payload_type, payload_size);
343 344 345 346 347 348 349 350
    }
}

/**
 * Tell whether another SEI message follows in the reader.
 *
 * @param gb bit reader to inspect (not advanced)
 * @return non-zero if bits remain and the next byte is not 0x80, else 0
 */
static int more_rbsp_data(GetBitContext *gb)
{
    if (get_bits_left(gb) <= 0)
        return 0;

    /* A next byte of 0x80 is treated as the end of the message data */
    return show_bits(gb, 8) != 0x80;
}

351
int ff_hevc_decode_nal_sei(GetBitContext *gb, void *logctx, HEVCSEI *s,
352
                           const HEVCParamSets *ps, int type)
353
{
354 355
    int ret;

356
    do {
357
        ret = decode_nal_sei_message(gb, logctx, s, ps, type);
358
        if (ret < 0)
359
            return ret;
360
    } while (more_rbsp_data(gb));
361
    return 1;
362
}
363

364
void ff_hevc_reset_sei(HEVCSEI *s)
365
{
366 367
    s->a53_caption.a53_caption_size = 0;
    av_freep(&s->a53_caption.a53_caption);
368
}