hevc_sei.c 12.1 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
/*
 * HEVC Supplementary Enhancement Information messages
 *
 * Copyright (C) 2012 - 2013 Guillaume Martres
 * Copyright (C) 2012 - 2013 Gildas Cocherel
 * Copyright (C) 2013 Vittorio Giovara
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include "golomb.h"
26 27
#include "hevc_ps.h"
#include "hevc_sei.h"
28

29
/**
 * Parse a decoded picture hash SEI payload.
 *
 * Reads an 8-bit hash type, then one hash entry for each of three colour
 * components. Only hash type 0 is stored (16 bytes per component into
 * s->md5, with s->is_md5 set to 1). For types 1 and 2 the 16-bit resp.
 * 32-bit value is skipped. Any other type consumes no further bits.
 *
 * @param s  picture hash state to fill in
 * @param gb bit reader positioned at the start of the payload
 * @return always 0
 */
static int decode_nal_sei_decoded_picture_hash(HEVCSEIPictureHash *s, GetBitContext *gb)
{
    const uint8_t hash_type = get_bits(gb, 8);
    int comp;

    // Three components are always read; chroma_format_idc is not consulted.
    for (comp = 0; comp < 3; comp++) {
        int k;

        switch (hash_type) {
        case 0:     // 16 hash bytes per component, stored as MD5
            s->is_md5 = 1;
            for (k = 0; k < 16; k++)
                s->md5[comp][k] = get_bits(gb, 8);
            break;
        case 1:     // 16-bit value, not kept
            skip_bits(gb, 16);
            break;
        case 2:     // 32-bit value, not kept
            skip_bits(gb, 32);
            break;
        default:
            break;
        }
    }

    return 0;
}

53
/**
 * Parse a mastering display colour volume SEI payload.
 *
 * Reads three primaries and the white point as pairs of 16-bit values,
 * followed by the 32-bit maximum and minimum luminance.
 *
 * @param s  mastering display state to fill in
 * @param gb bit reader positioned at the start of the payload
 * @return always 0
 */
static int decode_nal_sei_mastering_display_info(HEVCSEIMasteringDisplay *s, GetBitContext *gb)
{
    int prim, coord;

    // Mastering primaries: three entries of two 16-bit coordinates each
    for (prim = 0; prim < 3; prim++)
        for (coord = 0; coord < 2; coord++)
            s->display_primaries[prim][coord] = get_bits(gb, 16);

    // White point (x, y)
    for (coord = 0; coord < 2; coord++)
        s->white_point[coord] = get_bits(gb, 16);

    // Luminance range of the mastering display, maximum first
    s->max_luminance = get_bits_long(gb, 32);
    s->min_luminance = get_bits_long(gb, 32);

    // This SEI arrives before the first frame that references it, so the
    // flag starts at 2 and is decremented on IRAP access units; that keeps
    // it alive for the whole coded video sequence (between two IRAPs).
    s->present = 2;

    return 0;
}

76
/**
 * Parse a content light level information SEI payload.
 *
 * Reads two 16-bit fields: the maximum content light level followed by the
 * maximum picture-average light level.
 *
 * @param s  content light state to fill in
 * @param gb bit reader positioned at the start of the payload
 * @return always 0
 */
static int decode_nal_sei_content_light_info(HEVCSEIContentLight *s, GetBitContext *gb)
{
    const unsigned max_level     = get_bits_long(gb, 16);
    const unsigned max_avg_level = get_bits_long(gb, 16);

    s->max_content_light_level     = max_level;
    s->max_pic_average_light_level = max_avg_level;

    // This SEI arrives before the first frame that references it, so the
    // flag starts at 2 and is decremented on IRAP access units; that keeps
    // it alive for the whole coded video sequence (between two IRAPs).
    s->present = 2;

    return 0;
}

88
/**
 * Parse a frame packing arrangement SEI payload.
 *
 * s->present is set to the inverse of the first flag bit after the
 * arrangement id (the cancel flag in the H.265 SEI syntax). Only when the
 * arrangement is present are the type, quincunx flag and content
 * interpretation type stored; all remaining fields are skipped.
 *
 * @param s  frame packing state to fill in
 * @param gb bit reader positioned at the start of the payload
 * @return always 0
 */
static int decode_nal_sei_frame_packing_arrangement(HEVCSEIFramePacking *s, GetBitContext *gb)
{
    int cancelled;

    get_ue_golomb_long(gb);                 // frame_packing_arrangement_id, ignored
    cancelled  = get_bits1(gb);
    s->present = !cancelled;

    if (!cancelled) {
        s->arrangement_type            = get_bits(gb, 7);
        s->quincunx_subsampling        = get_bits1(gb);
        s->content_interpretation_type = get_bits(gb, 6);

        // Six one-bit flags that are not kept: spatial_flipping_flag,
        // frame0_flipped_flag, field_views_flag,
        // current_frame_is_frame0_flag, frame0_self_contained_flag,
        // frame1_self_contained_flag
        skip_bits(gb, 6);

        // frame[01]_grid_position_[xy] is only coded in this case
        if (s->arrangement_type != 5 && !s->quincunx_subsampling)
            skip_bits(gb, 16);

        skip_bits(gb, 8);                   // frame_packing_arrangement_reserved_byte
        skip_bits1(gb);                     // frame_packing_arrangement_persistence_flag
    }

    skip_bits1(gb);                         // upsampled_aspect_ratio_flag

    return 0;
}

112
/**
 * Parse a display orientation SEI payload.
 *
 * s->present is the inverse of the leading flag bit. When present, the
 * horizontal and vertical flip flags and the 16-bit anticlockwise rotation
 * are stored, and the trailing persistence flag is skipped.
 *
 * @param s  display orientation state to fill in
 * @param gb bit reader positioned at the start of the payload
 * @return always 0
 */
static int decode_nal_sei_display_orientation(HEVCSEIDisplayOrientation *s, GetBitContext *gb)
{
    const int cancelled = get_bits1(gb);

    s->present = !cancelled;
    if (cancelled)
        return 0;

    s->hflip                  = get_bits1(gb);      // hor_flip
    s->vflip                  = get_bits1(gb);      // ver_flip
    s->anticlockwise_rotation = get_bits(gb, 16);
    skip_bits1(gb);                                 // display_orientation_persistence_flag

    return 0;
}

127 128
/**
 * Parse a picture timing SEI payload.
 *
 * Only the frame/field information is interpreted, and only when the active
 * SPS signals it in its VUI: pic_struct 1 maps to a top field, 2 to a bottom
 * field, anything else to "unknown". The rest of the payload is skipped.
 *
 * @param s      SEI context; s->active_seq_parameter_set_id selects the SPS
 *               and s->picture_timing receives the result
 * @param gb     bit reader positioned at the start of the payload
 * @param ps     parameter sets, used to look up the active SPS
 * @param logctx context passed to av_log()
 * @param size   payload size in bytes
 * @return 0 on success, a negative AVERROR code if the active SPS is missing
 *         or the payload is too short to hold the frame/field information
 */
static int decode_nal_sei_pic_timing(HEVCSEIContext *s, GetBitContext *gb, const HEVCParamSets *ps,
                                     void *logctx, int size)
{
    HEVCSEIPictureTiming *h = &s->picture_timing;
    HEVCSPS *sps;

    // NOTE(review): a missing SPS is not an allocation failure, so ENOMEM
    // looks like the wrong code here; kept unchanged so callers that may
    // inspect the exact value keep working.
    if (!ps->sps_list[s->active_seq_parameter_set_id])
        return(AVERROR(ENOMEM));
    sps = (HEVCSPS*)ps->sps_list[s->active_seq_parameter_set_id]->data;

    if (sps->vui.frame_field_info_present_flag) {
        int pic_struct;

        // The frame/field information occupies one full byte. Without this
        // check an empty payload would be read past its end and the final
        // skip below would get a negative count and rewind the reader.
        if (size < 1)
            return AVERROR_INVALIDDATA;

        pic_struct = get_bits(gb, 4);
        h->picture_struct = AV_PICTURE_STRUCTURE_UNKNOWN;
        if (pic_struct == 2) {
            av_log(logctx, AV_LOG_DEBUG, "BOTTOM Field\n");
            h->picture_struct = AV_PICTURE_STRUCTURE_BOTTOM_FIELD;
        } else if (pic_struct == 1) {
            av_log(logctx, AV_LOG_DEBUG, "TOP Field\n");
            h->picture_struct = AV_PICTURE_STRUCTURE_TOP_FIELD;
        }
        skip_bits(gb, 2);                  // source_scan_type
        skip_bits1(gb);                    // duplicate_flag
        skip_bits1(gb);                    // eighth bit, completes the byte
        size--;
    }

    // Everything else in the payload is ignored.
    skip_bits_long(gb, 8 * size);

    return 0;
}

157 158
/**
 * Parse "GA94" registered user data and collect closed caption bytes.
 *
 * When the user data type code is 0x3 and the process flag is set, cc_count
 * three-byte entries are appended to s->a53_caption (captions from several
 * messages are merged, e.g. the two fields of a frame). Whatever the payload
 * contains beyond that is skipped, so the reader always ends up exactly
 * size bytes after the position at which it entered.
 *
 * @param s    caption buffer state; a53_caption / a53_caption_size are grown
 * @param gb   bit reader positioned at the user data type code
 * @param size number of payload bytes left, starting at the type code
 * @return 0 on success, a negative AVERROR code if the payload is too short,
 *         the merged buffer would exceed INT_MAX or the allocation fails
 */
static int decode_registered_user_data_closed_caption(HEVCSEIA53Caption *s, GetBitContext *gb,
                                                      int size)
{
    int user_data_type_code;
    int i;

    // One type byte plus the two header bytes read below.
    if (size < 3)
       return AVERROR(EINVAL);

    user_data_type_code = get_bits(gb, 8);
    size--;

    if (user_data_type_code == 0x3) {
        int process_cc_data_flag;
        int cc_count;

        // Always read the two header bytes completely, so the reader stays
        // byte aligned even when the process flag is clear.
        skip_bits(gb, 1);                       // reserved
        process_cc_data_flag = get_bits(gb, 1);
        skip_bits(gb, 1);
        cc_count = get_bits(gb, 5);
        skip_bits(gb, 8);                       // reserved
        size -= 2;

        // size now counts the bytes that really remain, so the entries are
        // only read when they fit entirely inside the payload.
        if (process_cc_data_flag && cc_count && size >= cc_count * 3) {
            const uint64_t new_size = (s->a53_caption_size + cc_count
                                       * UINT64_C(3));
            int ret;

            if (new_size > INT_MAX)
                return AVERROR(EINVAL);

            /* Allow merging of the cc data from two fields. */
            ret = av_reallocp(&s->a53_caption, new_size);
            if (ret < 0) {
                // av_reallocp() frees the buffer on failure; drop the stale
                // length so the two fields stay consistent.
                s->a53_caption_size = 0;
                return ret;
            }

            for (i = 0; i < cc_count * 3; i++)
                s->a53_caption[s->a53_caption_size++] = get_bits(gb, 8);
            size -= cc_count * 3;
        }
    }

    // Skip the rest of the payload (marker bits, additional data, or the
    // whole body of an unhandled type code).
    for (i = 0; i < size; i++)
        skip_bits(gb, 8);

    return 0;
}

208 209
/**
 * Parse a "user data registered by ITU-T T.35" SEI payload.
 *
 * Reads the country code (plus its extension byte when the code is 0xFF),
 * skips two further bytes and reads a 32-bit user identifier. "GA94" data
 * is handed to the closed caption parser; anything else is skipped.
 *
 * @param s    SEI context; s->a53_caption receives closed caption data
 * @param gb   bit reader positioned at the start of the payload
 * @param size payload size in bytes
 * @return 0 on success, a negative AVERROR code if the payload is too short
 *         or the closed caption parser fails
 */
static int decode_nal_sei_user_data_registered_itu_t_t35(HEVCSEIContext *s, GetBitContext *gb,
                                                         int size)
{
    uint32_t country_code;
    uint32_t user_identifier;

    // Country code (1) + two skipped bytes (2) + user identifier (4).
    if (size < 7)
        return AVERROR(EINVAL);
    size -= 7;

    country_code = get_bits(gb, 8);
    if (country_code == 0xFF) {
        // The extension byte is not part of the 7 bytes checked above;
        // without this check size would become negative and the header
        // would be read past the end of the payload.
        if (size < 1)
            return AVERROR(EINVAL);

        skip_bits(gb, 8);
        size--;
    }

    skip_bits(gb, 8);
    skip_bits(gb, 8);

    user_identifier = get_bits_long(gb, 32);

    switch (user_identifier) {
        case MKBETAG('G', 'A', '9', '4'):
            return decode_registered_user_data_closed_caption(&s->a53_caption, gb, size);
        default:
            skip_bits_long(gb, size * 8);
            break;
    }
    return 0;
}

239
/**
 * Parse an active parameter sets SEI payload.
 *
 * Only the first active SPS id is kept (in s->active_seq_parameter_set_id);
 * the leading flags and any further SPS ids are read and discarded.
 *
 * @param s      SEI context to update
 * @param gb     bit reader positioned at the start of the payload
 * @param logctx context passed to av_log()
 * @return 0 on success, AVERROR_INVALIDDATA if num_sps_ids_minus1 or the
 *         active SPS id is out of range
 */
static int decode_nal_sei_active_parameter_sets(HEVCSEIContext *s, GetBitContext *gb, void *logctx)
{
    int num_sps_ids_minus1;
    int i;
    unsigned active_seq_parameter_set_id;

    get_bits(gb, 4); // active_video_parameter_set_id
    get_bits(gb, 1); // self_contained_cvs_flag
    get_bits(gb, 1); // no_parameter_set_update_flag
    num_sps_ids_minus1 = get_ue_golomb_long(gb); // num_sps_ids_minus1

    if (num_sps_ids_minus1 < 0 || num_sps_ids_minus1 > 15) {
        av_log(logctx, AV_LOG_ERROR, "num_sps_ids_minus1 %d invalid\n", num_sps_ids_minus1);
        return AVERROR_INVALIDDATA;
    }

    active_seq_parameter_set_id = get_ue_golomb_long(gb);
    if (active_seq_parameter_set_id >= HEVC_MAX_SPS_COUNT) {
        // The id is unsigned, so it is printed with %u; large values would
        // otherwise show up as negative numbers in the log.
        av_log(logctx, AV_LOG_ERROR, "active_parameter_set_id %u invalid\n", active_seq_parameter_set_id);
        return AVERROR_INVALIDDATA;
    }
    s->active_seq_parameter_set_id = active_seq_parameter_set_id;

    // Further SPS ids are parsed only to advance the reader.
    for (i = 1; i <= num_sps_ids_minus1; i++)
        get_ue_golomb_long(gb); // active_seq_parameter_set_id[i]

    return 0;
}

268 269 270 271 272 273 274
/**
 * Parse an alternative transfer characteristics SEI payload.
 *
 * Stores the 8-bit preferred transfer characteristics value and marks the
 * information as present.
 *
 * @param s  alternative transfer state to fill in
 * @param gb bit reader positioned at the start of the payload
 * @return always 0
 */
static int decode_nal_sei_alternative_transfer(HEVCSEIAlternativeTransfer *s, GetBitContext *gb)
{
    const int transfer = get_bits(gb, 8);

    s->preferred_transfer_characteristics = transfer;
    s->present                            = 1;

    return 0;
}

275 276
/**
 * Dispatch one prefix SEI payload to the parser for its payload type.
 *
 * Unhandled payload types are logged at debug level and skipped in full.
 *
 * @param gb     bit reader positioned at the start of the payload
 * @param s      SEI context updated by the individual parsers
 * @param ps     parameter sets, needed by the picture timing parser
 * @param type   SEI payload type
 * @param size   payload size in bytes
 * @param logctx context passed to av_log()
 * @return the selected parser's result, or 0 for skipped payloads
 */
static int decode_nal_sei_prefix(GetBitContext *gb, HEVCSEIContext *s, const HEVCParamSets *ps,
                                 int type, int size, void *logctx)
{
    int ret = 0;

    switch (type) {
    case 256:  // Mismatched value from HM 8.1
        ret = decode_nal_sei_decoded_picture_hash(&s->picture_hash, gb);
        break;
    case HEVC_SEI_TYPE_FRAME_PACKING:
        ret = decode_nal_sei_frame_packing_arrangement(&s->frame_packing, gb);
        break;
    case HEVC_SEI_TYPE_DISPLAY_ORIENTATION:
        ret = decode_nal_sei_display_orientation(&s->display_orientation, gb);
        break;
    case HEVC_SEI_TYPE_PICTURE_TIMING:
        ret = decode_nal_sei_pic_timing(s, gb, ps, logctx, size);
        break;
    case HEVC_SEI_TYPE_MASTERING_DISPLAY_INFO:
        ret = decode_nal_sei_mastering_display_info(&s->mastering_display, gb);
        break;
    case HEVC_SEI_TYPE_CONTENT_LIGHT_LEVEL_INFO:
        ret = decode_nal_sei_content_light_info(&s->content_light, gb);
        break;
    case HEVC_SEI_TYPE_ACTIVE_PARAMETER_SETS:
        ret = decode_nal_sei_active_parameter_sets(s, gb, logctx);
        break;
    case HEVC_SEI_TYPE_USER_DATA_REGISTERED_ITU_T_T35:
        ret = decode_nal_sei_user_data_registered_itu_t_t35(s, gb, size);
        break;
    case HEVC_SEI_TYPE_ALTERNATIVE_TRANSFER_CHARACTERISTICS:
        ret = decode_nal_sei_alternative_transfer(&s->alternative_transfer, gb);
        break;
    default:
        // Not interpreted: step over the whole payload.
        av_log(logctx, AV_LOG_DEBUG, "Skipped PREFIX SEI %d\n", type);
        skip_bits_long(gb, 8 * size);
        break;
    }

    return ret;
}

304 305
/**
 * Handle one suffix SEI payload.
 *
 * Only the decoded picture hash is interpreted; every other payload type is
 * logged at debug level and skipped in full.
 *
 * @param gb     bit reader positioned at the start of the payload
 * @param s      SEI context; s->picture_hash receives the hash
 * @param type   SEI payload type
 * @param size   payload size in bytes
 * @param logctx context passed to av_log()
 * @return the hash parser's result, or 0 for skipped payloads
 */
static int decode_nal_sei_suffix(GetBitContext *gb, HEVCSEIContext *s,
                                 int type, int size, void *logctx)
{
    if (type == HEVC_SEI_TYPE_DECODED_PICTURE_HASH)
        return decode_nal_sei_decoded_picture_hash(&s->picture_hash, gb);

    av_log(logctx, AV_LOG_DEBUG, "Skipped SUFFIX SEI %d\n", type);
    skip_bits_long(gb, 8 * size);

    return 0;
}

317 318 319
/**
 * Parse one SEI message: its header (payload type and size) and its payload.
 *
 * Type and size are each coded as a run of 0xFF bytes followed by a final
 * byte; the value is the sum of all bytes of the run. The payload is then
 * handed to the prefix or suffix dispatcher depending on the NAL unit type.
 *
 * @param gb            bit reader positioned at the start of the message
 * @param s             SEI context updated by the payload parsers
 * @param ps            parameter sets, forwarded to the prefix parsers
 * @param nal_unit_type HEVC_NAL_SEI_PREFIX, anything else is treated as a
 *                      suffix SEI
 * @param logctx        context passed to av_log()
 * @return the payload parser's result, or AVERROR_INVALIDDATA if the header
 *         is truncated, overflows, or announces more data than is left
 */
static int decode_nal_sei_message(GetBitContext *gb, HEVCSEIContext *s,
                                  const HEVCParamSets *ps, int nal_unit_type,
                                  void *logctx)
{
    int payload_type = 0;
    int payload_size = 0;
    int byte = 0xFF;
    av_log(logctx, AV_LOG_DEBUG, "Decoding SEI\n");

    while (byte == 0xFF) {
        // At least one more type byte and one size byte must follow, and
        // the running sum must not overflow a signed int.
        if (get_bits_left(gb) < 16 || payload_type > INT_MAX - 255)
            return AVERROR_INVALIDDATA;
        byte          = get_bits(gb, 8);
        payload_type += byte;
    }
    byte = 0xFF;
    while (byte == 0xFF) {
        // The size accumulated so far can never exceed the data that is
        // left, which also bounds payload_size well below INT_MAX.
        if (get_bits_left(gb) < 8 + 8LL * payload_size)
            return AVERROR_INVALIDDATA;
        byte          = get_bits(gb, 8);
        payload_size += byte;
    }

    // Reject payloads that claim to extend past the end of the NAL unit.
    if (get_bits_left(gb) < 8LL * payload_size)
        return AVERROR_INVALIDDATA;

    if (nal_unit_type == HEVC_NAL_SEI_PREFIX) {
        return decode_nal_sei_prefix(gb, s, ps, payload_type, payload_size, logctx);
    } else { /* nal_unit_type == NAL_SEI_SUFFIX */
        return decode_nal_sei_suffix(gb, s, payload_type, payload_size, logctx);
    }
}

/**
 * Tell whether another SEI message follows in the current NAL unit.
 *
 * @param gb bit reader positioned after a complete SEI message
 * @return 1 if bits are left and the next byte is not 0x80, 0 otherwise
 */
static int more_rbsp_data(GetBitContext *gb)
{
    if (get_bits_left(gb) <= 0)
        return 0;

    // A next byte of 0x80 is taken to mean that no further message follows.
    return show_bits(gb, 8) != 0x80;
}

347 348
/**
 * Decode all SEI messages contained in one SEI NAL unit.
 *
 * At least one message is always parsed; parsing continues for as long as
 * more_rbsp_data() reports further data.
 *
 * @param gb     bit reader positioned at the first SEI message
 * @param logctx context passed to av_log()
 * @param s      SEI context updated by the payload parsers
 * @param ps     parameter sets, forwarded to the payload parsers
 * @param type   NAL unit type, selects prefix or suffix handling
 * @return 1 on success, or the first negative error code from a message
 */
int ff_hevc_decode_nal_sei(GetBitContext *gb, void *logctx, HEVCSEIContext *s,
                           const HEVCParamSets *ps, int type)
{
    for (;;) {
        const int err = decode_nal_sei_message(gb, s, ps, type, logctx);

        if (err < 0)
            return err;
        if (!more_rbsp_data(gb))
            break;
    }

    return 1;
}
359

360
/**
 * Discard the closed caption data collected so far.
 *
 * Frees the caption buffer (av_freep() also clears the pointer) and resets
 * its length to zero.
 *
 * @param s SEI context whose caption buffer is released
 */
void ff_hevc_reset_sei(HEVCSEIContext *s)
{
    HEVCSEIA53Caption *const cc = &s->a53_caption;

    av_freep(&cc->a53_caption);
    cc->a53_caption_size = 0;
}