mvdec.c 16.1 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26
/*
 * Silicon Graphics Movie demuxer
 * Copyright (c) 2012 Peter Ross
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * Silicon Graphics Movie demuxer
 */

27
#include "libavutil/channel_layout.h"
28 29 30
#include "libavutil/eval.h"
#include "libavutil/intreadwrite.h"
#include "libavutil/rational.h"
31

32 33 34
#include "avformat.h"
#include "internal.h"

35
/**
 * Demuxer private state (used as AVFormatContext.priv_data).
 */
typedef struct MvContext {
    int nb_video_tracks;  ///< video track count, set from "__NUM_I_TRACKS"
    int nb_audio_tracks;  ///< audio track count, set from "__NUM_A_TRACKS"

    int eof_count;        ///< number of streams that have finished
    int stream_index;     ///< current stream index
    int frame[2];         ///< frame nb for current stream

    int acompression;     ///< compression level for audio stream
    int aformat;          ///< audio format
} MvContext;

#define AUDIO_FORMAT_SIGNED 401

49
static int mv_probe(const AVProbeData *p)
50
{
51 52
    if (AV_RB32(p->buf) == MKBETAG('M', 'O', 'V', 'I') &&
        AV_RB16(p->buf + 4) < 3)
53 54 55 56
        return AVPROBE_SCORE_MAX;
    return 0;
}

57
/**
 * Read a variable value of @p size bytes as a NUL-terminated string.
 *
 * If the string read by avio_get_str() is shorter than @p size, the
 * remaining bytes of the field are skipped.
 *
 * @param pb   input context
 * @param size size of the value field in bytes
 * @return newly allocated string that the caller must release with
 *         av_free(), or NULL if @p size is negative or INT_MAX, or if the
 *         allocation fails (nothing is read from @p pb in those cases)
 */
static char *var_read_string(AVIOContext *pb, int size)
{
    int n;
    char *str;

    /* size + 1 below must not overflow */
    if (size < 0 || size == INT_MAX)
        return NULL;

    str = av_malloc(size + 1);
    if (!str)
        return NULL;
    n = avio_get_str(pb, size, str, size + 1);
    if (n < size)
        avio_skip(pb, size - n);
    return str;
}

/**
 * Read a variable value of @p size bytes and parse it as a decimal integer.
 *
 * @param pb   input context
 * @param size size of the value field in bytes
 * @return the value parsed by strtol() (base 10) converted to int, or 0 if
 *         the string could not be read
 */
static int var_read_int(AVIOContext *pb, int size)
{
    int v;
    char *s = var_read_string(pb, size);
    if (!s)
        return 0;
    v = strtol(s, NULL, 10);
    av_free(s);
    return v;
}

/**
 * Read a variable value of @p size bytes and convert it to a rational.
 *
 * The text is parsed with av_strtod() and converted with av_d2q() using
 * INT_MAX as the maximum numerator/denominator.
 *
 * @param pb   input context
 * @param size size of the value field in bytes
 * @return the converted value, or { 0, 0 } if the string could not be read
 */
static AVRational var_read_float(AVIOContext *pb, int size)
{
    AVRational v;
    char *s = var_read_string(pb, size);
    if (!s)
        return (AVRational) { 0, 0 };
    v = av_d2q(av_strtod(s, NULL), INT_MAX);
    av_free(s);
    return v;
}

/**
 * Read a variable value of @p size bytes and store it in the container
 * metadata under the key @p tag.
 *
 * The string is handed to the dictionary with AV_DICT_DONT_STRDUP_VAL, so it
 * is not freed here. Nothing is stored if the string could not be read.
 */
static void var_read_metadata(AVFormatContext *avctx, const char *tag, int size)
{
    char *text = var_read_string(avctx->pb, size);

    if (!text)
        return;

    av_dict_set(&avctx->metadata, tag, text, AV_DICT_DONT_STRDUP_VAL);
}

103 104
/**
 * Validate and store the audio channel count of a stream.
 *
 * The channel layout is set to mono for one channel and to stereo for every
 * other (positive) count.
 *
 * @param avctx    logging context
 * @param st       stream whose codec parameters are updated
 * @param channels channel count read from the file
 * @return 0 on success, AVERROR_INVALIDDATA if @p channels is not positive
 */
static int set_channels(AVFormatContext *avctx, AVStream *st, int channels)
{
    if (channels <= 0) {
        av_log(avctx, AV_LOG_ERROR, "Channel count %d invalid.\n", channels);
        return AVERROR_INVALIDDATA;
    }
    st->codecpar->channels       = channels;
    st->codecpar->channel_layout = (st->codecpar->channels == 1) ? AV_CH_LAYOUT_MONO
                                                                 : AV_CH_LAYOUT_STEREO;
    return 0;
}

115 116 117 118
/**
 * Parse global variable
 * @return < 0 if unknown
 */
119 120
static int parse_global_var(AVFormatContext *avctx, AVStream *st,
                            const char *name, int size)
121 122 123 124 125 126 127 128 129
{
    MvContext *mv = avctx->priv_data;
    AVIOContext *pb = avctx->pb;
    if (!strcmp(name, "__NUM_I_TRACKS")) {
        mv->nb_video_tracks = var_read_int(pb, size);
    } else if (!strcmp(name, "__NUM_A_TRACKS")) {
        mv->nb_audio_tracks = var_read_int(pb, size);
    } else if (!strcmp(name, "COMMENT") || !strcmp(name, "TITLE")) {
        var_read_metadata(avctx, name, size);
130 131
    } else if (!strcmp(name, "LOOP_MODE") || !strcmp(name, "NUM_LOOPS") ||
               !strcmp(name, "OPTIMIZED")) {
132 133
        avio_skip(pb, size); // ignore
    } else
134
        return AVERROR_INVALIDDATA;
135 136 137 138 139 140 141 142

    return 0;
}

/**
 * Parse audio variable
 * @return < 0 if unknown
 */
143 144
static int parse_audio_var(AVFormatContext *avctx, AVStream *st,
                           const char *name, int size)
145
{
146
    MvContext *mv = avctx->priv_data;
147 148 149 150
    AVIOContext *pb = avctx->pb;
    if (!strcmp(name, "__DIR_COUNT")) {
        st->nb_frames = var_read_int(pb, size);
    } else if (!strcmp(name, "AUDIO_FORMAT")) {
151
        mv->aformat = var_read_int(pb, size);
152
    } else if (!strcmp(name, "COMPRESSION")) {
153
        mv->acompression = var_read_int(pb, size);
154 155 156
    } else if (!strcmp(name, "DEFAULT_VOL")) {
        var_read_metadata(avctx, name, size);
    } else if (!strcmp(name, "NUM_CHANNELS")) {
157
        return set_channels(avctx, st, var_read_int(pb, size));
158
    } else if (!strcmp(name, "SAMPLE_RATE")) {
159 160
        st->codecpar->sample_rate = var_read_int(pb, size);
        avpriv_set_pts_info(st, 33, 1, st->codecpar->sample_rate);
161
    } else if (!strcmp(name, "SAMPLE_WIDTH")) {
162
        st->codecpar->bits_per_coded_sample = var_read_int(pb, size) * 8;
163
    } else
164 165
        return AVERROR_INVALIDDATA;

166 167 168 169 170 171 172
    return 0;
}

/**
 * Parse video variable
 * @return < 0 if unknown
 */
173 174
static int parse_video_var(AVFormatContext *avctx, AVStream *st,
                           const char *name, int size)
175 176 177 178 179
{
    AVIOContext *pb = avctx->pb;
    if (!strcmp(name, "__DIR_COUNT")) {
        st->nb_frames = st->duration = var_read_int(pb, size);
    } else if (!strcmp(name, "COMPRESSION")) {
180
        char *str = var_read_string(pb, size);
181 182
        if (!str)
            return AVERROR_INVALIDDATA;
183
        if (!strcmp(str, "1")) {
184
            st->codecpar->codec_id = AV_CODEC_ID_MVC1;
185
        } else if (!strcmp(str, "2")) {
186 187
            st->codecpar->format = AV_PIX_FMT_ABGR;
            st->codecpar->codec_id = AV_CODEC_ID_RAWVIDEO;
188
        } else if (!strcmp(str, "3")) {
189
            st->codecpar->codec_id = AV_CODEC_ID_SGIRLE;
190
        } else if (!strcmp(str, "10")) {
191
            st->codecpar->codec_id = AV_CODEC_ID_MJPEG;
192
        } else if (!strcmp(str, "MVC2")) {
193
            st->codecpar->codec_id = AV_CODEC_ID_MVC2;
194
        } else {
195
            avpriv_request_sample(avctx, "Video compression %s", str);
196 197 198
        }
        av_free(str);
    } else if (!strcmp(name, "FPS")) {
199 200
        AVRational fps = var_read_float(pb, size);
        avpriv_set_pts_info(st, 64, fps.den, fps.num);
201
        st->avg_frame_rate = fps;
202
    } else if (!strcmp(name, "HEIGHT")) {
203
        st->codecpar->height = var_read_int(pb, size);
204 205 206
    } else if (!strcmp(name, "PIXEL_ASPECT")) {
        st->sample_aspect_ratio = var_read_float(pb, size);
        av_reduce(&st->sample_aspect_ratio.num, &st->sample_aspect_ratio.den,
207 208
                  st->sample_aspect_ratio.num, st->sample_aspect_ratio.den,
                  INT_MAX);
209
    } else if (!strcmp(name, "WIDTH")) {
210
        st->codecpar->width = var_read_int(pb, size);
211 212
    } else if (!strcmp(name, "ORIENTATION")) {
        if (var_read_int(pb, size) == 1101) {
213
            st->codecpar->extradata      = av_strdup("BottomUp");
214 215
            if (!st->codecpar->extradata)
                return AVERROR(ENOMEM);
216
            st->codecpar->extradata_size = 9;
217 218 219 220 221 222
        }
    } else if (!strcmp(name, "Q_SPATIAL") || !strcmp(name, "Q_TEMPORAL")) {
        var_read_metadata(avctx, name, size);
    } else if (!strcmp(name, "INTERLACING") || !strcmp(name, "PACKING")) {
        avio_skip(pb, size); // ignore
    } else
223 224
        return AVERROR_INVALIDDATA;

225 226 227
    return 0;
}

228
/**
 * Read a table of named variables and hand each entry to @p parse.
 *
 * The table starts with 4 skipped bytes, a big-endian 32-bit entry count and
 * 4 more skipped bytes. Each entry is a 16-byte name followed by a
 * big-endian 32-bit value size; the value itself is consumed by @p parse.
 *
 * @param avctx demuxer context
 * @param st    stream passed through to @p parse (may be NULL)
 * @param parse callback that consumes the value; a negative return is
 *              treated as "unknown variable" and the value is skipped
 * @return 0 on success, AVERROR_EOF if the input ends before all entries
 *         were read, AVERROR_INVALIDDATA on a negative entry size
 *
 * NOTE(review): any negative return from @p parse triggers a skip of
 * @p size bytes, including failures reported after the callback has already
 * consumed the value - confirm whether that double skip is intended.
 */
static int read_table(AVFormatContext *avctx, AVStream *st,
                      int (*parse)(AVFormatContext *avctx, AVStream *st,
                                   const char *name, int size))
{
    /* unsigned index: count is an untrusted 32-bit value and may exceed
     * INT_MAX, which would overflow a signed loop counter */
    unsigned count, i;
    AVIOContext *pb = avctx->pb;

    avio_skip(pb, 4);
    count = avio_rb32(pb);
    avio_skip(pb, 4);
    for (i = 0; i < count; i++) {
        /* zero-initialised so a short read never leaves stale stack bytes
         * in the name that is compared below */
        char name[17] = { 0 };
        int size;

        if (avio_feof(pb))
            return AVERROR_EOF;

        avio_read(pb, name, 16);
        name[sizeof(name) - 1] = 0;
        size = avio_rb32(pb);
        if (size < 0) {
            av_log(avctx, AV_LOG_ERROR, "entry size %d is invalid\n", size);
            return AVERROR_INVALIDDATA;
        }
        if (parse(avctx, st, name, size) < 0) {
            avpriv_request_sample(avctx, "Variable %s", name);
            avio_skip(pb, size);
        }
    }
    return 0;
}

/**
 * Read the frame index of one stream and add its entries to the stream.
 *
 * Each of the st->nb_frames records holds a big-endian 32-bit position and
 * a big-endian 32-bit size, followed by 8 skipped bytes. Audio timestamps
 * advance by size / (channels * 2) per entry, video timestamps by one.
 * Reading stops early once the input is exhausted.
 *
 * @param pb input context positioned at the first index record
 * @param st stream receiving the index entries; for audio streams
 *           st->codecpar->channels must be non-zero
 */
static void read_index(AVIOContext *pb, AVStream *st)
{
    uint64_t timestamp = 0;
    int i;
    for (i = 0; i < st->nb_frames; i++) {
        uint32_t pos  = avio_rb32(pb);
        uint32_t size = avio_rb32(pb);
        avio_skip(pb, 8);
        /* truncated file: do not keep adding garbage entries for a frame
         * count that the file cannot back up */
        if (avio_feof(pb))
            return;
        av_add_index_entry(st, pos, timestamp, size, 0, AVINDEX_KEYFRAME);
        if (st->codecpar->codec_type == AVMEDIA_TYPE_AUDIO) {
            /* 64-bit divisor: channels * 2 could overflow int */
            timestamp += size / (st->codecpar->channels * 2LL);
        } else {
            timestamp++;
        }
    }
}

/**
 * Read the file header, create the streams and build their frame indexes.
 *
 * Two layouts are handled:
 *  - version 2: a fixed-layout header describing one audio and one video
 *    stream, followed by a combined index;
 *  - version 0 with a following 16-bit value of 3: tables of named variables
 *    (global, then audio, then video) followed by per-stream indexes.
 *
 * @param avctx demuxer context
 * @return 0 on success, a negative AVERROR code otherwise
 *         (AVERROR_PATCHWELCOME for unsupported versions or stream counts)
 */
static int mv_read_header(AVFormatContext *avctx)
{
    MvContext *mv = avctx->priv_data;
    AVIOContext *pb = avctx->pb;
    AVStream *ast = NULL, *vst = NULL; //initialization to suppress warning
    int version, i;
    int ret;

    avio_skip(pb, 4);

    version = avio_rb16(pb);
    if (version == 2) {
        uint64_t timestamp;
        int v;
        avio_skip(pb, 22);

        /* allocate audio track first to prevent unnecessary seeking
         * (audio packet always precede video packet for a given frame) */
        ast = avformat_new_stream(avctx, NULL);
        if (!ast)
            return AVERROR(ENOMEM);

        vst = avformat_new_stream(avctx, NULL);
        if (!vst)
            return AVERROR(ENOMEM);
        avpriv_set_pts_info(vst, 64, 1, 15);
        vst->codecpar->codec_type = AVMEDIA_TYPE_VIDEO;
        vst->avg_frame_rate    = av_inv_q(vst->time_base);
        vst->nb_frames         = avio_rb32(pb);
        v = avio_rb32(pb);
        switch (v) {
        case 1:
            vst->codecpar->codec_id = AV_CODEC_ID_MVC1;
            break;
        case 2:
            vst->codecpar->format = AV_PIX_FMT_ARGB;
            vst->codecpar->codec_id = AV_CODEC_ID_RAWVIDEO;
            break;
        default:
            avpriv_request_sample(avctx, "Video compression %i", v);
            break;
        }
        vst->codecpar->codec_tag = 0;
        vst->codecpar->width     = avio_rb32(pb);
        vst->codecpar->height    = avio_rb32(pb);
        avio_skip(pb, 12);

        ast->codecpar->codec_type  = AVMEDIA_TYPE_AUDIO;
        ast->nb_frames          = vst->nb_frames;
        ast->codecpar->sample_rate = avio_rb32(pb);
        if (ast->codecpar->sample_rate <= 0) {
            av_log(avctx, AV_LOG_ERROR, "Invalid sample rate %d\n", ast->codecpar->sample_rate);
            return AVERROR_INVALIDDATA;
        }
        avpriv_set_pts_info(ast, 33, 1, ast->codecpar->sample_rate);
        if (set_channels(avctx, ast, avio_rb32(pb)) < 0)
            return AVERROR_INVALIDDATA;

        v = avio_rb32(pb);
        if (v == AUDIO_FORMAT_SIGNED) {
            ast->codecpar->codec_id = AV_CODEC_ID_PCM_S16BE;
        } else {
            avpriv_request_sample(avctx, "Audio compression (format %i)", v);
        }

        avio_skip(pb, 12);
        var_read_metadata(avctx, "title", 0x80);
        var_read_metadata(avctx, "comment", 0x100);
        avio_skip(pb, 0x80);

        /* combined index: one record per frame holding the position and the
         * audio and video sizes; video data directly follows the audio */
        timestamp = 0;
        for (i = 0; i < vst->nb_frames; i++) {
            uint32_t pos   = avio_rb32(pb);
            uint32_t asize = avio_rb32(pb);
            uint32_t vsize = avio_rb32(pb);
            if (avio_feof(pb))
                return AVERROR_INVALIDDATA;
            avio_skip(pb, 8);
            av_add_index_entry(ast, pos, timestamp, asize, 0, AVINDEX_KEYFRAME);
            av_add_index_entry(vst, pos + asize, i, vsize, 0, AVINDEX_KEYFRAME);
            /* 64-bit divisor: channels * 2 could overflow int */
            timestamp += asize / (ast->codecpar->channels * 2LL);
        }
    } else if (!version && avio_rb16(pb) == 3) {
        avio_skip(pb, 4);

        if ((ret = read_table(avctx, NULL, parse_global_var)) < 0)
            return ret;

        if (mv->nb_audio_tracks < 0  || mv->nb_video_tracks < 0 ||
           (mv->nb_audio_tracks == 0 && mv->nb_video_tracks == 0)) {
            av_log(avctx, AV_LOG_ERROR, "Stream count is invalid.\n");
            return AVERROR_INVALIDDATA;
        }

        if (mv->nb_audio_tracks > 1) {
            avpriv_request_sample(avctx, "Multiple audio streams support");
            return AVERROR_PATCHWELCOME;
        } else if (mv->nb_audio_tracks) {
            ast = avformat_new_stream(avctx, NULL);
            if (!ast)
                return AVERROR(ENOMEM);
            ast->codecpar->codec_type = AVMEDIA_TYPE_AUDIO;
            /* store the result in ret: returning a stale ret here would
             * report success although the audio table could not be read */
            if ((ret = read_table(avctx, ast, parse_audio_var)) < 0)
                return ret;
            if (mv->acompression == 100 &&
                mv->aformat == AUDIO_FORMAT_SIGNED &&
                ast->codecpar->bits_per_coded_sample == 16) {
                ast->codecpar->codec_id = AV_CODEC_ID_PCM_S16BE;
            } else {
                /* NOTE(review): the third value logged is
                 * bits_per_coded_sample although the message labels it "sr" */
                avpriv_request_sample(avctx,
                                      "Audio compression %i (format %i, sr %i)",
                                      mv->acompression, mv->aformat,
                                      ast->codecpar->bits_per_coded_sample);
                ast->codecpar->codec_id = AV_CODEC_ID_NONE;
            }
            /* read_index() divides by the channel count */
            if (ast->codecpar->channels <= 0) {
                av_log(avctx, AV_LOG_ERROR, "No valid channel count found.\n");
                return AVERROR_INVALIDDATA;
            }
        }

        if (mv->nb_video_tracks > 1) {
            avpriv_request_sample(avctx, "Multiple video streams support");
            return AVERROR_PATCHWELCOME;
        } else if (mv->nb_video_tracks) {
            vst = avformat_new_stream(avctx, NULL);
            if (!vst)
                return AVERROR(ENOMEM);
            vst->codecpar->codec_type = AVMEDIA_TYPE_VIDEO;
            if ((ret = read_table(avctx, vst, parse_video_var))<0)
                return ret;
        }

        if (mv->nb_audio_tracks)
            read_index(pb, ast);

        if (mv->nb_video_tracks)
            read_index(pb, vst);
    } else {
        avpriv_request_sample(avctx, "Version %i", version);
        return AVERROR_PATCHWELCOME;
    }

    return 0;
}

/**
 * Read the next packet, alternating between streams after every packet.
 *
 * The packet for the current stream is located through the stream's index;
 * the input is skipped forward, or seeked backwards when it is seekable, to
 * reach the indexed position.
 *
 * @param avctx demuxer context
 * @param pkt   packet to fill
 * @return 0 on success; AVERROR(EAGAIN) when the current stream has no more
 *         index entries but not all streams are known to be finished;
 *         AVERROR_EOF once eof_count reaches the number of streams;
 *         AVERROR(EIO) if a backward seek is needed on non-seekable input;
 *         another negative AVERROR code on I/O failure
 */
static int mv_read_packet(AVFormatContext *avctx, AVPacket *pkt)
{
    MvContext *mv = avctx->priv_data;
    AVIOContext *pb = avctx->pb;
    AVStream *st = avctx->streams[mv->stream_index];
    const AVIndexEntry *index;
    int frame = mv->frame[mv->stream_index];
    int64_t ret;
    uint64_t pos;

    if (frame < st->nb_index_entries) {
        index = &st->index_entries[frame];
        pos   = avio_tell(pb);
        if (index->pos > pos)
            avio_skip(pb, index->pos - pos);
        else if (index->pos < pos) {
            if (!(pb->seekable & AVIO_SEEKABLE_NORMAL))
                return AVERROR(EIO);
            ret = avio_seek(pb, index->pos, SEEK_SET);
            if (ret < 0)
                return ret;
        }
        ret = av_get_packet(pb, pkt, index->size);
        if (ret < 0)
            return ret;

        pkt->stream_index = mv->stream_index;
        pkt->pts          = index->timestamp;
        pkt->flags       |= AV_PKT_FLAG_KEY;

        mv->frame[mv->stream_index]++;
        mv->eof_count = 0;
    } else {
        mv->eof_count++;
        if (mv->eof_count >= avctx->nb_streams)
            return AVERROR_EOF;

        // avoid returning 0 without a packet
        /* NOTE(review): this return happens before stream_index is advanced
         * below, so the same stream is retried on the next call - confirm
         * this is intended when the streams have different frame counts. */
        return AVERROR(EAGAIN);
    }

    mv->stream_index++;
    if (mv->stream_index >= avctx->nb_streams)
        mv->stream_index = 0;

    return 0;
}

472 473
/**
 * Seek to the index entry matching @p timestamp in stream @p stream_index.
 *
 * No I/O is performed here; the frame number found is stored as the next
 * frame for every stream.
 *
 * @param avctx        demuxer context
 * @param stream_index stream whose index is searched
 * @param timestamp    target timestamp
 * @param flags        AVSEEK_FLAG_* flags; frame and byte seeking are
 *                     not supported
 * @return 0 on success, AVERROR(ENOSYS) for unsupported flags, AVERROR(EIO)
 *         if the input is not seekable, AVERROR_INVALIDDATA if no matching
 *         index entry exists
 */
static int mv_read_seek(AVFormatContext *avctx, int stream_index,
                        int64_t timestamp, int flags)
{
    MvContext *mv = avctx->priv_data;
    AVStream *st = avctx->streams[stream_index];
    int frame, i;

    if ((flags & AVSEEK_FLAG_FRAME) || (flags & AVSEEK_FLAG_BYTE))
        return AVERROR(ENOSYS);

    if (!(avctx->pb->seekable & AVIO_SEEKABLE_NORMAL))
        return AVERROR(EIO);

    frame = av_index_search_timestamp(st, timestamp, flags);
    if (frame < 0)
        return AVERROR_INVALIDDATA;

    for (i = 0; i < avctx->nb_streams; i++)
        mv->frame[i] = frame;
    return 0;
}

/**
 * Demuxer definition for the "mv" (Silicon Graphics Movie) format: wires up
 * the probe, header, packet and seek callbacks defined in this file and
 * sizes the private context as MvContext.
 */
AVInputFormat ff_mv_demuxer = {
    .name           = "mv",
    .long_name      = NULL_IF_CONFIG_SMALL("Silicon Graphics Movie"),
    .priv_data_size = sizeof(MvContext),
    .read_probe     = mv_probe,
    .read_header    = mv_read_header,
    .read_packet    = mv_read_packet,
    .read_seek      = mv_read_seek,
};