/*
 * AIFF/AIFF-C demuxer
 * Copyright (c) 2006  Patrick Guimond
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

22
#include "libavutil/intreadwrite.h"
23
#include "libavutil/mathematics.h"
24
#include "libavutil/dict.h"
25
#include "avformat.h"
26
#include "internal.h"
27
#include "pcm.h"
28
#include "aiff.h"
29
#include "isom.h"
30
#include "id3v2.h"
31
#include "mov_chan.h"
32 33 34 35

/* Version value used for plain AIFF input: selected when the FORM type is
 * 'AIFF', or when the COMM chunk is too short to carry a compression tag. */
#define AIFF                    0
/* Default AIFF-C version assumed by the header parser until an FVER chunk
 * overrides it; the compression tag in COMM is only read for this version. */
#define AIFF_C_VERSION1         0xA2805140

36
/** Demuxer private state, stored in AVFormatContext.priv_data. */
typedef struct AIFFInputContext {
    /* Absolute stream position just past the SSND chunk payload; packets are
     * never read beyond this point. */
    int64_t data_end;
    /* Duration of one block_align-sized block, in units of 1/sample_rate
     * (1 for the PCM variants). */
    int block_duration;
} AIFFInputContext;

41
static enum AVCodecID aiff_codec_get_id(int bps)
42 43
{
    if (bps <= 8)
44
        return AV_CODEC_ID_PCM_S8;
45
    if (bps <= 16)
46
        return AV_CODEC_ID_PCM_S16BE;
47
    if (bps <= 24)
48
        return AV_CODEC_ID_PCM_S24BE;
49
    if (bps <= 32)
50
        return AV_CODEC_ID_PCM_S32BE;
51 52

    /* bigger than 32 isn't allowed  */
53
    return AV_CODEC_ID_NONE;
54 55 56
}

/* returns the size of the found tag */
57
static int get_tag(AVIOContext *pb, uint32_t * tag)
58 59 60
{
    int size;

61
    if (avio_feof(pb))
62
        return AVERROR(EIO);
63

64 65
    *tag = avio_rl32(pb);
    size = avio_rb32(pb);
66 67 68 69 70 71 72 73

    if (size < 0)
        size = 0x7fffffff;

    return size;
}

/* Metadata string read */
74
static void get_meta(AVFormatContext *s, const char *key, int size)
75
{
76 77
    uint8_t *str = av_malloc(size+1);

78 79 80 81 82 83 84 85
    if (str) {
        int res = avio_read(s->pb, str, size);
        if (res < 0){
            av_free(str);
            return;
        }
        size += (size&1)-res;
        str[res] = 0;
86
        av_dict_set(&s->metadata, key, str, AV_DICT_DONT_STRDUP_VAL);
87 88 89 90
    }else
        size+= size&1;

    avio_skip(s->pb, size);
91 92 93
}

/* Returns the number of sound data frames or negative on error */
94
static int get_aiff_header(AVFormatContext *s, int size,
95
                                    unsigned version)
96
{
97
    AVIOContext *pb        = s->pb;
98
    AVCodecParameters *par = s->streams[0]->codecpar;
99
    AIFFInputContext *aiff = s->priv_data;
100 101
    int exp;
    uint64_t val;
102
    int sample_rate;
103 104 105 106
    unsigned int num_frames;

    if (size & 1)
        size++;
107 108
    par->codec_type = AVMEDIA_TYPE_AUDIO;
    par->channels = avio_rb16(pb);
109
    num_frames = avio_rb32(pb);
110
    par->bits_per_coded_sample = avio_rb16(pb);
111

112
    exp = avio_rb16(pb) - 16383 - 63;
113
    val = avio_rb64(pb);
114 115 116 117 118 119 120 121
    if (exp <-63 || exp >63) {
        av_log(s, AV_LOG_ERROR, "exp %d is out of range\n", exp);
        return AVERROR_INVALIDDATA;
    }
    if (exp >= 0)
        sample_rate = val << exp;
    else
        sample_rate = (val + (1ULL<<(-exp-1))) >> -exp;
122
    par->sample_rate = sample_rate;
123 124
    size -= 18;

125
    /* get codec id for AIFF-C */
126 127 128
    if (size < 4) {
        version = AIFF;
    } else if (version == AIFF_C_VERSION1) {
129 130
        par->codec_tag = avio_rl32(pb);
        par->codec_id  = ff_codec_get_id(ff_codec_aiff_tags, par->codec_tag);
131
        if (par->codec_id == AV_CODEC_ID_NONE) {
132
            char tag[32];
133
            av_get_codec_tag_string(tag, sizeof(tag), par->codec_tag);
134 135
            avpriv_request_sample(s, "unknown or unsupported codec tag: %s", tag);
        }
136 137
        size -= 4;
    }
138

139 140 141
    if (version != AIFF_C_VERSION1 || par->codec_id == AV_CODEC_ID_PCM_S16BE) {
        par->codec_id = aiff_codec_get_id(par->bits_per_coded_sample);
        par->bits_per_coded_sample = av_get_bits_per_sample(par->codec_id);
142 143
        aiff->block_duration = 1;
    } else {
144
        switch (par->codec_id) {
145 146 147 148 149
        case AV_CODEC_ID_PCM_F32BE:
        case AV_CODEC_ID_PCM_F64BE:
        case AV_CODEC_ID_PCM_S16LE:
        case AV_CODEC_ID_PCM_ALAW:
        case AV_CODEC_ID_PCM_MULAW:
150
            aiff->block_duration = 1;
151
            break;
152
        case AV_CODEC_ID_ADPCM_IMA_QT:
153
            par->block_align = 34 * par->channels;
154
            break;
155
        case AV_CODEC_ID_MACE3:
156
            par->block_align = 2 * par->channels;
157
            break;
158
        case AV_CODEC_ID_ADPCM_G726LE:
159
            par->bits_per_coded_sample = 5;
160
        case AV_CODEC_ID_ADPCM_IMA_WS:
161
        case AV_CODEC_ID_ADPCM_G722:
162
        case AV_CODEC_ID_MACE6:
163
        case AV_CODEC_ID_SDX2_DPCM:
164
            par->block_align = 1 * par->channels;
Baptiste Coudurier's avatar
Baptiste Coudurier committed
165
            break;
166
        case AV_CODEC_ID_GSM:
167
            par->block_align = 33;
168
            break;
169
        default:
170
            aiff->block_duration = 1;
171
            break;
172
        }
173 174 175
        if (par->block_align > 0)
            aiff->block_duration = av_get_audio_frame_duration2(par,
                                                                par->block_align);
176 177 178 179
    }

    /* Block align needs to be computed in all cases, as the definition
     * is specific to applications -> here we use the WAVE format definition */
180
    if (!par->block_align)
181
        par->block_align = (av_get_bits_per_sample(par->codec_id) * par->channels) >> 3;
182

183
    if (aiff->block_duration) {
184 185
        par->bit_rate = par->sample_rate * (par->block_align << 3) /
                        aiff->block_duration;
186
    }
187 188 189

    /* Chunk is over */
    if (size)
190
        avio_skip(pb, size);
191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207

    return num_frames;
}

/**
 * Probe callback: recognise an AIFF or AIFF-C file by its 12-byte header.
 *
 * @param p probe data; bytes 0-3 and 8-11 of p->buf are inspected
 * @return AVPROBE_SCORE_MAX if the header matches, 0 otherwise
 */
static int aiff_probe(AVProbeData *p)
{
    /* container magic "FORM" at offset 0 */
    if (p->buf[0] != 'F' || p->buf[1] != 'O' ||
        p->buf[2] != 'R' || p->buf[3] != 'M')
        return 0;

    /* form type at offset 8 starts with "AIF" ... */
    if (p->buf[8] != 'A' || p->buf[9] != 'I' || p->buf[10] != 'F')
        return 0;

    /* ... and ends in 'F' (AIFF) or 'C' (AIFC) */
    if (p->buf[11] != 'F' && p->buf[11] != 'C')
        return 0;

    return AVPROBE_SCORE_MAX;
}

/* aiff input */
208
static int aiff_read_header(AVFormatContext *s)
209
{
210
    int ret, size, filesize;
211
    int64_t offset = 0, position;
212 213
    uint32_t tag;
    unsigned version = AIFF_C_VERSION1;
214
    AVIOContext *pb = s->pb;
215
    AVStream * st;
216
    AIFFInputContext *aiff = s->priv_data;
217
    ID3v2ExtraMeta *id3v2_extra_meta = NULL;
218 219 220 221 222 223 224

    /* check FORM header */
    filesize = get_tag(pb, &tag);
    if (filesize < 0 || tag != MKTAG('F', 'O', 'R', 'M'))
        return AVERROR_INVALIDDATA;

    /* AIFF data type */
225
    tag = avio_rl32(pb);
226 227 228 229 230 231 232
    if (tag == MKTAG('A', 'I', 'F', 'F'))       /* Got an AIFF file */
        version = AIFF;
    else if (tag != MKTAG('A', 'I', 'F', 'C'))  /* An AIFF-C file then */
        return AVERROR_INVALIDDATA;

    filesize -= 4;

233
    st = avformat_new_stream(s, NULL);
234
    if (!st)
235
        return AVERROR(ENOMEM);
236 237 238 239

    while (filesize > 0) {
        /* parse different chunks */
        size = get_tag(pb, &tag);
240

241
        if (size == AVERROR_EOF && offset > 0 && st->codecpar->block_align) {
242 243 244
            av_log(s, AV_LOG_WARNING, "header parser hit EOF\n");
            goto got_sound;
        }
245 246 247 248 249 250
        if (size < 0)
            return size;

        filesize -= size + 8;

        switch (tag) {
Baptiste Coudurier's avatar
Baptiste Coudurier committed
251 252
        case MKTAG('C', 'O', 'M', 'M'):     /* Common chunk */
            /* Then for the complete header info */
253
            st->nb_frames = get_aiff_header(s, size, version);
Baptiste Coudurier's avatar
Baptiste Coudurier committed
254 255 256 257 258
            if (st->nb_frames < 0)
                return st->nb_frames;
            if (offset > 0) // COMM is after SSND
                goto got_sound;
            break;
259
        case MKTAG('I', 'D', '3', ' '):
260
            position = avio_tell(pb);
261
            ff_id3v2_read(s, ID3v2_DEFAULT_MAGIC, &id3v2_extra_meta, size);
262 263 264 265 266
            if (id3v2_extra_meta)
                if ((ret = ff_id3v2_parse_apic(s, &id3v2_extra_meta)) < 0) {
                    ff_id3v2_free_extra_meta(&id3v2_extra_meta);
                    return ret;
                }
267
            ff_id3v2_free_extra_meta(&id3v2_extra_meta);
268 269
            if (position + size > avio_tell(pb))
                avio_skip(pb, position + size - avio_tell(pb));
270
            break;
Baptiste Coudurier's avatar
Baptiste Coudurier committed
271
        case MKTAG('F', 'V', 'E', 'R'):     /* Version chunk */
272
            version = avio_rb32(pb);
Baptiste Coudurier's avatar
Baptiste Coudurier committed
273 274
            break;
        case MKTAG('N', 'A', 'M', 'E'):     /* Sample name chunk */
275
            get_meta(s, "title"    , size);
Baptiste Coudurier's avatar
Baptiste Coudurier committed
276 277
            break;
        case MKTAG('A', 'U', 'T', 'H'):     /* Author chunk */
278
            get_meta(s, "author"   , size);
Baptiste Coudurier's avatar
Baptiste Coudurier committed
279 280
            break;
        case MKTAG('(', 'c', ')', ' '):     /* Copyright chunk */
281
            get_meta(s, "copyright", size);
Baptiste Coudurier's avatar
Baptiste Coudurier committed
282 283
            break;
        case MKTAG('A', 'N', 'N', 'O'):     /* Annotation chunk */
284
            get_meta(s, "comment"  , size);
Baptiste Coudurier's avatar
Baptiste Coudurier committed
285 286
            break;
        case MKTAG('S', 'S', 'N', 'D'):     /* Sampled sound chunk */
287
            aiff->data_end = avio_tell(pb) + size;
288 289
            offset = avio_rb32(pb);      /* Offset of sound data */
            avio_rb32(pb);               /* BlockSize... don't care */
290
            offset += avio_tell(pb);    /* Compute absolute data offset */
291
            if (st->codecpar->block_align && !pb->seekable)    /* Assume COMM already parsed */
Baptiste Coudurier's avatar
Baptiste Coudurier committed
292
                goto got_sound;
293
            if (!pb->seekable) {
Baptiste Coudurier's avatar
Baptiste Coudurier committed
294 295 296
                av_log(s, AV_LOG_ERROR, "file is not seekable\n");
                return -1;
            }
297
            avio_skip(pb, size - 8);
Baptiste Coudurier's avatar
Baptiste Coudurier committed
298
            break;
299
        case MKTAG('w', 'a', 'v', 'e'):
300 301
            if ((uint64_t)size > (1<<30))
                return -1;
302
            if (ff_get_extradata(s, st->codecpar, pb, size) < 0)
303
                return AVERROR(ENOMEM);
304 305 306 307
            if (st->codecpar->codec_id == AV_CODEC_ID_QDM2 && size>=12*4 && !st->codecpar->block_align) {
                st->codecpar->block_align = AV_RB32(st->codecpar->extradata+11*4);
                aiff->block_duration = AV_RB32(st->codecpar->extradata+9*4);
            } else if (st->codecpar->codec_id == AV_CODEC_ID_QCELP) {
308 309
                char rate = 0;
                if (size >= 25)
310
                    rate = st->codecpar->extradata[24];
311 312
                switch (rate) {
                case 'H': // RATE_HALF
313
                    st->codecpar->block_align = 17;
314 315 316
                    break;
                case 'F': // RATE_FULL
                default:
317
                    st->codecpar->block_align = 35;
318 319
                }
                aiff->block_duration = 160;
320 321
                st->codecpar->bit_rate = st->codecpar->sample_rate * (st->codecpar->block_align << 3) /
                                         aiff->block_duration;
322
            }
323
            break;
324
        case MKTAG('C','H','A','N'):
325
            if(ff_mov_read_chan(s, pb, st, size) < 0)
326 327
                return AVERROR_INVALIDDATA;
            break;
328
        case 0:
329
            if (offset > 0 && st->codecpar->block_align) // COMM && SSND
330
                goto got_sound;
Baptiste Coudurier's avatar
Baptiste Coudurier committed
331 332 333
        default: /* Jump */
            if (size & 1)   /* Always even aligned */
                size++;
334
            avio_skip(pb, size);
335 336 337
        }
    }

338
got_sound:
339
    if (!st->codecpar->block_align) {
340
        av_log(s, AV_LOG_ERROR, "could not find COMM tag or invalid block_align value\n");
341 342
        return -1;
    }
343 344

    /* Now positioned, get the sound data start and end */
345
    avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
346
    st->start_time = 0;
347
    st->duration = st->nb_frames * aiff->block_duration;
348 349

    /* Position the stream at the first block */
350
    avio_seek(pb, offset, SEEK_SET);
351 352 353 354 355 356 357 358 359

    return 0;
}

/* Upper bound, in bytes, on the packet size requested by aiff_read_packet()
 * for codecs that are read as a whole number of block_align-sized blocks. */
#define MAX_SIZE 4096

/**
 * Read the next packet of sound data.
 *
 * Block-based codecs (IMA QT ADPCM, GSM, QDM2, QCELP) get exactly one block
 * per packet; everything else gets as many whole blocks as fit in MAX_SIZE
 * bytes. Reads never go past the end of the SSND chunk.
 *
 * @param s   demuxer context
 * @param pkt packet to fill
 * @return 0 on success, AVERROR_EOF once the sound data is exhausted,
 *         AVERROR_INVALIDDATA if a single block does not fit in MAX_SIZE,
 *         or the negative error returned by av_get_packet()
 */
static int aiff_read_packet(AVFormatContext *s,
                            AVPacket *pkt)
{
    AVStream *st = s->streams[0];
    AIFFInputContext *aiff = s->priv_data;
    int64_t max_size;
    int res, size;

    /* calculate size of remaining data */
    max_size = aiff->data_end - avio_tell(s->pb);
    if (max_size <= 0)
        return AVERROR_EOF;

    /* Now for that packet */
    switch (st->codecpar->codec_id) {
    case AV_CODEC_ID_ADPCM_IMA_QT:
    case AV_CODEC_ID_GSM:
    case AV_CODEC_ID_QDM2:
    case AV_CODEC_ID_QCELP:
        size = st->codecpar->block_align;
        break;
    default:
        size = (MAX_SIZE / st->codecpar->block_align) * st->codecpar->block_align;
        /* block_align > MAX_SIZE rounds down to zero blocks; without this
         * check every call would return an empty packet and never advance. */
        if (!size)
            return AVERROR_INVALIDDATA;
    }
    size = FFMIN(max_size, size);
    res = av_get_packet(s->pb, pkt, size);
    if (res < 0)
        return res;

    /* A request of at least one full block is not treated as corrupt, even
     * if the flag was set while reading (presumably on a short read - TODO
     * confirm against av_get_packet()). */
    if (size >= st->codecpar->block_align)
        pkt->flags &= ~AV_PKT_FLAG_CORRUPT;
    /* Only one stream in an AIFF file */
    pkt->stream_index = 0;
    pkt->duration     = (res / st->codecpar->block_align) * aiff->block_duration;
    return 0;
}

394
AVInputFormat ff_aiff_demuxer = {
395 396 397 398 399 400
    .name           = "aiff",
    .long_name      = NULL_IF_CONFIG_SMALL("Audio IFF"),
    .priv_data_size = sizeof(AIFFInputContext),
    .read_probe     = aiff_probe,
    .read_header    = aiff_read_header,
    .read_packet    = aiff_read_packet,
401
    .read_seek      = ff_pcm_read_seek,
402
    .codec_tag      = (const AVCodecTag* const []){ ff_codec_aiff_tags, 0 },
403
};