/*
 * WAV encoder and decoder
 * Copyright (c) 2001, 2002 Fabrice Bellard.
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
#include "avformat.h"
#include "avi.h"

22
const CodecTag codec_wav_tags[] = {
23
    { CODEC_ID_MP2, 0x50 },
24
    { CODEC_ID_MP3, 0x55 },
25
    { CODEC_ID_AC3, 0x2000 },
26
    { CODEC_ID_DTS, 0x2001 },
27 28
    { CODEC_ID_PCM_S16LE, 0x01 },
    { CODEC_ID_PCM_U8, 0x01 }, /* must come after s16le in this list */
29 30
    { CODEC_ID_PCM_S24LE, 0x01 },
    { CODEC_ID_PCM_S32LE, 0x01 },
31 32
    { CODEC_ID_PCM_ALAW, 0x06 },
    { CODEC_ID_PCM_MULAW, 0x07 },
33 34
    { CODEC_ID_ADPCM_MS, 0x02 },
    { CODEC_ID_ADPCM_IMA_WAV, 0x11 },
35
    { CODEC_ID_ADPCM_YAMAHA, 0x20 },
36
    { CODEC_ID_ADPCM_G726, 0x45 },
37 38
    { CODEC_ID_ADPCM_IMA_DK4, 0x61 },  /* rogue format number */
    { CODEC_ID_ADPCM_IMA_DK3, 0x62 },  /* rogue format number */
39 40
    { CODEC_ID_WMAV1, 0x160 },
    { CODEC_ID_WMAV2, 0x161 },
41
    { CODEC_ID_AAC, 0x706d },
42
    { CODEC_ID_VORBIS, ('V'<<8)+'o' }, //HACK/FIXME, does vorbis in WAV/AVI have an (in)official id?
43 44
    { CODEC_ID_SONIC, 0x2048 },
    { CODEC_ID_SONIC_LS, 0x2048 },
45
    { CODEC_ID_ADPCM_CT, 0x200 },
46
    { CODEC_ID_ADPCM_SWF, ('S'<<8)+'F' },
47
    { CODEC_ID_TRUESPEECH, 0x22 },
48 49 50 51

    // for NuppelVideo (nuv.c)
    { CODEC_ID_PCM_S16LE, MKTAG('R', 'A', 'W', 'A') },
    { CODEC_ID_MP3, MKTAG('L', 'A', 'M', 'E') },
52 53 54
    { 0, 0 },
};

55
#ifdef CONFIG_MUXERS
56
/* WAVEFORMATEX header */
57
/* returns the size or -1 on error */
58 59
int put_wav_header(ByteIOContext *pb, AVCodecContext *enc)
{
60
    int bps, blkalign, bytespersec;
61
    int hdrsize = 18;
62

63 64 65
    if(!enc->codec_tag)
       enc->codec_tag = codec_get_tag(codec_wav_tags, enc->codec_id);
    if(!enc->codec_tag)
66
        return -1;
67 68

    put_le16(pb, enc->codec_tag);
69 70 71 72 73 74
    put_le16(pb, enc->channels);
    put_le32(pb, enc->sample_rate);
    if (enc->codec_id == CODEC_ID_PCM_U8 ||
        enc->codec_id == CODEC_ID_PCM_ALAW ||
        enc->codec_id == CODEC_ID_PCM_MULAW) {
        bps = 8;
75
    } else if (enc->codec_id == CODEC_ID_MP2 || enc->codec_id == CODEC_ID_MP3) {
76
        bps = 0;
77
    } else if (enc->codec_id == CODEC_ID_ADPCM_IMA_WAV || enc->codec_id == CODEC_ID_ADPCM_MS || enc->codec_id == CODEC_ID_ADPCM_G726 || enc->codec_id == CODEC_ID_ADPCM_YAMAHA) { //
78
        bps = 4;
79 80 81 82
    } else if (enc->codec_id == CODEC_ID_PCM_S24LE) {
        bps = 24;
    } else if (enc->codec_id == CODEC_ID_PCM_S32LE) {
        bps = 32;
83 84 85
    } else {
        bps = 16;
    }
86

87
    if (enc->codec_id == CODEC_ID_MP2 || enc->codec_id == CODEC_ID_MP3) {
88
        blkalign = enc->frame_size; //this is wrong, but seems many demuxers dont work if this is set correctly
89
        //blkalign = 144 * enc->bit_rate/enc->sample_rate;
90 91
    } else if (enc->codec_id == CODEC_ID_ADPCM_G726) { //
        blkalign = 1;
92 93
    } else if (enc->block_align != 0) { /* specified by the codec */
        blkalign = enc->block_align;
94
    } else
95 96
        blkalign = enc->channels*bps >> 3;
    if (enc->codec_id == CODEC_ID_PCM_U8 ||
97 98
        enc->codec_id == CODEC_ID_PCM_S24LE ||
        enc->codec_id == CODEC_ID_PCM_S32LE ||
99 100 101 102 103 104 105 106
        enc->codec_id == CODEC_ID_PCM_S16LE) {
        bytespersec = enc->sample_rate * blkalign;
    } else {
        bytespersec = enc->bit_rate / 8;
    }
    put_le32(pb, bytespersec); /* bytes per second */
    put_le16(pb, blkalign); /* block align */
    put_le16(pb, bps); /* bits per sample */
107
    if (enc->codec_id == CODEC_ID_MP3) {
108
        put_le16(pb, 12); /* wav_extra_size */
109
        hdrsize += 12;
110 111 112 113 114
        put_le16(pb, 1); /* wID */
        put_le32(pb, 2); /* fdwFlags */
        put_le16(pb, 1152); /* nBlockSize */
        put_le16(pb, 1); /* nFramesPerBlock */
        put_le16(pb, 1393); /* nCodecDelay */
115 116
    } else if (enc->codec_id == CODEC_ID_MP2) {
        put_le16(pb, 22); /* wav_extra_size */
117
        hdrsize += 22;
118 119 120 121 122 123 124 125
        put_le16(pb, 2);  /* fwHeadLayer */
        put_le32(pb, enc->bit_rate); /* dwHeadBitrate */
        put_le16(pb, enc->channels == 2 ? 1 : 8); /* fwHeadMode */
        put_le16(pb, 0);  /* fwHeadModeExt */
        put_le16(pb, 1);  /* wHeadEmphasis */
        put_le16(pb, 16); /* fwHeadFlags */
        put_le32(pb, 0);  /* dwPTSLow */
        put_le32(pb, 0);  /* dwPTSHigh */
126 127
    } else if (enc->codec_id == CODEC_ID_ADPCM_IMA_WAV) {
        put_le16(pb, 2); /* wav_extra_size */
128
        hdrsize += 2;
129
        put_le16(pb, ((enc->block_align - 4 * enc->channels) / (4 * enc->channels)) * 8 + 1); /* wSamplesPerBlock */
130
    } else if(enc->extradata_size){
131 132 133
        put_le16(pb, enc->extradata_size);
        put_buffer(pb, enc->extradata, enc->extradata_size);
        hdrsize += enc->extradata_size;
Michael Niedermayer's avatar
Michael Niedermayer committed
134 135 136 137
        if(hdrsize&1){
            hdrsize++;
            put_byte(pb, 0);
        }
138 139
    } else {
        hdrsize -= 2;
140
    }
141

142
    return hdrsize;
143
}
144
#endif //CONFIG_MUXERS
145

146 147 148 149 150 151 152
/* We could be given one of the three possible structures here:
 * WAVEFORMAT, PCMWAVEFORMAT or WAVEFORMATEX. Each structure
 * is an expansion of the previous one with the fields added
 * at the bottom. PCMWAVEFORMAT adds 'WORD wBitsPerSample' and
 * WAVEFORMATEX adds 'WORD  cbSize' and basically makes itself
 * an openended structure.
 */
153
void get_wav_header(ByteIOContext *pb, AVCodecContext *codec, int size)
154
{
155
    int id;
156 157 158 159 160 161 162 163

    id = get_le16(pb);
    codec->codec_type = CODEC_TYPE_AUDIO;
    codec->codec_tag = id;
    codec->channels = get_le16(pb);
    codec->sample_rate = get_le32(pb);
    codec->bit_rate = get_le32(pb) * 8;
    codec->block_align = get_le16(pb);
164 165
    if (size == 14) {  /* We're dealing with plain vanilla WAVEFORMAT */
        codec->bits_per_sample = 8;
Michael Niedermayer's avatar
Michael Niedermayer committed
166 167 168
    }else
        codec->bits_per_sample = get_le16(pb);
    codec->codec_id = wav_codec_get_id(id, codec->bits_per_sample);
169

170
    if (size > 16) {  /* We're obviously dealing with WAVEFORMATEX */
171 172 173 174
        codec->extradata_size = get_le16(pb);
        if (codec->extradata_size > 0) {
            if (codec->extradata_size > size - 18)
                codec->extradata_size = size - 18;
175
            codec->extradata = av_mallocz(codec->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE);
176
            get_buffer(pb, codec->extradata, codec->extradata_size);
177
        } else
178
            codec->extradata_size = 0;
179

180 181 182
        /* It is possible for the chunk to contain garbage at the end */
        if (size - codec->extradata_size - 18 > 0)
            url_fskip(pb, size - codec->extradata_size - 18);
183 184 185 186
    }
}


187 188 189 190 191 192 193 194 195
int wav_codec_get_id(unsigned int tag, int bps)
{
    int id;
    id = codec_get_id(codec_wav_tags, tag);
    if (id <= 0)
        return id;
    /* handle specific u8 codec */
    if (id == CODEC_ID_PCM_S16LE && bps == 8)
        id = CODEC_ID_PCM_U8;
196 197 198 199
    if (id == CODEC_ID_PCM_S16LE && bps == 24)
        id = CODEC_ID_PCM_S24LE;
    if (id == CODEC_ID_PCM_S16LE && bps == 32)
        id = CODEC_ID_PCM_S32LE;
200 201 202
    return id;
}

203
#ifdef CONFIG_MUXERS
Fabrice Bellard's avatar
Fabrice Bellard committed
204 205 206 207 208 209
/* Private state of the WAV muxer. */
typedef struct WAVContext {
    /* value returned by start_tag() for the "data" chunk; handed back to
     * end_tag() when the trailer is written */
    offset_t data;
} WAVContext;

/*
 * Write the RIFF/WAVE preamble, the "fmt " chunk for the first stream and
 * the opening of the "data" chunk.
 *
 * The RIFF length field is written as 0 here; wav_write_trailer() patches
 * it when the output is seekable.
 *
 * Returns 0 on success, -1 if put_wav_header() cannot describe the codec.
 */
static int wav_write_header(AVFormatContext *s)
{
    WAVContext *wav = s->priv_data;
    ByteIOContext *pb = &s->pb;
    offset_t fmt;

    put_tag(pb, "RIFF");
    put_le32(pb, 0); /* file length */
    put_tag(pb, "WAVE");

    /* format header */
    fmt = start_tag(pb, "fmt ");
    if (put_wav_header(pb, s->streams[0]->codec) < 0) {
        av_free(wav);
        /* the private context is gone: do not leave a dangling pointer
         * behind that a later cleanup could free a second time */
        s->priv_data = NULL;
        return -1;
    }
    end_tag(pb, fmt);

    av_set_pts_info(s->streams[0], 64, 1, s->streams[0]->codec->sample_rate);

    /* data header */
    wav->data = start_tag(pb, "data");

    put_flush_packet(pb);

    return 0;
}

236
/*
 * Append the payload of 'pkt' to the output unchanged.
 * Always returns 0.
 */
static int wav_write_packet(AVFormatContext *s, AVPacket *pkt)
{
    put_buffer(&s->pb, pkt->data, pkt->size);

    return 0;
}

/*
 * Finish the file: close the "data" chunk and patch the RIFF length field
 * at offset 4. Nothing is done when the output is streamed, since the
 * patching needs to seek back.
 * Always returns 0.
 */
static int wav_write_trailer(AVFormatContext *s)
{
    ByteIOContext *pb = &s->pb;
    WAVContext *wav = s->priv_data;
    offset_t end_pos;

    if (url_is_streamed(pb))
        return 0;

    end_tag(pb, wav->data);

    /* update file size: total length minus the 8 byte RIFF chunk header */
    end_pos = url_ftell(pb);
    url_fseek(pb, 4, SEEK_SET);
    put_le32(pb, (uint32_t)(end_pos - 8));
    url_fseek(pb, end_pos, SEEK_SET);

    put_flush_packet(pb);

    return 0;
}
262
#endif //CONFIG_MUXERS
Fabrice Bellard's avatar
Fabrice Bellard committed
263 264 265

/* return the size of the found tag */
/* XXX: > 2GB ? */
266
static int find_tag(ByteIOContext *pb, uint32_t tag1)
Fabrice Bellard's avatar
Fabrice Bellard committed
267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284
{
    unsigned int tag;
    int size;

    for(;;) {
        if (url_feof(pb))
            return -1;
        tag = get_le32(pb);
        size = get_le32(pb);
        if (tag == tag1)
            break;
        url_fseek(pb, size, SEEK_CUR);
    }
    if (size < 0)
        size = 0x7fffffff;
    return size;
}

Fabrice Bellard's avatar
Fabrice Bellard committed
285 286 287 288 289 290 291 292 293 294 295 296 297 298
/*
 * Probe for a WAV file: "RIFF" at offset 0 and "WAVE" at offset 8.
 * Buffers of 32 bytes or less are never accepted.
 * Returns AVPROBE_SCORE_MAX on a match, 0 otherwise.
 */
static int wav_probe(AVProbeData *p)
{
    int has_riff, has_wave;

    /* check file header */
    if (p->buf_size <= 32)
        return 0;

    has_riff = p->buf[0] == 'R' && p->buf[1] == 'I' &&
               p->buf[2] == 'F' && p->buf[3] == 'F';
    has_wave = p->buf[8]  == 'W' && p->buf[9]  == 'A' &&
               p->buf[10] == 'V' && p->buf[11] == 'E';

    return (has_riff && has_wave) ? AVPROBE_SCORE_MAX : 0;
}

Fabrice Bellard's avatar
Fabrice Bellard committed
299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316
/* wav input */

/*
 * Read the RIFF/WAVE preamble and the "fmt " chunk, create the single
 * audio stream and advance to the payload of the "data" chunk.
 *
 * Returns 0 on success, -1 on a malformed or truncated header and
 * AVERROR_NOMEM if the stream cannot be allocated.
 */
static int wav_read_header(AVFormatContext *s,
                           AVFormatParameters *ap)
{
    ByteIOContext *pb = &s->pb;
    AVStream *st;
    unsigned int fourcc;
    int chunk_size;

    /* check RIFF header */
    fourcc = get_le32(pb);
    if (fourcc != MKTAG('R', 'I', 'F', 'F'))
        return -1;

    get_le32(pb); /* file size */

    fourcc = get_le32(pb);
    if (fourcc != MKTAG('W', 'A', 'V', 'E'))
        return -1;

    /* parse fmt header */
    chunk_size = find_tag(pb, MKTAG('f', 'm', 't', ' '));
    if (chunk_size < 0)
        return -1;

    st = av_new_stream(s, 0);
    if (!st)
        return AVERROR_NOMEM;

    get_wav_header(pb, st->codec, chunk_size);
    st->need_parsing = 1;

    av_set_pts_info(st, 64, 1, st->codec->sample_rate);

    /* position the stream at the start of the audio data */
    if (find_tag(pb, MKTAG('d', 'a', 't', 'a')) < 0)
        return -1;

    return 0;
}

#define MAX_SIZE 4096

/*
 * Read the next packet of audio data.
 *
 * The packet holds up to MAX_SIZE bytes. When the codec has a block
 * alignment greater than 1, the size is rounded down to a whole number of
 * blocks, and is at least one block.
 *
 * Returns the number of bytes read (also stored in pkt->size), AVERROR_IO
 * at end of input or if the packet cannot be allocated, or the negative
 * value reported by get_buffer() on a read error. On error the packet is
 * released and not touched afterwards.
 */
static int wav_read_packet(AVFormatContext *s,
                           AVPacket *pkt)
{
    int ret, size;
    AVStream *st;

    if (url_feof(&s->pb))
        return AVERROR_IO;
    st = s->streams[0];

    size = MAX_SIZE;
    if (st->codec->block_align > 1) {
        if (size < st->codec->block_align)
            size = st->codec->block_align;
        size = (size / st->codec->block_align) * st->codec->block_align;
    }
    if (av_new_packet(pkt, size))
        return AVERROR_IO;
    pkt->stream_index = 0;

    ret = get_buffer(&s->pb, pkt->data, pkt->size);
    if (ret < 0) {
        /* return right away: do not write a negative size into a packet
         * that has just been released */
        av_free_packet(pkt);
        return ret;
    }
    /* note: we need to modify the packet size here to handle the last
       packet */
    pkt->size = ret;
    return ret;
}

/*
 * Close the demuxer. There is nothing to release here.
 * Always returns 0.
 */
static int wav_read_close(AVFormatContext *s)
{
    (void)s; /* unused */

    return 0;
}

373
/*
 * Seek to 'timestamp'.
 *
 * For MP2, MP3, AC3 and DTS this returns -1 so that the caller uses
 * generic seeking with dynamically generated indexes. Every other codec is
 * delegated to pcm_read_seek().
 */
static int wav_read_seek(AVFormatContext *s,
                         int stream_index, int64_t timestamp, int flags)
{
    const AVStream *st = s->streams[0];

    if (st->codec->codec_id == CODEC_ID_MP2 ||
        st->codec->codec_id == CODEC_ID_MP3 ||
        st->codec->codec_id == CODEC_ID_AC3 ||
        st->codec->codec_id == CODEC_ID_DTS) {
        /* use generic seeking with dynamically generated indexes */
        return -1;
    }

    return pcm_read_seek(s, stream_index, timestamp, flags);
}


Fabrice Bellard's avatar
Fabrice Bellard committed
393 394 395 396 397 398 399 400
static AVInputFormat wav_iformat = {
    "wav",
    "wav format",
    0,
    wav_probe,
    wav_read_header,
    wav_read_packet,
    wav_read_close,
401
    wav_read_seek,
Fabrice Bellard's avatar
Fabrice Bellard committed
402 403
};

404
#ifdef CONFIG_MUXERS
Fabrice Bellard's avatar
Fabrice Bellard committed
405
static AVOutputFormat wav_oformat = {
Fabrice Bellard's avatar
Fabrice Bellard committed
406 407 408 409
    "wav",
    "wav format",
    "audio/x-wav",
    "wav",
Fabrice Bellard's avatar
Fabrice Bellard committed
410
    sizeof(WAVContext),
Fabrice Bellard's avatar
Fabrice Bellard committed
411
    CODEC_ID_PCM_S16LE,
Fabrice Bellard's avatar
Fabrice Bellard committed
412 413 414 415 416
    CODEC_ID_NONE,
    wav_write_header,
    wav_write_packet,
    wav_write_trailer,
};
417
#endif //CONFIG_MUXERS
Fabrice Bellard's avatar
Fabrice Bellard committed
418

419
int ff_wav_init(void)
Fabrice Bellard's avatar
Fabrice Bellard committed
420 421
{
    av_register_input_format(&wav_iformat);
422
#ifdef CONFIG_MUXERS
Fabrice Bellard's avatar
Fabrice Bellard committed
423
    av_register_output_format(&wav_oformat);
424
#endif //CONFIG_MUXERS
Fabrice Bellard's avatar
Fabrice Bellard committed
425 426
    return 0;
}