/*
 * WavPack demuxer
 * Copyright (c) 2006,2011 Konstantin Shishkov
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

22
#include "libavutil/audioconvert.h"
23
#include "libavutil/intreadwrite.h"
24
#include "libavutil/dict.h"
25
#include "avformat.h"
26
#include "internal.h"
27 28
#include "apetag.h"
#include "id3v1.h"
29 30 31 32 33 34

// specs say that maximum block size is 1Mb (1024 * 1024 bytes)
#define WV_BLOCK_LIMIT 1048576

// number of trailing block-header bytes kept in WVContext.extra and copied
// in front of each block payload placed into a packet
#define WV_EXTRA_SIZE 12

// block-position bits of the header flags word; a block carrying both bits
// stands alone, otherwise it is part of a multi-block (multichannel) frame
#define WV_START_BLOCK  0x0800
#define WV_END_BLOCK    0x1000
#define WV_SINGLE_BLOCK (WV_START_BLOCK | WV_END_BLOCK)

39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60
/* Single-bit masks tested against the flags word of a block header. */
enum WV_FLAGS {
    WV_MONO   = 1 << 2,   /* 0x0004 */
    WV_HYBRID = 1 << 3,   /* 0x0008 */
    WV_JOINT  = 1 << 4,   /* 0x0010 */
    WV_CROSSD = 1 << 5,   /* 0x0020 */
    WV_HSHAPE = 1 << 6,   /* 0x0040 */
    WV_FLOAT  = 1 << 7,   /* 0x0080 */
    WV_INT32  = 1 << 8,   /* 0x0100 */
    WV_HBR    = 1 << 9,   /* 0x0200 */
    WV_HBAL   = 1 << 10,  /* 0x0400 */
    WV_MCINIT = 1 << 11,  /* 0x0800 */
    WV_MCEND  = 1 << 12,  /* 0x1000 */
};

/*
 * Sampling rates selected by the 4-bit rate index taken from the block flags.
 * The last entry (-1) marks a rate that is not in the table and has to be
 * read from the block metadata instead.
 */
static const int wv_rates[16] = {
    /*  0 */   6000,
    /*  1 */   8000,
    /*  2 */   9600,
    /*  3 */  11025,
    /*  4 */  12000,
    /*  5 */  16000,
    /*  6 */  22050,
    /*  7 */  24000,
    /*  8 */  32000,
    /*  9 */  44100,
    /* 10 */  48000,
    /* 11 */  64000,
    /* 12 */  88200,
    /* 13 */  96000,
    /* 14 */ 192000,
    /* 15 */     -1
};

typedef struct{
    uint32_t blksize, flags;
    int rate, chan, bpp;
61
    uint32_t chmask;
62
    uint32_t samples, soff;
63
    int multichannel;
64 65
    int block_parsed;
    uint8_t extra[WV_EXTRA_SIZE];
66
    int64_t pos;
67 68 69 70 71 72 73 74 75 76 77 78 79 80
}WVContext;

/**
 * Probe callback: recognise a WavPack stream by its leading "wvpk" tag.
 *
 * @param p probe data; only buf and buf_size are examined
 * @return AVPROBE_SCORE_MAX when more than 32 bytes are available and the
 *         buffer starts with "wvpk", 0 otherwise
 */
static int wv_probe(AVProbeData *p)
{
    /* not enough data to judge */
    if (p->buf_size <= 32)
        return 0;

    /* check file header */
    if (p->buf[0] != 'w' || p->buf[1] != 'v' ||
        p->buf[2] != 'p' || p->buf[3] != 'k')
        return 0;

    return AVPROBE_SCORE_MAX;
}

81
/**
 * Parse one WavPack block header and update the demuxer state.
 *
 * @param ctx    demuxer context; ctx->priv_data is the WVContext to update
 * @param pb     I/O context. With append == 0 it must be positioned at the
 *               start of a block; the 32 header bytes are read from it.
 * @param append when non-zero, the caller has already consumed the header and
 *               stored the block size in wc->blksize and the trailing
 *               WV_EXTRA_SIZE header bytes in wc->extra; nothing is read from
 *               pb for the header itself
 * @return 0 on success, a negative value on error
 *
 * For a block that carries samples, wc->blksize is set to the payload size
 * (block size minus 24) on success. For a block with zero samples the function
 * returns 0 early and leaves wc->blksize at the value it had after the header
 * was read (the full block size when append == 0).
 */
static int wv_read_block_header(AVFormatContext *ctx, AVIOContext *pb, int append)
{
    WVContext *wc = ctx->priv_data;
    uint32_t tag, ver;
    int size;
    int rate, bpp, chan;
    uint32_t chmask;

    wc->pos = avio_tell(pb);
    if (!append) {
        tag = avio_rl32(pb);
        if (tag != MKTAG('w', 'v', 'p', 'k'))
            return -1;
        size = avio_rl32(pb);
        if (size < 24 || size > WV_BLOCK_LIMIT) {
            av_log(ctx, AV_LOG_ERROR, "Incorrect block size %i\n", size);
            return -1;
        }
        wc->blksize = size;
        ver = avio_rl16(pb);
        if (ver < 0x402 || ver > 0x410) {
            av_log(ctx, AV_LOG_ERROR, "Unsupported version %03X\n", ver);
            return -1;
        }
        avio_r8(pb); // track no
        avio_r8(pb); // track sub index
        wc->samples = avio_rl32(pb); // total samples in file
        wc->soff = avio_rl32(pb); // offset in samples of current block
        // a short read would leave stale bytes in wc->extra, which the code
        // below would then interpret as sample count and flags
        if (avio_read(pb, wc->extra, WV_EXTRA_SIZE) != WV_EXTRA_SIZE) {
            av_log(ctx, AV_LOG_ERROR, "Truncated block header\n");
            return -1;
        }
    } else {
        size = wc->blksize;
    }
    wc->flags = AV_RL32(wc->extra + 4);
    // blocks with zero samples don't contain actual audio information and should be ignored
    if (!AV_RN32(wc->extra))
        return 0;
    //parse flags
    bpp = ((wc->flags & 3) + 1) << 3;
    chan = 1 + !(wc->flags & WV_MONO);
    chmask = wc->flags & WV_MONO ? AV_CH_LAYOUT_MONO : AV_CH_LAYOUT_STEREO;
    rate = wv_rates[(wc->flags >> 23) & 0xF];
    wc->multichannel = !!((wc->flags & WV_SINGLE_BLOCK) != WV_SINGLE_BLOCK);
    if (wc->multichannel) {
        // blocks of a multi-block frame use the stream-level channel setup
        chan = wc->chan;
        chmask = wc->chmask;
    }
    if ((rate == -1 || !chan) && !wc->block_parsed) {
        // the flags alone are not enough: scan the metadata sub-blocks of this
        // block for channel info (id 0xD) and a custom sample rate (id 0x27),
        // then seek back to the start of the block payload
        int64_t block_end = avio_tell(pb) + wc->blksize - 24;
        if (!pb->seekable) {
            av_log(ctx, AV_LOG_ERROR, "Cannot determine additional parameters\n");
            return -1;
        }
        while (avio_tell(pb) < block_end) {
            int id, chunk_size;
            id = avio_r8(pb);
            chunk_size = (id & 0x80) ? avio_rl24(pb) : avio_r8(pb);
            // at end of file the reads above return 0 without advancing, so
            // without this check the loop would never reach block_end
            if (url_feof(pb)) {
                av_log(ctx, AV_LOG_ERROR, "Unexpected end of file in block metadata\n");
                return -1;
            }
            // the stored size counts 16-bit words; bit 0x40 marks an odd byte
            // count followed by one padding byte
            chunk_size <<= 1;
            if (id & 0x40)
                chunk_size--;
            switch (id & 0x3F) {
            case 0xD:
                if (chunk_size <= 1) {
                    av_log(ctx, AV_LOG_ERROR, "Insufficient channel information\n");
                    return -1;
                }
                chan = avio_r8(pb);
                switch (chunk_size - 2) {
                case 0:
                    chmask = avio_r8(pb);
                    break;
                case 1:
                    chmask = avio_rl16(pb);
                    break;
                case 2:
                    chmask = avio_rl24(pb);
                    break;
                case 3:
                    chmask = avio_rl32(pb);
                    break;
                case 5:
                    avio_skip(pb, 1);
                    chan |= (avio_r8(pb) & 0xF) << 8;
                    chmask = avio_rl24(pb);
                    break;
                default:
                    av_log(ctx, AV_LOG_ERROR, "Invalid channel info size %d\n", chunk_size);
                    return -1;
                }
                break;
            case 0x27:
                rate = avio_rl24(pb);
                break;
            default:
                avio_skip(pb, chunk_size);
            }
            if (id & 0x40)
                avio_skip(pb, 1);
        }
        if (rate == -1) {
            av_log(ctx, AV_LOG_ERROR, "Cannot determine custom sampling rate\n");
            return -1;
        }
        avio_seek(pb, block_end - wc->blksize + 24, SEEK_SET);
    }
    // the first values seen become the stream parameters
    if (!wc->bpp) wc->bpp = bpp;
    if (!wc->chan) wc->chan = chan;
    if (!wc->chmask) wc->chmask = chmask;
    if (!wc->rate) wc->rate = rate;

    // later blocks must agree with the stream parameters
    if (wc->flags && bpp != wc->bpp) {
        av_log(ctx, AV_LOG_ERROR, "Bits per sample differ, this block: %i, header block: %i\n", bpp, wc->bpp);
        return -1;
    }
    if (wc->flags && !wc->multichannel && chan != wc->chan) {
        av_log(ctx, AV_LOG_ERROR, "Channels differ, this block: %i, header block: %i\n", chan, wc->chan);
        return -1;
    }
    if (wc->flags && rate != -1 && rate != wc->rate) {
        av_log(ctx, AV_LOG_ERROR, "Sampling rate differ, this block: %i, header block: %i\n", rate, wc->rate);
        return -1;
    }
    // 24 of the bytes counted by the size field belong to the header
    wc->blksize = size - 24;
    return 0;
}

206
/**
 * Read the first block header that carries samples and create the single
 * audio stream from the parameters found there.
 *
 * @param s demuxer context
 * @return 0 on success, AVERROR(ENOMEM) if the stream cannot be allocated,
 *         another negative value if no valid block header is found
 */
static int wv_read_header(AVFormatContext *s)
{
    AVIOContext *pb = s->pb;
    WVContext *wc = s->priv_data;
    AVStream *st;

    wc->block_parsed = 0;
    for (;;) {
        if (wv_read_block_header(s, pb, 0) < 0)
            return -1;
        /* zero-sample block: the header parser left blksize at the full
         * block size, of which 24 bytes were already consumed */
        if (!AV_RN32(wc->extra))
            avio_skip(pb, wc->blksize - 24);
        else
            break;
    }

    /* now we are ready: build format streams */
    st = avformat_new_stream(s, NULL);
    if (!st)
        return AVERROR(ENOMEM);
    st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
    st->codec->codec_id = CODEC_ID_WAVPACK;
    st->codec->channels = wc->chan;
    st->codec->channel_layout = wc->chmask;
    st->codec->sample_rate = wc->rate;
    st->codec->bits_per_coded_sample = wc->bpp;
    /* timestamps are counted in samples */
    avpriv_set_pts_info(st, 64, 1, wc->rate);
    st->start_time = 0;
    st->duration = wc->samples;

    if (s->pb->seekable) {
        /* read tags, then return to the first block payload;
         * ID3v1 is only consulted when the APE tag produced no metadata */
        int64_t cur = avio_tell(s->pb);
        ff_ape_parse_tag(s);
        if (!av_dict_get(s->metadata, "", NULL, AV_DICT_IGNORE_SUFFIX))
            ff_id3v1_read(s);
        avio_seek(s->pb, cur, SEEK_SET);
    }

    return 0;
}

/**
 * Read one frame into a packet.
 *
 * The packet holds, for every block of the frame, the WV_EXTRA_SIZE trailing
 * header bytes followed by the block payload. In the multichannel case each
 * block is additionally preceded by a 32-bit little-endian size field, and
 * blocks are appended until one with WV_END_BLOCK set has been read.
 *
 * @param s   demuxer context
 * @param pkt packet to fill; released again on every error path
 * @return 0 on success, a negative value on error (AVERROR(EIO) for end of
 *         file or truncated data, AVERROR(ENOMEM) on allocation failure)
 */
static int wv_read_packet(AVFormatContext *s,
                          AVPacket *pkt)
{
    WVContext *wc = s->priv_data;
    int ret;
    int size, ver, off;
    int64_t pos;
    uint32_t block_samples;

    if (url_feof(s->pb))
        return AVERROR(EIO);
    /* the header of the very first block was already parsed by
     * wv_read_header(); afterwards every call starts with a new header */
    if (wc->block_parsed) {
        if (wv_read_block_header(s, s->pb, 0) < 0)
            return -1;
    }

    pos = wc->pos;
    off = wc->multichannel ? 4 : 0;
    if (av_new_packet(pkt, wc->blksize + WV_EXTRA_SIZE + off) < 0)
        return AVERROR(ENOMEM);
    /* NOTE(review): the size prefix is blksize + WV_EXTRA_SIZE + 12, the same
     * value as the block size field read from the file; confirm this is what
     * the decoder expects */
    if (wc->multichannel)
        AV_WL32(pkt->data, wc->blksize + WV_EXTRA_SIZE + 12);
    memcpy(pkt->data + off, wc->extra, WV_EXTRA_SIZE);
    ret = avio_read(s->pb, pkt->data + WV_EXTRA_SIZE + off, wc->blksize);
    if (ret != wc->blksize) {
        ret = AVERROR(EIO);
        goto fail;
    }
    while (!(wc->flags & WV_END_BLOCK)) {
        if (avio_rl32(s->pb) != MKTAG('w', 'v', 'p', 'k')) {
            ret = -1;
            goto fail;
        }
        /* block size field; a short read is treated like the short payload
         * read of the first block above */
        ret = av_append_packet(s->pb, pkt, 4);
        if (ret != 4) {
            if (ret >= 0)
                ret = AVERROR(EIO);
            goto fail;
        }
        size = AV_RL32(pkt->data + pkt->size - 4);
        if (size < 24 || size > WV_BLOCK_LIMIT) {
            av_log(s, AV_LOG_ERROR, "Incorrect block size %d\n", size);
            ret = -1;
            goto fail;
        }
        wc->blksize = size;
        ver = avio_rl16(s->pb);
        if (ver < 0x402 || ver > 0x410) {
            av_log(s, AV_LOG_ERROR, "Unsupported version %03X\n", ver);
            ret = -1;
            goto fail;
        }
        avio_r8(s->pb); // track no
        avio_r8(s->pb); // track sub index
        wc->samples = avio_rl32(s->pb); // total samples in file
        wc->soff = avio_rl32(s->pb); // offset in samples of current block
        ret = av_append_packet(s->pb, pkt, WV_EXTRA_SIZE);
        if (ret != WV_EXTRA_SIZE) {
            if (ret >= 0)
                ret = AVERROR(EIO);
            goto fail;
        }
        memcpy(wc->extra, pkt->data + pkt->size - WV_EXTRA_SIZE, WV_EXTRA_SIZE);

        /* header bytes are already consumed: parse them in append mode */
        if (wv_read_block_header(s, s->pb, 1) < 0) {
            ret = -1;
            goto fail;
        }
        ret = av_append_packet(s->pb, pkt, wc->blksize);
        if (ret != wc->blksize) {
            if (ret >= 0)
                ret = AVERROR(EIO);
            goto fail;
        }
    }
    pkt->stream_index = 0;
    wc->block_parsed = 1;
    pkt->pts = wc->soff;
    block_samples = AV_RN32(wc->extra);
    if (block_samples > INT32_MAX)
        av_log(s, AV_LOG_WARNING, "Too many samples in block: %"PRIu32"\n", block_samples);
    else
        pkt->duration = block_samples;

    /* remember where this frame started so that seeking can return to it */
    av_add_index_entry(s->streams[0], pos, pkt->pts, 0, 0, AVINDEX_KEYFRAME);
    return 0;

fail:
    av_free_packet(pkt);
    return ret;
}

330 331 332 333 334 335 336 337 338 339
/**
 * Seek to the frame containing the given timestamp.
 *
 * Timestamps covered by the index built while reading packets are served by
 * seeking straight to the recorded position. Anything beyond the index is
 * reached by reading frames forward until the requested timestamp is hit.
 *
 * @param s            demuxer context
 * @param stream_index index of the stream the timestamp refers to
 * @param timestamp    target timestamp
 * @param flags        passed through to av_index_search_timestamp()
 * @return 0 on success, -1 on failure
 */
static int wv_read_seek(AVFormatContext *s, int stream_index, int64_t timestamp, int flags)
{
    AVStream *st = s->streams[stream_index];
    WVContext *wc = s->priv_data;
    AVPacket scratch;
    int64_t start_pos, cur_pts;
    int idx = av_index_search_timestamp(st, timestamp, flags);

    /* target lies inside the indexed range: jump there directly */
    if (idx >= 0 &&
        timestamp <= st->index_entries[st->nb_index_entries - 1].timestamp) {
        wc->block_parsed = 1;
        avio_seek(s->pb, st->index_entries[idx].pos, SEEK_SET);
        return 0;
    }

    /* reject timestamps that are out of bounds
     * NOTE(review): this compares against the format-level s->duration, not
     * st->duration; confirm both are in the same units as timestamp */
    if (timestamp < 0 || timestamp >= s->duration)
        return -1;

    /* read forward from the current position; on failure go back to it */
    start_pos = avio_tell(s->pb);
    for (;;) {
        if (av_read_frame(s, &scratch) < 0) {
            avio_seek(s->pb, start_pos, SEEK_SET);
            return -1;
        }
        cur_pts = scratch.pts;
        av_free_packet(&scratch);
        if (cur_pts >= timestamp)
            return 0;
    }
}

363
AVInputFormat ff_wv_demuxer = {
364 365 366 367 368 369 370
    .name           = "wv",
    .long_name      = NULL_IF_CONFIG_SMALL("WavPack"),
    .priv_data_size = sizeof(WVContext),
    .read_probe     = wv_probe,
    .read_header    = wv_read_header,
    .read_packet    = wv_read_packet,
    .read_seek      = wv_read_seek,
371
};