nellymoserdec.c 6.83 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 * NellyMoser audio decoder
 * Copyright (c) 2007 a840bda5870ba11f19698ff6eb9581dfb0f95fa5,
 *                    539459aeb7d425140b62a3ec7dbf6dc8e408a306, and
 *                    520e17cd55896441042b14df2566a6eb610ed444
 * Copyright (c) 2007 Loic Minier <lool at dooz.org>
 *                    Benjamin Larsson
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 */

/**
 * @file
 * The 3 alphanumeric copyright notices are md5sums; they belong to the
 * original implementors. The original code is available from
 * http://code.google.com/p/nelly2pcm/
 */
33

34
#include <limits.h>

#include "libavutil/channel_layout.h"
#include "libavutil/float_dsp.h"
#include "libavutil/lfg.h"
#include "libavutil/random_seed.h"

#define BITSTREAM_READER_LE
#include "avcodec.h"
#include "fft.h"
#include "get_bits.h"
#include "internal.h"
#include "nellymoser.h"
#include "sinewin.h"
46 47 48 49


typedef struct NellyMoserDecodeContext {
    AVCodecContext* avctx;
50
    AVLFG           random_state;
51
    GetBitContext   gb;
52
    float           scale_bias;
53
    AVFloatDSPContext *fdsp;
54
    FFTContext      imdct_ctx;
55 56 57
    DECLARE_ALIGNED(32, float, imdct_buf)[2][NELLY_BUF_LEN];
    float          *imdct_out;
    float          *imdct_prev;
58 59
} NellyMoserDecodeContext;

60 61 62
/**
 * Decode one block of NELLY_BLOCK_LEN bytes into NELLY_SAMPLES float samples.
 *
 * The block starts with the band levels: a 6-bit index into
 * ff_nelly_init_table for the first band, then a 5-bit index into
 * ff_nelly_delta_table for each following band. Those levels drive the bit
 * allocation (ff_nelly_get_sample_bits()). The block is then decoded as two
 * halves of NELLY_BUF_LEN coefficients each, every half going through the
 * IMDCT and being windowed against the previous half.
 *
 * @param s     decoder state (bit reader, PRNG and IMDCT buffers are updated)
 * @param block input block
 * @param audio output samples
 */
static void nelly_decode_block(NellyMoserDecodeContext *s,
                               const unsigned char block[NELLY_BLOCK_LEN],
                               float audio[NELLY_SAMPLES])
{
    float band_level[NELLY_FILL_LEN], band_power[NELLY_FILL_LEN];
    int   nbits[NELLY_BUF_LEN];
    float level, power;
    int   band, half, k, n;

    init_get_bits(&s->gb, block, NELLY_BLOCK_LEN * 8);

    /* Expand the per-band level and power to one entry per coefficient. */
    level = ff_nelly_init_table[get_bits(&s->gb, 6)];
    n     = 0;
    for (band = 0; band < NELLY_BANDS; band++) {
        if (band)
            level += ff_nelly_delta_table[get_bits(&s->gb, 5)];
        power = -exp2(level/2048) * s->scale_bias;
        for (k = 0; k < ff_nelly_band_sizes_table[band]; k++, n++) {
            band_level[n] = level;
            band_power[n] = power;
        }
    }

    ff_nelly_get_sample_bits(band_level, nbits);

    for (half = 0; half < 2; half++) {
        float *coefs = audio + half * NELLY_BUF_LEN;

        /* Rewind, then jump straight to this half's coefficient bits. */
        init_get_bits(&s->gb, block, NELLY_BLOCK_LEN * 8);
        skip_bits_long(&s->gb, NELLY_HEADER_BITS + half*NELLY_DETAIL_BITS);

        for (k = 0; k < NELLY_FILL_LEN; k++) {
            if (nbits[k] > 0) {
                unsigned char q = get_bits(&s->gb, nbits[k]);

                coefs[k] = ff_nelly_dequantization_table[(1<<nbits[k])-1+q]*band_power[k];
                continue;
            }
            /* No bits allocated: substitute a fixed magnitude with a
             * pseudo-random sign. */
            coefs[k] = M_SQRT1_2*band_power[k];
            if (av_lfg_get(&s->random_state) & 1)
                coefs[k] *= -1.0;
        }
        /* Coefficients past NELLY_FILL_LEN are not coded. */
        memset(coefs + NELLY_FILL_LEN, 0,
               (NELLY_BUF_LEN - NELLY_FILL_LEN) * sizeof(float));

        s->imdct_ctx.imdct_half(&s->imdct_ctx, s->imdct_out, coefs);
        s->fdsp->vector_fmul_window(coefs, s->imdct_prev + NELLY_BUF_LEN / 2,
                                    s->imdct_out, ff_sine_128,
                                    NELLY_BUF_LEN / 2);
        /* The buffer just produced becomes the overlap source next time. */
        FFSWAP(float *, s->imdct_out, s->imdct_prev);
    }
}

115
/**
 * Initialise the decoder state: IMDCT context, float DSP helpers, PRNG,
 * overlap buffers and sine window. Output is forced to mono float samples.
 *
 * @param avctx codec context; its priv_data is the NellyMoserDecodeContext
 * @return 0 on success, a negative error code if the IMDCT or the float DSP
 *         context could not be set up
 */
static av_cold int decode_init(AVCodecContext * avctx) {
    NellyMoserDecodeContext *s = avctx->priv_data;
    int ret;

    s->avctx = avctx;
    s->imdct_out = s->imdct_buf[0];
    s->imdct_prev = s->imdct_buf[1];
    av_lfg_init(&s->random_state, 0);

    /* ff_mdct_init() reports failure through its return value; do not carry
     * on with a transform that was never set up. */
    ret = ff_mdct_init(&s->imdct_ctx, 8, 1, 1.0);
    if (ret < 0)
        return ret;

    s->fdsp = avpriv_float_dsp_alloc(avctx->flags & AV_CODEC_FLAG_BITEXACT);
    if (!s->fdsp) {
        /* Release the transform initialised above so a failed init does not
         * leave it allocated.
         * NOTE(review): assumes decode_end() is not invoked after a failed
         * init for this codec -- confirm against avcodec_open2(). */
        ff_mdct_end(&s->imdct_ctx);
        return AVERROR(ENOMEM);
    }

    s->scale_bias = 1.0/(32768*8);
    avctx->sample_fmt = AV_SAMPLE_FMT_FLT;

    /* Generate overlap window (only if the last entry is still zero, i.e.
     * the table has not been filled in yet) */
    if (!ff_sine_128[127])
        ff_init_ff_sine_windows(7);

    avctx->channels       = 1;
    avctx->channel_layout = AV_CH_LAYOUT_MONO;

    return 0;
}

141 142 143
/**
 * Decode one packet made of whole NELLY_BLOCK_LEN-byte blocks.
 *
 * Every block yields NELLY_SAMPLES float samples, written back to back into
 * the output frame. Trailing bytes that do not form a full block are reported
 * with a warning and ignored.
 *
 * @param avctx         codec context
 * @param data          output AVFrame
 * @param got_frame_ptr set to 1 once a frame has been produced
 * @param avpkt         input packet
 * @return the packet size on success, a negative error code on failure
 */
static int decode_tag(AVCodecContext *avctx, void *data,
                      int *got_frame_ptr, AVPacket *avpkt)
{
    AVFrame *frame     = data;
    const uint8_t *buf = avpkt->data;
    /* NOTE(review): 'F' side data looks like a flags byte supplied by the
     * demuxer -- confirm where it is produced. */
    const uint8_t *side=av_packet_get_side_data(avpkt, 'F', NULL);
    int buf_size = avpkt->size;
    NellyMoserDecodeContext *s = avctx->priv_data;
    int blocks, i, ret;
    float   *samples_flt;

    blocks     = buf_size / NELLY_BLOCK_LEN;

    if (blocks <= 0) {
        av_log(avctx, AV_LOG_ERROR, "Packet is too small\n");
        return AVERROR_INVALIDDATA;
    }

    /* NELLY_SAMPLES * blocks below is an int computation driven by the
     * packet size; reject packets for which it would overflow instead of
     * requesting a buffer that is too small for the decode loop. */
    if (blocks > INT_MAX / NELLY_SAMPLES) {
        av_log(avctx, AV_LOG_ERROR, "Packet is too large\n");
        return AVERROR_INVALIDDATA;
    }

    if (buf_size % NELLY_BLOCK_LEN) {
        av_log(avctx, AV_LOG_WARNING, "Leftover bytes: %d.\n",
               buf_size % NELLY_BLOCK_LEN);
    }
    /* Normal numbers of blocks for sample rates:
     *  8000 Hz - 1
     * 11025 Hz - 2
     * 16000 Hz - 3
     * 22050 Hz - 4
     * 44100 Hz - 8
     */
    /* When bits 2-3 of the side data byte agree with the block count, derive
     * the sample rate from the block count (11025-family rates only). */
    if(side && blocks>1 && avctx->sample_rate%11025==0 && (1<<((side[0]>>2)&3)) == blocks)
        avctx->sample_rate= 11025*(blocks/2);

    /* get output buffer */
    frame->nb_samples = NELLY_SAMPLES * blocks;
    if ((ret = ff_get_buffer(avctx, frame, 0)) < 0)
        return ret;
    samples_flt = (float *)frame->data[0];

    for (i=0 ; i<blocks ; i++) {
        nelly_decode_block(s, buf, samples_flt);
        samples_flt += NELLY_SAMPLES;
        buf += NELLY_BLOCK_LEN;
    }

    *got_frame_ptr = 1;

    return buf_size;
}

190
/**
 * Tear down the decoder: free the float DSP context and the IMDCT context.
 *
 * @param avctx codec context; its priv_data is the NellyMoserDecodeContext
 * @return always 0
 */
static av_cold int decode_end(AVCodecContext *avctx)
{
    NellyMoserDecodeContext *ctx = avctx->priv_data;

    av_freep(&ctx->fdsp);
    ff_mdct_end(&ctx->imdct_ctx);

    return 0;
}

199
AVCodec ff_nellymoser_decoder = {
200
    .name           = "nellymoser",
201
    .long_name      = NULL_IF_CONFIG_SMALL("Nellymoser Asao"),
202
    .type           = AVMEDIA_TYPE_AUDIO,
203
    .id             = AV_CODEC_ID_NELLYMOSER,
204 205 206 207
    .priv_data_size = sizeof(NellyMoserDecodeContext),
    .init           = decode_init,
    .close          = decode_end,
    .decode         = decode_tag,
208
    .capabilities   = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_PARAM_CHANGE,
209 210
    .sample_fmts    = (const enum AVSampleFormat[]) { AV_SAMPLE_FMT_FLT,
                                                      AV_SAMPLE_FMT_NONE },
211
};