mpegaudiodec.c 80 KB
Newer Older
Fabrice Bellard's avatar
Fabrice Bellard committed
1 2
/*
 * MPEG Audio decoder
3
 * Copyright (c) 2001, 2002 Fabrice Bellard.
Fabrice Bellard's avatar
Fabrice Bellard committed
4
 *
5 6 7
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
8 9
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
10
 * version 2.1 of the License, or (at your option) any later version.
Fabrice Bellard's avatar
Fabrice Bellard committed
11
 *
12
 * FFmpeg is distributed in the hope that it will be useful,
Fabrice Bellard's avatar
Fabrice Bellard committed
13
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 15
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
Fabrice Bellard's avatar
Fabrice Bellard committed
16
 *
17
 * You should have received a copy of the GNU Lesser General Public
18
 * License along with FFmpeg; if not, write to the Free Software
19
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
Fabrice Bellard's avatar
Fabrice Bellard committed
20
 */
Michael Niedermayer's avatar
Michael Niedermayer committed
21 22 23 24

/**
 * @file mpegaudiodec.c
 * MPEG Audio decoder.
25
 */
Michael Niedermayer's avatar
Michael Niedermayer committed
26

27
//#define DEBUG
Fabrice Bellard's avatar
Fabrice Bellard committed
28
#include "avcodec.h"
29
#include "bitstream.h"
30
#include "dsputil.h"
Fabrice Bellard's avatar
Fabrice Bellard committed
31 32

/*
33 34 35
 * TODO:
 *  - in low precision mode, use more 16 bit multiplies in synth filter
 *  - test lsf / mpeg25 extensively.
Fabrice Bellard's avatar
Fabrice Bellard committed
36 37
 */

38 39
/* define USE_HIGHPRECISION to have a bit exact (but slower) mpeg
   audio decoder */
40
#ifdef CONFIG_MPEGAUDIO_HP
41
#   define USE_HIGHPRECISION
42
#endif
43

Roberto Togni's avatar
Roberto Togni committed
44
#include "mpegaudio.h"
45
#include "mpegaudiodecheader.h"
46

Luca Barbato's avatar
Luca Barbato committed
47 48
#include "mathops.h"

49 50 51 52
/* WARNING: only correct for posititive numbers */
#define FIXR(a)   ((int)((a) * FRAC_ONE + 0.5))
#define FRAC_RND(a) (((a) + (FRAC_ONE/2)) >> FRAC_BITS)

53 54
#define FIXHR(a) ((int)((a) * (1LL<<32) + 0.5))

55 56
/****************/

Fabrice Bellard's avatar
Fabrice Bellard committed
57 58
#define HEADER_SIZE 4

59 60
/* layer 3 "granule" */
typedef struct GranuleDef {
61
    uint8_t scfsi;
62 63 64 65
    int part2_3_length;
    int big_values;
    int global_gain;
    int scalefac_compress;
66 67
    uint8_t block_type;
    uint8_t switch_point;
68 69
    int table_select[3];
    int subblock_gain[3];
70 71
    uint8_t scalefac_scale;
    uint8_t count1table_select;
72 73 74
    int region_size[3]; /* number of huffman codes in each region */
    int preflag;
    int short_start, long_end; /* long/short band indexes */
75 76
    uint8_t scale_factors[40];
    int32_t sb_hybrid[SBLIMIT * 18]; /* 576 samples */
77
} GranuleDef;
Fabrice Bellard's avatar
Fabrice Bellard committed
78

79
#include "mpegaudiodata.h"
80 81
#include "mpegaudiodectab.h"

82 83 84
static void compute_antialias_integer(MPADecodeContext *s, GranuleDef *g);
static void compute_antialias_float(MPADecodeContext *s, GranuleDef *g);

85
/* vlc structure for decoding layer 3 huffman tables */
86
static VLC huff_vlc[16];
87 88
static VLC huff_quad_vlc[2];
/* computed from band_size_long */
89
static uint16_t band_index_long[9][23];
90
/* XXX: free when all decoders are closed */
91
#define TABLE_4_3_SIZE (8191 + 16)*4
92 93
static int8_t  table_4_3_exp[TABLE_4_3_SIZE];
static uint32_t table_4_3_value[TABLE_4_3_SIZE];
94
static uint32_t exp_table[512];
95
static uint32_t expval_table[512][16];
96
/* intensity stereo coef table */
97 98
static int32_t is_table[2][16];
static int32_t is_table_lsf[2][2][16];
99 100
static int32_t csa_table[8][4];
static float csa_table_float[8][4];
101
static int32_t mdct_win[8][36];
102 103

/* lower 2 bits: modulo 3, higher bits: shift */
104
static uint16_t scale_factor_modshift[64];
105
/* [i][j]:  2^(-j/3) * FRAC_ONE * 2^(i+2) / (2^(i+2) - 1) */
106
static int32_t scale_factor_mult[15][3];
107 108 109 110 111
/* mult table for layer 2 group quantization */

#define SCALE_GEN(v) \
{ FIXR(1.0 * (v)), FIXR(0.7937005259 * (v)), FIXR(0.6299605249 * (v)) }

Michael Niedermayer's avatar
Michael Niedermayer committed
112
static const int32_t scale_factor_mult2[3][3] = {
113 114 115
    SCALE_GEN(4.0 / 3.0), /* 3 steps */
    SCALE_GEN(4.0 / 5.0), /* 5 steps */
    SCALE_GEN(4.0 / 9.0), /* 9 steps */
116 117
};

118
static DECLARE_ALIGNED_16(MPA_INT, window[512]);
119

120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181
/**
 * Convert region offsets to region sizes and truncate
 * size to big_values.
 */
void ff_region_offset2size(GranuleDef *g){
    int i, k, j=0;
    g->region_size[2] = (576 / 2);
    for(i=0;i<3;i++) {
        k = FFMIN(g->region_size[i], g->big_values);
        g->region_size[i] = k - j;
        j = k;
    }
}

void ff_init_short_region(MPADecodeContext *s, GranuleDef *g){
    if (g->block_type == 2)
        g->region_size[0] = (36 / 2);
    else {
        if (s->sample_rate_index <= 2)
            g->region_size[0] = (36 / 2);
        else if (s->sample_rate_index != 8)
            g->region_size[0] = (54 / 2);
        else
            g->region_size[0] = (108 / 2);
    }
    g->region_size[1] = (576 / 2);
}

void ff_init_long_region(MPADecodeContext *s, GranuleDef *g, int ra1, int ra2){
    int l;
    g->region_size[0] =
        band_index_long[s->sample_rate_index][ra1 + 1] >> 1;
    /* should not overflow */
    l = FFMIN(ra1 + ra2 + 2, 22);
    g->region_size[1] =
        band_index_long[s->sample_rate_index][l] >> 1;
}

void ff_compute_band_indexes(MPADecodeContext *s, GranuleDef *g){
    if (g->block_type == 2) {
        if (g->switch_point) {
            /* if switched mode, we handle the 36 first samples as
                long blocks.  For 8000Hz, we handle the 48 first
                exponents as long blocks (XXX: check this!) */
            if (s->sample_rate_index <= 2)
                g->long_end = 8;
            else if (s->sample_rate_index != 8)
                g->long_end = 6;
            else
                g->long_end = 4; /* 8000 Hz */

            g->short_start = 2 + (s->sample_rate_index != 8);
        } else {
            g->long_end = 0;
            g->short_start = 0;
        }
    } else {
        g->short_start = 13;
        g->long_end = 22;
    }
}

182 183 184 185 186
/* layer 1 unscaling */
/* n = number of bits of the mantissa minus 1 */
static inline int l1_unscale(int n, int mant, int scale_factor)
{
    int shift, mod;
187
    int64_t val;
188 189 190 191 192 193

    shift = scale_factor_modshift[scale_factor];
    mod = shift & 3;
    shift >>= 2;
    val = MUL64(mant + (-1 << n) + 1, scale_factor_mult[n-1][mod]);
    shift += n;
194 195
    /* NOTE: at this point, 1 <= shift >= 21 + 15 */
    return (int)((val + (1LL << (shift - 1))) >> shift);
196 197 198 199 200 201 202 203 204
}

static inline int l2_unscale_group(int steps, int mant, int scale_factor)
{
    int shift, mod, val;

    shift = scale_factor_modshift[scale_factor];
    mod = shift & 3;
    shift >>= 2;
205 206 207 208 209 210

    val = (mant - (steps >> 1)) * scale_factor_mult2[steps >> 2][mod];
    /* NOTE: at this point, 0 <= shift <= 21 */
    if (shift > 0)
        val = (val + (1 << (shift - 1))) >> shift;
    return val;
211 212 213 214 215 216 217 218
}

/* compute value^(4/3) * 2^(exponent/4). It normalized to FRAC_BITS */
static inline int l3_unscale(int value, int exponent)
{
    unsigned int m;
    int e;

219 220 221 222
    e = table_4_3_exp  [4*value + (exponent&3)];
    m = table_4_3_value[4*value + (exponent&3)];
    e -= (exponent >> 2);
    assert(e>=1);
223
    if (e > 31)
224
        return 0;
225
    m = (m + (1 << (e-1))) >> e;
226

227 228 229
    return m;
}

230 231 232 233 234 235
/* all integer n^(4/3) computation code */
#define DEV_ORDER 13

#define POW_FRAC_BITS 24
#define POW_FRAC_ONE    (1 << POW_FRAC_BITS)
#define POW_FIX(a)   ((int)((a) * POW_FRAC_ONE))
236
#define POW_MULL(a,b) (((int64_t)(a) * (int64_t)(b)) >> POW_FRAC_BITS)
237 238 239

static int dev_4_3_coefs[DEV_ORDER];

240
#if 0 /* unused */
241 242 243 244 245
static int pow_mult3[3] = {
    POW_FIX(1.0),
    POW_FIX(1.25992104989487316476),
    POW_FIX(1.58740105196819947474),
};
246
#endif
247 248 249 250 251 252 253 254 255 256 257 258

static void int_pow_init(void)
{
    int i, a;

    a = POW_FIX(1.0);
    for(i=0;i<DEV_ORDER;i++) {
        a = POW_MULL(a, POW_FIX(4.0 / 3.0) - i * POW_FIX(1.0)) / (i + 1);
        dev_4_3_coefs[i] = a;
    }
}

259
#if 0 /* unused, remove? */
260 261 262 263 264
/* return the mantissa and the binary exponent */
static int int_pow(int i, int *exp_ptr)
{
    int e, er, eq, j;
    int a, a1;
265

266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291
    /* renormalize */
    a = i;
    e = POW_FRAC_BITS;
    while (a < (1 << (POW_FRAC_BITS - 1))) {
        a = a << 1;
        e--;
    }
    a -= (1 << POW_FRAC_BITS);
    a1 = 0;
    for(j = DEV_ORDER - 1; j >= 0; j--)
        a1 = POW_MULL(a, dev_4_3_coefs[j] + a1);
    a = (1 << POW_FRAC_BITS) + a1;
    /* exponent compute (exact) */
    e = e * 4;
    er = e % 3;
    eq = e / 3;
    a = POW_MULL(a, pow_mult3[er]);
    while (a >= 2 * POW_FRAC_ONE) {
        a = a >> 1;
        eq++;
    }
    /* convert to float */
    while (a < POW_FRAC_ONE) {
        a = a << 1;
        eq--;
    }
292
    /* now POW_FRAC_ONE <= a < 2 * POW_FRAC_ONE */
293
#if POW_FRAC_BITS > FRAC_BITS
294 295 296 297 298 299 300
    a = (a + (1 << (POW_FRAC_BITS - FRAC_BITS - 1))) >> (POW_FRAC_BITS - FRAC_BITS);
    /* correct overflow */
    if (a >= 2 * (1 << FRAC_BITS)) {
        a = a >> 1;
        eq++;
    }
#endif
301 302 303
    *exp_ptr = eq;
    return a;
}
304
#endif
Fabrice Bellard's avatar
Fabrice Bellard committed
305 306 307 308

static int decode_init(AVCodecContext * avctx)
{
    MPADecodeContext *s = avctx->priv_data;
309
    static int init=0;
310
    int i, j, k;
Fabrice Bellard's avatar
Fabrice Bellard committed
311

312 313
    s->avctx = avctx;

314
#if defined(USE_HIGHPRECISION) && defined(CONFIG_AUDIO_NONSHORT)
315 316 317
    avctx->sample_fmt= SAMPLE_FMT_S32;
#else
    avctx->sample_fmt= SAMPLE_FMT_S16;
318
#endif
319
    s->error_resilience= avctx->error_resilience;
320

Michael Niedermayer's avatar
Michael Niedermayer committed
321
    if(avctx->antialias_algo != FF_AA_FLOAT)
Michael Niedermayer's avatar
Michael Niedermayer committed
322 323 324 325
        s->compute_antialias= compute_antialias_integer;
    else
        s->compute_antialias= compute_antialias_float;

326
    if (!init && !avctx->parse_only) {
327 328 329 330
        /* scale factors table for layer 1/2 */
        for(i=0;i<64;i++) {
            int shift, mod;
            /* 1.0 (i = 3) is normalized to 2 ^ FRAC_BITS */
331
            shift = (i / 3);
332 333 334 335 336 337 338 339
            mod = i % 3;
            scale_factor_modshift[i] = mod | (shift << 2);
        }

        /* scale factor multiply for layer 1 */
        for(i=0;i<15;i++) {
            int n, norm;
            n = i + 2;
340
            norm = ((INT64_C(1) << n) * FRAC_ONE) / ((1 << n) - 1);
341 342 343
            scale_factor_mult[i][0] = MULL(FIXR(1.0 * 2.0), norm);
            scale_factor_mult[i][1] = MULL(FIXR(0.7937005259 * 2.0), norm);
            scale_factor_mult[i][2] = MULL(FIXR(0.6299605249 * 2.0), norm);
344
            dprintf(avctx, "%d: norm=%x s=%x %x %x\n",
345
                    i, norm,
346 347 348 349
                    scale_factor_mult[i][0],
                    scale_factor_mult[i][1],
                    scale_factor_mult[i][2]);
        }
350

351
        ff_mpa_synth_init(window);
352

353 354 355
        /* huffman decode tables */
        for(i=1;i<16;i++) {
            const HuffTable *h = &mpa_huff_tables[i];
356
            int xsize, x, y;
357
            unsigned int n;
Michael Niedermayer's avatar
Michael Niedermayer committed
358 359
            uint8_t  tmp_bits [512];
            uint16_t tmp_codes[512];
Michael Niedermayer's avatar
Michael Niedermayer committed
360 361 362

            memset(tmp_bits , 0, sizeof(tmp_bits ));
            memset(tmp_codes, 0, sizeof(tmp_codes));
363 364 365

            xsize = h->xsize;
            n = xsize * xsize;
366

367 368
            j = 0;
            for(x=0;x<xsize;x++) {
Michael Niedermayer's avatar
Michael Niedermayer committed
369
                for(y=0;y<xsize;y++){
Michael Niedermayer's avatar
Michael Niedermayer committed
370 371
                    tmp_bits [(x << 5) | y | ((x&&y)<<4)]= h->bits [j  ];
                    tmp_codes[(x << 5) | y | ((x&&y)<<4)]= h->codes[j++];
Michael Niedermayer's avatar
Michael Niedermayer committed
372
                }
373
            }
Michael Niedermayer's avatar
Michael Niedermayer committed
374 375

            /* XXX: fail test */
Michael Niedermayer's avatar
Michael Niedermayer committed
376
            init_vlc(&huff_vlc[i], 7, 512,
Michael Niedermayer's avatar
Michael Niedermayer committed
377
                     tmp_bits, 1, 1, tmp_codes, 2, 2, 1);
378 379
        }
        for(i=0;i<2;i++) {
380
            init_vlc(&huff_quad_vlc[i], i == 0 ? 7 : 4, 16,
381
                     mpa_quad_bits[i], 1, 1, mpa_quad_codes[i], 1, 1, 1);
382 383 384 385 386 387 388 389 390 391 392
        }

        for(i=0;i<9;i++) {
            k = 0;
            for(j=0;j<22;j++) {
                band_index_long[i][j] = k;
                k += band_size_long[i][j];
            }
            band_index_long[i][22] = k;
        }

393
        /* compute n ^ (4/3) and store it in mantissa/exp format */
394

395
        int_pow_init();
396
        for(i=1;i<TABLE_4_3_SIZE;i++) {
397
            double f, fm;
398
            int e, m;
399 400
            f = pow((double)(i/4), 4.0 / 3.0) * pow(2, (i&3)*0.25);
            fm = frexp(f, &e);
401
            m = (uint32_t)(fm*(1LL<<31) + 0.5);
402
            e+= FRAC_BITS - 31 + 5 - 100;
403

404 405
            /* normalized to FRAC_BITS */
            table_4_3_value[i] = m;
406 407
//            av_log(NULL, AV_LOG_DEBUG, "%d %d %f\n", i, m, pow((double)i, 4.0 / 3.0));
            table_4_3_exp[i] = -e;
408
        }
409
        for(i=0; i<512*16; i++){
410 411
            int exponent= (i>>4);
            double f= pow(i&15, 4.0 / 3.0) * pow(2, (exponent-400)*0.25 + FRAC_BITS + 5);
412
            expval_table[exponent][i&15]= llrint(f);
413
            if((i&15)==1)
414
                exp_table[exponent]= llrint(f);
415
        }
416

417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442
        for(i=0;i<7;i++) {
            float f;
            int v;
            if (i != 6) {
                f = tan((double)i * M_PI / 12.0);
                v = FIXR(f / (1.0 + f));
            } else {
                v = FIXR(1.0);
            }
            is_table[0][i] = v;
            is_table[1][6 - i] = v;
        }
        /* invalid values */
        for(i=7;i<16;i++)
            is_table[0][i] = is_table[1][i] = 0.0;

        for(i=0;i<16;i++) {
            double f;
            int e, k;

            for(j=0;j<2;j++) {
                e = -(j + 1) * ((i + 1) >> 1);
                f = pow(2.0, e / 4.0);
                k = i & 1;
                is_table_lsf[j][k ^ 1][i] = FIXR(f);
                is_table_lsf[j][k][i] = FIXR(1.0);
443
                dprintf(avctx, "is_table_lsf %d %d: %x %x\n",
444 445 446 447 448 449 450 451 452
                        i, j, is_table_lsf[j][0][i], is_table_lsf[j][1][i]);
            }
        }

        for(i=0;i<8;i++) {
            float ci, cs, ca;
            ci = ci_table[i];
            cs = 1.0 / sqrt(1.0 + ci * ci);
            ca = cs * ci;
Michael Niedermayer's avatar
Michael Niedermayer committed
453 454 455
            csa_table[i][0] = FIXHR(cs/4);
            csa_table[i][1] = FIXHR(ca/4);
            csa_table[i][2] = FIXHR(ca/4) + FIXHR(cs/4);
456
            csa_table[i][3] = FIXHR(ca/4) - FIXHR(cs/4);
457 458 459
            csa_table_float[i][0] = cs;
            csa_table_float[i][1] = ca;
            csa_table_float[i][2] = ca + cs;
460
            csa_table_float[i][3] = ca - cs;
461
//            printf("%d %d %d %d\n", FIX(cs), FIX(cs-1), FIX(ca), FIX(cs)-FIX(ca));
462
//            av_log(NULL, AV_LOG_DEBUG,"%f %f %f %f\n", cs, ca, ca+cs, ca-cs);
463 464 465 466
        }

        /* compute mdct windows */
        for(i=0;i<36;i++) {
467 468
            for(j=0; j<4; j++){
                double d;
469

Michael Niedermayer's avatar
Michael Niedermayer committed
470 471
                if(j==2 && i%3 != 1)
                    continue;
472

473 474 475 476 477 478 479 480 481 482 483
                d= sin(M_PI * (i + 0.5) / 36.0);
                if(j==1){
                    if     (i>=30) d= 0;
                    else if(i>=24) d= sin(M_PI * (i - 18 + 0.5) / 12.0);
                    else if(i>=18) d= 1;
                }else if(j==3){
                    if     (i<  6) d= 0;
                    else if(i< 12) d= sin(M_PI * (i -  6 + 0.5) / 12.0);
                    else if(i< 18) d= 1;
                }
                //merge last stage of imdct into the window coefficients
Michael Niedermayer's avatar
Michael Niedermayer committed
484 485 486 487 488 489
                d*= 0.5 / cos(M_PI*(2*i + 19)/72);

                if(j==2)
                    mdct_win[j][i/3] = FIXHR((d / (1<<5)));
                else
                    mdct_win[j][i  ] = FIXHR((d / (1<<5)));
490 491
//                av_log(NULL, AV_LOG_DEBUG, "%2d %d %f\n", i,j,d / (1<<5));
            }
492 493 494 495 496 497 498 499 500 501 502 503 504
        }

        /* NOTE: we do frequency inversion adter the MDCT by changing
           the sign of the right window coefs */
        for(j=0;j<4;j++) {
            for(i=0;i<36;i+=2) {
                mdct_win[j + 4][i] = mdct_win[j][i];
                mdct_win[j + 4][i + 1] = -mdct_win[j][i + 1];
            }
        }

#if defined(DEBUG)
        for(j=0;j<8;j++) {
505
            av_log(avctx, AV_LOG_DEBUG, "win%d=\n", j);
506
            for(i=0;i<36;i++)
507 508
                av_log(avctx, AV_LOG_DEBUG, "%f, ", (double)mdct_win[j][i] / FRAC_ONE);
            av_log(avctx, AV_LOG_DEBUG, "\n");
509 510
        }
#endif
Fabrice Bellard's avatar
Fabrice Bellard committed
511 512 513
        init = 1;
    }

514 515 516
#ifdef DEBUG
    s->frame_count = 0;
#endif
Roberto Togni's avatar
Roberto Togni committed
517 518
    if (avctx->codec_id == CODEC_ID_MP3ADU)
        s->adu_mode = 1;
Fabrice Bellard's avatar
Fabrice Bellard committed
519 520 521
    return 0;
}

522
/* tab[i][j] = 1.0 / (2.0 * cos(pi*(2*k+1) / 2^(6 - j))) */
523 524 525

/* cos(i*pi/64) */

526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560
#define COS0_0  FIXHR(0.50060299823519630134/2)
#define COS0_1  FIXHR(0.50547095989754365998/2)
#define COS0_2  FIXHR(0.51544730992262454697/2)
#define COS0_3  FIXHR(0.53104259108978417447/2)
#define COS0_4  FIXHR(0.55310389603444452782/2)
#define COS0_5  FIXHR(0.58293496820613387367/2)
#define COS0_6  FIXHR(0.62250412303566481615/2)
#define COS0_7  FIXHR(0.67480834145500574602/2)
#define COS0_8  FIXHR(0.74453627100229844977/2)
#define COS0_9  FIXHR(0.83934964541552703873/2)
#define COS0_10 FIXHR(0.97256823786196069369/2)
#define COS0_11 FIXHR(1.16943993343288495515/4)
#define COS0_12 FIXHR(1.48416461631416627724/4)
#define COS0_13 FIXHR(2.05778100995341155085/8)
#define COS0_14 FIXHR(3.40760841846871878570/8)
#define COS0_15 FIXHR(10.19000812354805681150/32)

#define COS1_0 FIXHR(0.50241928618815570551/2)
#define COS1_1 FIXHR(0.52249861493968888062/2)
#define COS1_2 FIXHR(0.56694403481635770368/2)
#define COS1_3 FIXHR(0.64682178335999012954/2)
#define COS1_4 FIXHR(0.78815462345125022473/2)
#define COS1_5 FIXHR(1.06067768599034747134/4)
#define COS1_6 FIXHR(1.72244709823833392782/4)
#define COS1_7 FIXHR(5.10114861868916385802/16)

#define COS2_0 FIXHR(0.50979557910415916894/2)
#define COS2_1 FIXHR(0.60134488693504528054/2)
#define COS2_2 FIXHR(0.89997622313641570463/2)
#define COS2_3 FIXHR(2.56291544774150617881/8)

#define COS3_0 FIXHR(0.54119610014619698439/2)
#define COS3_1 FIXHR(1.30656296487637652785/4)

#define COS4_0 FIXHR(0.70710678118654752439/2)
561 562

/* butterfly operator */
563
#define BF(a, b, c, s)\
564 565 566 567
{\
    tmp0 = tab[a] + tab[b];\
    tmp1 = tab[a] - tab[b];\
    tab[a] = tmp0;\
568
    tab[b] = MULH(tmp1<<(s), c);\
569 570 571 572
}

#define BF1(a, b, c, d)\
{\
573 574
    BF(a, b, COS4_0, 1);\
    BF(c, d,-COS4_0, 1);\
575 576 577 578 579
    tab[c] += tab[d];\
}

#define BF2(a, b, c, d)\
{\
580 581
    BF(a, b, COS4_0, 1);\
    BF(c, d,-COS4_0, 1);\
582 583 584 585 586 587 588 589 590
    tab[c] += tab[d];\
    tab[a] += tab[c];\
    tab[c] += tab[b];\
    tab[b] += tab[d];\
}

#define ADD(a, b) tab[a] += tab[b]

/* DCT32 without 1/sqrt(2) coef zero scaling. */
591
static void dct32(int32_t *out, int32_t *tab)
592 593 594 595
{
    int tmp0, tmp1;

    /* pass 1 */
596 597
    BF( 0, 31, COS0_0 , 1);
    BF(15, 16, COS0_15, 5);
598
    /* pass 2 */
599 600
    BF( 0, 15, COS1_0 , 1);
    BF(16, 31,-COS1_0 , 1);
601
    /* pass 1 */
602 603
    BF( 7, 24, COS0_7 , 1);
    BF( 8, 23, COS0_8 , 1);
604
    /* pass 2 */
605 606
    BF( 7,  8, COS1_7 , 4);
    BF(23, 24,-COS1_7 , 4);
607
    /* pass 3 */
608 609 610 611
    BF( 0,  7, COS2_0 , 1);
    BF( 8, 15,-COS2_0 , 1);
    BF(16, 23, COS2_0 , 1);
    BF(24, 31,-COS2_0 , 1);
612
    /* pass 1 */
613 614
    BF( 3, 28, COS0_3 , 1);
    BF(12, 19, COS0_12, 2);
615
    /* pass 2 */
616 617
    BF( 3, 12, COS1_3 , 1);
    BF(19, 28,-COS1_3 , 1);
618
    /* pass 1 */
619 620
    BF( 4, 27, COS0_4 , 1);
    BF(11, 20, COS0_11, 2);
621
    /* pass 2 */
622 623
    BF( 4, 11, COS1_4 , 1);
    BF(20, 27,-COS1_4 , 1);
624
    /* pass 3 */
625 626 627 628
    BF( 3,  4, COS2_3 , 3);
    BF(11, 12,-COS2_3 , 3);
    BF(19, 20, COS2_3 , 3);
    BF(27, 28,-COS2_3 , 3);
629
    /* pass 4 */
630 631 632 633 634 635 636 637
    BF( 0,  3, COS3_0 , 1);
    BF( 4,  7,-COS3_0 , 1);
    BF( 8, 11, COS3_0 , 1);
    BF(12, 15,-COS3_0 , 1);
    BF(16, 19, COS3_0 , 1);
    BF(20, 23,-COS3_0 , 1);
    BF(24, 27, COS3_0 , 1);
    BF(28, 31,-COS3_0 , 1);
638

639 640 641


    /* pass 1 */
642 643
    BF( 1, 30, COS0_1 , 1);
    BF(14, 17, COS0_14, 3);
644
    /* pass 2 */
645 646
    BF( 1, 14, COS1_1 , 1);
    BF(17, 30,-COS1_1 , 1);
647
    /* pass 1 */
648 649
    BF( 6, 25, COS0_6 , 1);
    BF( 9, 22, COS0_9 , 1);
650
    /* pass 2 */
651 652
    BF( 6,  9, COS1_6 , 2);
    BF(22, 25,-COS1_6 , 2);
653
    /* pass 3 */
654 655 656 657
    BF( 1,  6, COS2_1 , 1);
    BF( 9, 14,-COS2_1 , 1);
    BF(17, 22, COS2_1 , 1);
    BF(25, 30,-COS2_1 , 1);
658

659
    /* pass 1 */
660 661
    BF( 2, 29, COS0_2 , 1);
    BF(13, 18, COS0_13, 3);
662
    /* pass 2 */
663 664
    BF( 2, 13, COS1_2 , 1);
    BF(18, 29,-COS1_2 , 1);
665
    /* pass 1 */
666 667
    BF( 5, 26, COS0_5 , 1);
    BF(10, 21, COS0_10, 1);
668
    /* pass 2 */
669 670
    BF( 5, 10, COS1_5 , 2);
    BF(21, 26,-COS1_5 , 2);
671
    /* pass 3 */
672 673 674 675
    BF( 2,  5, COS2_2 , 1);
    BF(10, 13,-COS2_2 , 1);
    BF(18, 21, COS2_2 , 1);
    BF(26, 29,-COS2_2 , 1);
676
    /* pass 4 */
677 678 679 680 681 682 683 684
    BF( 1,  2, COS3_1 , 2);
    BF( 5,  6,-COS3_1 , 2);
    BF( 9, 10, COS3_1 , 2);
    BF(13, 14,-COS3_1 , 2);
    BF(17, 18, COS3_1 , 2);
    BF(21, 22,-COS3_1 , 2);
    BF(25, 26, COS3_1 , 2);
    BF(29, 30,-COS3_1 , 2);
685

686
    /* pass 5 */
687 688 689
    BF1( 0,  1,  2,  3);
    BF2( 4,  5,  6,  7);
    BF1( 8,  9, 10, 11);
690 691 692 693 694
    BF2(12, 13, 14, 15);
    BF1(16, 17, 18, 19);
    BF2(20, 21, 22, 23);
    BF1(24, 25, 26, 27);
    BF2(28, 29, 30, 31);
695

696
    /* pass 6 */
697

698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721
    ADD( 8, 12);
    ADD(12, 10);
    ADD(10, 14);
    ADD(14,  9);
    ADD( 9, 13);
    ADD(13, 11);
    ADD(11, 15);

    out[ 0] = tab[0];
    out[16] = tab[1];
    out[ 8] = tab[2];
    out[24] = tab[3];
    out[ 4] = tab[4];
    out[20] = tab[5];
    out[12] = tab[6];
    out[28] = tab[7];
    out[ 2] = tab[8];
    out[18] = tab[9];
    out[10] = tab[10];
    out[26] = tab[11];
    out[ 6] = tab[12];
    out[22] = tab[13];
    out[14] = tab[14];
    out[30] = tab[15];
722

723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750
    ADD(24, 28);
    ADD(28, 26);
    ADD(26, 30);
    ADD(30, 25);
    ADD(25, 29);
    ADD(29, 27);
    ADD(27, 31);

    out[ 1] = tab[16] + tab[24];
    out[17] = tab[17] + tab[25];
    out[ 9] = tab[18] + tab[26];
    out[25] = tab[19] + tab[27];
    out[ 5] = tab[20] + tab[28];
    out[21] = tab[21] + tab[29];
    out[13] = tab[22] + tab[30];
    out[29] = tab[23] + tab[31];
    out[ 3] = tab[24] + tab[20];
    out[19] = tab[25] + tab[21];
    out[11] = tab[26] + tab[22];
    out[27] = tab[27] + tab[23];
    out[ 7] = tab[28] + tab[18];
    out[23] = tab[29] + tab[19];
    out[15] = tab[30] + tab[17];
    out[31] = tab[31];
}

#if FRAC_BITS <= 15

751
static inline int round_sample(int *sum)
752 753
{
    int sum1;
754 755
    sum1 = (*sum) >> OUT_SHIFT;
    *sum &= (1<<OUT_SHIFT)-1;
756 757 758 759
    if (sum1 < OUT_MIN)
        sum1 = OUT_MIN;
    else if (sum1 > OUT_MAX)
        sum1 = OUT_MAX;
760
    return sum1;
761 762
}

Luca Barbato's avatar
Luca Barbato committed
763 764
/* signed 16x16 -> 32 multiply add accumulate */
#define MACS(rt, ra, rb) MAC16(rt, ra, rb)
Siarhei Siamashka's avatar
Siarhei Siamashka committed
765

Luca Barbato's avatar
Luca Barbato committed
766 767
/* signed 16x16 -> 32 multiply */
#define MULS(ra, rb) MUL16(ra, rb)
768

769 770
#else

771
static inline int round_sample(int64_t *sum)
772 773
{
    int sum1;
774 775
    sum1 = (int)((*sum) >> OUT_SHIFT);
    *sum &= (1<<OUT_SHIFT)-1;
776 777 778 779
    if (sum1 < OUT_MIN)
        sum1 = OUT_MIN;
    else if (sum1 > OUT_MAX)
        sum1 = OUT_MAX;
780
    return sum1;
781 782
}

783
#   define MULS(ra, rb) MUL64(ra, rb)
784 785 786
#endif

#define SUM8(sum, op, w, p) \
787
{                                               \
788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824
    sum op MULS((w)[0 * 64], p[0 * 64]);\
    sum op MULS((w)[1 * 64], p[1 * 64]);\
    sum op MULS((w)[2 * 64], p[2 * 64]);\
    sum op MULS((w)[3 * 64], p[3 * 64]);\
    sum op MULS((w)[4 * 64], p[4 * 64]);\
    sum op MULS((w)[5 * 64], p[5 * 64]);\
    sum op MULS((w)[6 * 64], p[6 * 64]);\
    sum op MULS((w)[7 * 64], p[7 * 64]);\
}

#define SUM8P2(sum1, op1, sum2, op2, w1, w2, p) \
{                                               \
    int tmp;\
    tmp = p[0 * 64];\
    sum1 op1 MULS((w1)[0 * 64], tmp);\
    sum2 op2 MULS((w2)[0 * 64], tmp);\
    tmp = p[1 * 64];\
    sum1 op1 MULS((w1)[1 * 64], tmp);\
    sum2 op2 MULS((w2)[1 * 64], tmp);\
    tmp = p[2 * 64];\
    sum1 op1 MULS((w1)[2 * 64], tmp);\
    sum2 op2 MULS((w2)[2 * 64], tmp);\
    tmp = p[3 * 64];\
    sum1 op1 MULS((w1)[3 * 64], tmp);\
    sum2 op2 MULS((w2)[3 * 64], tmp);\
    tmp = p[4 * 64];\
    sum1 op1 MULS((w1)[4 * 64], tmp);\
    sum2 op2 MULS((w2)[4 * 64], tmp);\
    tmp = p[5 * 64];\
    sum1 op1 MULS((w1)[5 * 64], tmp);\
    sum2 op2 MULS((w2)[5 * 64], tmp);\
    tmp = p[6 * 64];\
    sum1 op1 MULS((w1)[6 * 64], tmp);\
    sum2 op2 MULS((w2)[6 * 64], tmp);\
    tmp = p[7 * 64];\
    sum1 op1 MULS((w1)[7 * 64], tmp);\
    sum2 op2 MULS((w2)[7 * 64], tmp);\
825 826
}

827 828 829 830 831 832 833
void ff_mpa_synth_init(MPA_INT *window)
{
    int i;

    /* max = 18760, max sum over all 16 coefs : 44736 */
    for(i=0;i<257;i++) {
        int v;
834
        v = ff_mpa_enwindow[i];
835 836 837 838 839 840 841 842
#if WFRAC_BITS < 16
        v = (v + (1 << (16 - WFRAC_BITS - 1))) >> (16 - WFRAC_BITS);
#endif
        window[i] = v;
        if ((i & 63) != 0)
            v = -v;
        if (i != 0)
            window[512 - i] = v;
843
    }
844
}
845 846 847 848

/* 32 sub band synthesis filter. Input: 32 sub band samples, Output:
   32 samples. */
/* XXX: optimize by avoiding ring buffer usage */
849
void ff_mpa_synth_filter(MPA_INT *synth_buf_ptr, int *synth_buf_offset,
850
                         MPA_INT *window, int *dither_state,
851
                         OUT_INT *samples, int incr,
852
                         int32_t sb_samples[SBLIMIT])
853
{
854
    int32_t tmp[32];
855
    register MPA_INT *synth_buf;
Alex Beregszaszi's avatar
Alex Beregszaszi committed
856
    register const MPA_INT *w, *w2, *p;
857
    int j, offset, v;
858
    OUT_INT *samples2;
859
#if FRAC_BITS <= 15
860
    int sum, sum2;
861
#else
862
    int64_t sum, sum2;
863
#endif
864

865
    dct32(tmp, sb_samples);
866

867 868
    offset = *synth_buf_offset;
    synth_buf = synth_buf_ptr + offset;
869 870 871 872

    for(j=0;j<32;j++) {
        v = tmp[j];
#if FRAC_BITS <= 15
873 874
        /* NOTE: can cause a loss in precision if very high amplitude
           sound */
875
        v = av_clip_int16(v);
876 877 878 879 880 881
#endif
        synth_buf[j] = v;
    }
    /* copy to avoid wrap */
    memcpy(synth_buf + 512, synth_buf, 32 * sizeof(MPA_INT));

882
    samples2 = samples + 31 * incr;
883
    w = window;
884 885
    w2 = window + 31;

886
    sum = *dither_state;
887 888 889 890
    p = synth_buf + 16;
    SUM8(sum, +=, w, p);
    p = synth_buf + 48;
    SUM8(sum, -=, w + 32, p);
891
    *samples = round_sample(&sum);
892
    samples += incr;
893 894
    w++;

895 896 897 898 899 900 901 902 903
    /* we calculate two samples at the same time to avoid one memory
       access per two sample */
    for(j=1;j<16;j++) {
        sum2 = 0;
        p = synth_buf + 16 + j;
        SUM8P2(sum, +=, sum2, -=, w, w2, p);
        p = synth_buf + 48 - j;
        SUM8P2(sum, -=, sum2, -=, w + 32, w2 + 32, p);

904
        *samples = round_sample(&sum);
905
        samples += incr;
906 907
        sum += sum2;
        *samples2 = round_sample(&sum);
908
        samples2 -= incr;
909
        w++;
910
        w2--;
911
    }
912

913 914
    p = synth_buf + 32;
    SUM8(sum, -=, w + 32, p);
915
    *samples = round_sample(&sum);
916
    *dither_state= sum;
917

918
    offset = (offset - 32) & 511;
919
    *synth_buf_offset = offset;
920 921
}

Michael Niedermayer's avatar
Michael Niedermayer committed
922 923 924 925 926 927 928 929 930 931 932 933 934 935
#define C3 FIXHR(0.86602540378443864676/2)

/* 0.5 / cos(pi*(2*i+1)/36) */
static const int icos36[9] = {
    FIXR(0.50190991877167369479),
    FIXR(0.51763809020504152469), //0
    FIXR(0.55168895948124587824),
    FIXR(0.61038729438072803416),
    FIXR(0.70710678118654752439), //1
    FIXR(0.87172339781054900991),
    FIXR(1.18310079157624925896),
    FIXR(1.93185165257813657349), //2
    FIXR(5.73685662283492756461),
};
936

937 938 939 940 941 942 943 944 945 946 947 948 949
/* 0.5 / cos(pi*(2*i+1)/36) */
static const int icos36h[9] = {
    FIXHR(0.50190991877167369479/2),
    FIXHR(0.51763809020504152469/2), //0
    FIXHR(0.55168895948124587824/2),
    FIXHR(0.61038729438072803416/2),
    FIXHR(0.70710678118654752439/2), //1
    FIXHR(0.87172339781054900991/2),
    FIXHR(1.18310079157624925896/4),
    FIXHR(1.93185165257813657349/4), //2
//    FIXHR(5.73685662283492756461),
};

950 951 952 953
/* 12 points IMDCT. We compute it "by hand" by factorizing obvious
   cases. */
static void imdct12(int *out, int *in)
{
Michael Niedermayer's avatar
Michael Niedermayer committed
954
    int in0, in1, in2, in3, in4, in5, t1, t2;
955 956 957 958 959 960 961

    in0= in[0*3];
    in1= in[1*3] + in[0*3];
    in2= in[2*3] + in[1*3];
    in3= in[3*3] + in[2*3];
    in4= in[4*3] + in[3*3];
    in5= in[5*3] + in[4*3];
Michael Niedermayer's avatar
Michael Niedermayer committed
962 963 964 965
    in5 += in3;
    in3 += in1;

    in2= MULH(2*in2, C3);
966
    in3= MULH(4*in3, C3);
967

Michael Niedermayer's avatar
Michael Niedermayer committed
968
    t1 = in0 - in4;
969
    t2 = MULH(2*(in1 - in5), icos36h[4]);
Michael Niedermayer's avatar
Michael Niedermayer committed
970

971
    out[ 7]=
Michael Niedermayer's avatar
Michael Niedermayer committed
972 973 974 975 976 977
    out[10]= t1 + t2;
    out[ 1]=
    out[ 4]= t1 - t2;

    in0 += in4>>1;
    in4 = in0 + in2;
978 979
    in5 += 2*in1;
    in1 = MULH(in5 + in3, icos36h[1]);
980
    out[ 8]=
981
    out[ 9]= in4 + in1;
Michael Niedermayer's avatar
Michael Niedermayer committed
982
    out[ 2]=
983
    out[ 3]= in4 - in1;
984

Michael Niedermayer's avatar
Michael Niedermayer committed
985
    in0 -= in2;
986
    in5 = MULH(2*(in5 - in3), icos36h[7]);
Michael Niedermayer's avatar
Michael Niedermayer committed
987
    out[ 0]=
988
    out[ 5]= in0 - in5;
Michael Niedermayer's avatar
Michael Niedermayer committed
989
    out[ 6]=
990
    out[11]= in0 + in5;
991 992 993
}

/* cos(pi*i/18) */
994 995 996 997 998 999 1000 1001 1002
#define C1 FIXHR(0.98480775301220805936/2)
#define C2 FIXHR(0.93969262078590838405/2)
#define C3 FIXHR(0.86602540378443864676/2)
#define C4 FIXHR(0.76604444311897803520/2)
#define C5 FIXHR(0.64278760968653932632/2)
#define C6 FIXHR(0.5/2)
#define C7 FIXHR(0.34202014332566873304/2)
#define C8 FIXHR(0.17364817766693034885/2)

1003 1004

/* using Lee like decomposition followed by hand coded 9 points DCT */
1005
static void imdct36(int *out, int *buf, int *in, int *win)
1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017
{
    int i, j, t0, t1, t2, t3, s0, s1, s2, s3;
    int tmp[18], *tmp1, *in1;

    for(i=17;i>=1;i--)
        in[i] += in[i-1];
    for(i=17;i>=3;i-=2)
        in[i] += in[i-2];

    for(j=0;j<2;j++) {
        tmp1 = tmp + j;
        in1 = in + j;
1018 1019 1020 1021
#if 0
//more accurate but slower
        int64_t t0, t1, t2, t3;
        t2 = in1[2*4] + in1[2*8] - in1[2*2];
1022

1023 1024 1025 1026 1027 1028 1029 1030
        t3 = (in1[2*0] + (int64_t)(in1[2*6]>>1))<<32;
        t1 = in1[2*0] - in1[2*6];
        tmp1[ 6] = t1 - (t2>>1);
        tmp1[16] = t1 + t2;

        t0 = MUL64(2*(in1[2*2] + in1[2*4]),    C2);
        t1 = MUL64(   in1[2*4] - in1[2*8] , -2*C8);
        t2 = MUL64(2*(in1[2*2] + in1[2*8]),   -C4);
1031

1032 1033 1034
        tmp1[10] = (t3 - t0 - t2) >> 32;
        tmp1[ 2] = (t3 + t0 + t1) >> 32;
        tmp1[14] = (t3 + t2 - t1) >> 32;
1035

1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047
        tmp1[ 4] = MULH(2*(in1[2*5] + in1[2*7] - in1[2*1]), -C3);
        t2 = MUL64(2*(in1[2*1] + in1[2*5]),    C1);
        t3 = MUL64(   in1[2*5] - in1[2*7] , -2*C7);
        t0 = MUL64(2*in1[2*3], C3);

        t1 = MUL64(2*(in1[2*1] + in1[2*7]),   -C5);

        tmp1[ 0] = (t2 + t3 + t0) >> 32;
        tmp1[12] = (t2 + t1 - t0) >> 32;
        tmp1[ 8] = (t3 - t1 - t0) >> 32;
#else
        t2 = in1[2*4] + in1[2*8] - in1[2*2];
1048

1049 1050 1051 1052 1053 1054 1055 1056
        t3 = in1[2*0] + (in1[2*6]>>1);
        t1 = in1[2*0] - in1[2*6];
        tmp1[ 6] = t1 - (t2>>1);
        tmp1[16] = t1 + t2;

        t0 = MULH(2*(in1[2*2] + in1[2*4]),    C2);
        t1 = MULH(   in1[2*4] - in1[2*8] , -2*C8);
        t2 = MULH(2*(in1[2*2] + in1[2*8]),   -C4);
1057

1058 1059 1060
        tmp1[10] = t3 - t0 - t2;
        tmp1[ 2] = t3 + t0 + t1;
        tmp1[14] = t3 + t2 - t1;
1061

1062 1063 1064 1065
        tmp1[ 4] = MULH(2*(in1[2*5] + in1[2*7] - in1[2*1]), -C3);
        t2 = MULH(2*(in1[2*1] + in1[2*5]),    C1);
        t3 = MULH(   in1[2*5] - in1[2*7] , -2*C7);
        t0 = MULH(2*in1[2*3], C3);
1066

1067 1068 1069 1070 1071 1072
        t1 = MULH(2*(in1[2*1] + in1[2*7]),   -C5);

        tmp1[ 0] = t2 + t3 + t0;
        tmp1[12] = t2 + t1 - t0;
        tmp1[ 8] = t3 - t1 - t0;
#endif
1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083
    }

    i = 0;
    for(j=0;j<4;j++) {
        t0 = tmp[i];
        t1 = tmp[i + 2];
        s0 = t1 + t0;
        s2 = t1 - t0;

        t2 = tmp[i + 1];
        t3 = tmp[i + 3];
1084
        s1 = MULH(2*(t3 + t2), icos36h[j]);
1085
        s3 = MULL(t3 - t2, icos36[8 - j]);
1086

1087 1088
        t0 = s0 + s1;
        t1 = s0 - s1;
Michael Niedermayer's avatar
Michael Niedermayer committed
1089
        out[(9 + j)*SBLIMIT] =  MULH(t1, win[9 + j]) + buf[9 + j];
1090 1091 1092
        out[(8 - j)*SBLIMIT] =  MULH(t1, win[8 - j]) + buf[8 - j];
        buf[9 + j] = MULH(t0, win[18 + 9 + j]);
        buf[8 - j] = MULH(t0, win[18 + 8 - j]);
1093

1094 1095
        t0 = s2 + s3;
        t1 = s2 - s3;
Michael Niedermayer's avatar
Michael Niedermayer committed
1096
        out[(9 + 8 - j)*SBLIMIT] =  MULH(t1, win[9 + 8 - j]) + buf[9 + 8 - j];
1097 1098 1099
        out[(        j)*SBLIMIT] =  MULH(t1, win[        j]) + buf[        j];
        buf[9 + 8 - j] = MULH(t0, win[18 + 9 + 8 - j]);
        buf[      + j] = MULH(t0, win[18         + j]);
1100 1101 1102 1103
        i += 4;
    }

    s0 = tmp[16];
1104
    s1 = MULH(2*tmp[17], icos36h[4]);
1105 1106
    t0 = s0 + s1;
    t1 = s0 - s1;
Michael Niedermayer's avatar
Michael Niedermayer committed
1107
    out[(9 + 4)*SBLIMIT] =  MULH(t1, win[9 + 4]) + buf[9 + 4];
1108 1109 1110
    out[(8 - 4)*SBLIMIT] =  MULH(t1, win[8 - 4]) + buf[8 - 4];
    buf[9 + 4] = MULH(t0, win[18 + 9 + 4]);
    buf[8 - 4] = MULH(t0, win[18 + 8 - 4]);
1111 1112 1113 1114
}

/* return the number of decoded frames */
static int mp_decode_layer1(MPADecodeContext *s)
Fabrice Bellard's avatar
Fabrice Bellard committed
1115
{
1116
    int bound, i, v, n, ch, j, mant;
1117 1118
    uint8_t allocation[MPA_MAX_CHANNELS][SBLIMIT];
    uint8_t scale_factors[MPA_MAX_CHANNELS][SBLIMIT];
1119

1120
    if (s->mode == MPA_JSTEREO)
1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147
        bound = (s->mode_ext + 1) * 4;
    else
        bound = SBLIMIT;

    /* allocation bits */
    for(i=0;i<bound;i++) {
        for(ch=0;ch<s->nb_channels;ch++) {
            allocation[ch][i] = get_bits(&s->gb, 4);
        }
    }
    for(i=bound;i<SBLIMIT;i++) {
        allocation[0][i] = get_bits(&s->gb, 4);
    }

    /* scale factors */
    for(i=0;i<bound;i++) {
        for(ch=0;ch<s->nb_channels;ch++) {
            if (allocation[ch][i])
                scale_factors[ch][i] = get_bits(&s->gb, 6);
        }
    }
    for(i=bound;i<SBLIMIT;i++) {
        if (allocation[0][i]) {
            scale_factors[0][i] = get_bits(&s->gb, 6);
            scale_factors[1][i] = get_bits(&s->gb, 6);
        }
    }
1148

1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188
    /* compute samples */
    for(j=0;j<12;j++) {
        for(i=0;i<bound;i++) {
            for(ch=0;ch<s->nb_channels;ch++) {
                n = allocation[ch][i];
                if (n) {
                    mant = get_bits(&s->gb, n + 1);
                    v = l1_unscale(n, mant, scale_factors[ch][i]);
                } else {
                    v = 0;
                }
                s->sb_samples[ch][j][i] = v;
            }
        }
        for(i=bound;i<SBLIMIT;i++) {
            n = allocation[0][i];
            if (n) {
                mant = get_bits(&s->gb, n + 1);
                v = l1_unscale(n, mant, scale_factors[0][i]);
                s->sb_samples[0][j][i] = v;
                v = l1_unscale(n, mant, scale_factors[1][i]);
                s->sb_samples[1][j][i] = v;
            } else {
                s->sb_samples[0][j][i] = 0;
                s->sb_samples[1][j][i] = 0;
            }
        }
    }
    return 12;
}

static int mp_decode_layer2(MPADecodeContext *s)
{
    int sblimit; /* number of used subbands */
    const unsigned char *alloc_table;
    int table, bit_alloc_bits, i, j, ch, bound, v;
    unsigned char bit_alloc[MPA_MAX_CHANNELS][SBLIMIT];
    unsigned char scale_code[MPA_MAX_CHANNELS][SBLIMIT];
    unsigned char scale_factors[MPA_MAX_CHANNELS][SBLIMIT][3], *sf;
    int scale, qindex, bits, steps, k, l, m, b;
Fabrice Bellard's avatar
Fabrice Bellard committed
1189

1190
    /* select decoding table */
1191
    table = ff_mpa_l2_select_table(s->bit_rate / 1000, s->nb_channels,
1192
                            s->sample_rate, s->lsf);
1193 1194
    sblimit = ff_mpa_sblimit_table[table];
    alloc_table = ff_mpa_alloc_tables[table];
1195

1196
    if (s->mode == MPA_JSTEREO)
1197 1198 1199 1200
        bound = (s->mode_ext + 1) * 4;
    else
        bound = sblimit;

1201
    dprintf(s->avctx, "bound=%d sblimit=%d\n", bound, sblimit);
1202 1203 1204 1205

    /* sanity check */
    if( bound > sblimit ) bound = sblimit;

1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220
    /* parse bit allocation */
    j = 0;
    for(i=0;i<bound;i++) {
        bit_alloc_bits = alloc_table[j];
        for(ch=0;ch<s->nb_channels;ch++) {
            bit_alloc[ch][i] = get_bits(&s->gb, bit_alloc_bits);
        }
        j += 1 << bit_alloc_bits;
    }
    for(i=bound;i<sblimit;i++) {
        bit_alloc_bits = alloc_table[j];
        v = get_bits(&s->gb, bit_alloc_bits);
        bit_alloc[0][i] = v;
        bit_alloc[1][i] = v;
        j += 1 << bit_alloc_bits;
Fabrice Bellard's avatar
Fabrice Bellard committed
1221
    }
1222 1223 1224 1225 1226

#ifdef DEBUG
    {
        for(ch=0;ch<s->nb_channels;ch++) {
            for(i=0;i<sblimit;i++)
1227 1228
                dprintf(s->avctx, " %d", bit_alloc[ch][i]);
            dprintf(s->avctx, "\n");
1229 1230 1231 1232 1233 1234 1235
        }
    }
#endif

    /* scale codes */
    for(i=0;i<sblimit;i++) {
        for(ch=0;ch<s->nb_channels;ch++) {
1236
            if (bit_alloc[ch][i])
1237 1238 1239
                scale_code[ch][i] = get_bits(&s->gb, 2);
        }
    }
1240

1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277
    /* scale factors */
    for(i=0;i<sblimit;i++) {
        for(ch=0;ch<s->nb_channels;ch++) {
            if (bit_alloc[ch][i]) {
                sf = scale_factors[ch][i];
                switch(scale_code[ch][i]) {
                default:
                case 0:
                    sf[0] = get_bits(&s->gb, 6);
                    sf[1] = get_bits(&s->gb, 6);
                    sf[2] = get_bits(&s->gb, 6);
                    break;
                case 2:
                    sf[0] = get_bits(&s->gb, 6);
                    sf[1] = sf[0];
                    sf[2] = sf[0];
                    break;
                case 1:
                    sf[0] = get_bits(&s->gb, 6);
                    sf[2] = get_bits(&s->gb, 6);
                    sf[1] = sf[0];
                    break;
                case 3:
                    sf[0] = get_bits(&s->gb, 6);
                    sf[2] = get_bits(&s->gb, 6);
                    sf[1] = sf[2];
                    break;
                }
            }
        }
    }

#ifdef DEBUG
    for(ch=0;ch<s->nb_channels;ch++) {
        for(i=0;i<sblimit;i++) {
            if (bit_alloc[ch][i]) {
                sf = scale_factors[ch][i];
1278
                dprintf(s->avctx, " %d %d %d", sf[0], sf[1], sf[2]);
1279
            } else {
1280
                dprintf(s->avctx, " -");
1281 1282
            }
        }
1283
        dprintf(s->avctx, "\n");
1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297
    }
#endif

    /* samples */
    for(k=0;k<3;k++) {
        for(l=0;l<12;l+=3) {
            j = 0;
            for(i=0;i<bound;i++) {
                bit_alloc_bits = alloc_table[j];
                for(ch=0;ch<s->nb_channels;ch++) {
                    b = bit_alloc[ch][i];
                    if (b) {
                        scale = scale_factors[ch][i][k];
                        qindex = alloc_table[j+b];
1298
                        bits = ff_mpa_quant_bits[qindex];
1299 1300 1301
                        if (bits < 0) {
                            /* 3 values at the same time */
                            v = get_bits(&s->gb, -bits);
1302
                            steps = ff_mpa_quant_steps[qindex];
1303
                            s->sb_samples[ch][k * 12 + l + 0][i] =
1304 1305
                                l2_unscale_group(steps, v % steps, scale);
                            v = v / steps;
1306
                            s->sb_samples[ch][k * 12 + l + 1][i] =
1307 1308
                                l2_unscale_group(steps, v % steps, scale);
                            v = v / steps;
1309
                            s->sb_samples[ch][k * 12 + l + 2][i] =
1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324
                                l2_unscale_group(steps, v, scale);
                        } else {
                            for(m=0;m<3;m++) {
                                v = get_bits(&s->gb, bits);
                                v = l1_unscale(bits - 1, v, scale);
                                s->sb_samples[ch][k * 12 + l + m][i] = v;
                            }
                        }
                    } else {
                        s->sb_samples[ch][k * 12 + l + 0][i] = 0;
                        s->sb_samples[ch][k * 12 + l + 1][i] = 0;
                        s->sb_samples[ch][k * 12 + l + 2][i] = 0;
                    }
                }
                /* next subband in alloc table */
1325
                j += 1 << bit_alloc_bits;
1326 1327 1328 1329 1330 1331 1332 1333 1334 1335
            }
            /* XXX: find a way to avoid this duplication of code */
            for(i=bound;i<sblimit;i++) {
                bit_alloc_bits = alloc_table[j];
                b = bit_alloc[0][i];
                if (b) {
                    int mant, scale0, scale1;
                    scale0 = scale_factors[0][i][k];
                    scale1 = scale_factors[1][i][k];
                    qindex = alloc_table[j+b];
1336
                    bits = ff_mpa_quant_bits[qindex];
1337 1338 1339
                    if (bits < 0) {
                        /* 3 values at the same time */
                        v = get_bits(&s->gb, -bits);
1340
                        steps = ff_mpa_quant_steps[qindex];
1341 1342
                        mant = v % steps;
                        v = v / steps;
1343
                        s->sb_samples[0][k * 12 + l + 0][i] =
1344
                            l2_unscale_group(steps, mant, scale0);
1345
                        s->sb_samples[1][k * 12 + l + 0][i] =
1346 1347 1348
                            l2_unscale_group(steps, mant, scale1);
                        mant = v % steps;
                        v = v / steps;
1349
                        s->sb_samples[0][k * 12 + l + 1][i] =
1350
                            l2_unscale_group(steps, mant, scale0);
1351
                        s->sb_samples[1][k * 12 + l + 1][i] =
1352
                            l2_unscale_group(steps, mant, scale1);
1353
                        s->sb_samples[0][k * 12 + l + 2][i] =
1354
                            l2_unscale_group(steps, v, scale0);
1355
                        s->sb_samples[1][k * 12 + l + 2][i] =
1356 1357 1358 1359
                            l2_unscale_group(steps, v, scale1);
                    } else {
                        for(m=0;m<3;m++) {
                            mant = get_bits(&s->gb, bits);
1360
                            s->sb_samples[0][k * 12 + l + m][i] =
1361
                                l1_unscale(bits - 1, mant, scale0);
1362
                            s->sb_samples[1][k * 12 + l + m][i] =
1363 1364 1365 1366 1367 1368 1369 1370 1371 1372 1373 1374
                                l1_unscale(bits - 1, mant, scale1);
                        }
                    }
                } else {
                    s->sb_samples[0][k * 12 + l + 0][i] = 0;
                    s->sb_samples[0][k * 12 + l + 1][i] = 0;
                    s->sb_samples[0][k * 12 + l + 2][i] = 0;
                    s->sb_samples[1][k * 12 + l + 0][i] = 0;
                    s->sb_samples[1][k * 12 + l + 1][i] = 0;
                    s->sb_samples[1][k * 12 + l + 2][i] = 0;
                }
                /* next subband in alloc table */
1375
                j += 1 << bit_alloc_bits;
1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387
            }
            /* fill remaining samples to zero */
            for(i=sblimit;i<SBLIMIT;i++) {
                for(ch=0;ch<s->nb_channels;ch++) {
                    s->sb_samples[ch][k * 12 + l + 0][i] = 0;
                    s->sb_samples[ch][k * 12 + l + 1][i] = 0;
                    s->sb_samples[ch][k * 12 + l + 2][i] = 0;
                }
            }
        }
    }
    return 3 * 12;
Fabrice Bellard's avatar
Fabrice Bellard committed
1388 1389
}

1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 1409
static inline void lsf_sf_expand(int *slen,
                                 int sf, int n1, int n2, int n3)
{
    if (n3) {
        slen[3] = sf % n3;
        sf /= n3;
    } else {
        slen[3] = 0;
    }
    if (n2) {
        slen[2] = sf % n2;
        sf /= n2;
    } else {
        slen[2] = 0;
    }
    slen[1] = sf % n1;
    sf /= n1;
    slen[0] = sf;
}

1410
static void exponents_from_scale_factors(MPADecodeContext *s,
1411
                                         GranuleDef *g,
1412
                                         int16_t *exponents)
1413
{
1414
    const uint8_t *bstab, *pretab;
1415
    int len, i, j, k, l, v0, shift, gain, gains[3];
1416
    int16_t *exp_ptr;
1417 1418 1419 1420 1421 1422 1423 1424

    exp_ptr = exponents;
    gain = g->global_gain - 210;
    shift = g->scalefac_scale + 1;

    bstab = band_size_long[s->sample_rate_index];
    pretab = mpa_pretab[g->preflag];
    for(i=0;i<g->long_end;i++) {
1425
        v0 = gain - ((g->scale_factors[i] + pretab[i]) << shift) + 400;
1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439
        len = bstab[i];
        for(j=len;j>0;j--)
            *exp_ptr++ = v0;
    }

    if (g->short_start < 13) {
        bstab = band_size_short[s->sample_rate_index];
        gains[0] = gain - (g->subblock_gain[0] << 3);
        gains[1] = gain - (g->subblock_gain[1] << 3);
        gains[2] = gain - (g->subblock_gain[2] << 3);
        k = g->long_end;
        for(i=g->short_start;i<13;i++) {
            len = bstab[i];
            for(l=0;l<3;l++) {
1440
                v0 = gains[l] - (g->scale_factors[k++] << shift) + 400;
1441 1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456
                for(j=len;j>0;j--)
                *exp_ptr++ = v0;
            }
        }
    }
}

/* handle n = 0 too */
static inline int get_bitsz(GetBitContext *s, int n)
{
    if (n == 0)
        return 0;
    else
        return get_bits(s, n);
}

1457 1458 1459 1460 1461 1462 1463 1464 1465 1466 1467 1468 1469

static void switch_buffer(MPADecodeContext *s, int *pos, int *end_pos, int *end_pos2){
    if(s->in_gb.buffer && *pos >= s->gb.size_in_bits){
        s->gb= s->in_gb;
        s->in_gb.buffer=NULL;
        assert((get_bits_count(&s->gb) & 7) == 0);
        skip_bits_long(&s->gb, *pos - *end_pos);
        *end_pos2=
        *end_pos= *end_pos2 + get_bits_count(&s->gb) - *pos;
        *pos= get_bits_count(&s->gb);
    }
}

1470
static int huffman_decode(MPADecodeContext *s, GranuleDef *g,
1471
                          int16_t *exponents, int end_pos2)
1472 1473
{
    int s_index;
1474
    int i;
1475
    int last_pos, bits_left;
1476
    VLC *vlc;
1477
    int end_pos= FFMIN(end_pos2, s->gb.size_in_bits);
1478 1479 1480 1481

    /* low frequencies (called big values) */
    s_index = 0;
    for(i=0;i<3;i++) {
1482
        int j, k, l, linbits;
1483 1484 1485 1486 1487 1488 1489 1490 1491
        j = g->region_size[i];
        if (j == 0)
            continue;
        /* select vlc table */
        k = g->table_select[i];
        l = mpa_huff_data[k][0];
        linbits = mpa_huff_data[k][1];
        vlc = &huff_vlc[l];

1492
        if(!l){
1493
            memset(&g->sb_hybrid[s_index], 0, sizeof(*g->sb_hybrid)*2*j);
1494 1495 1496 1497
            s_index += 2*j;
            continue;
        }

1498 1499
        /* read huffcode and compute each couple */
        for(;j>0;j--) {
1500
            int exponent, x, y, v;
1501 1502 1503 1504
            int pos= get_bits_count(&s->gb);

            if (pos >= end_pos){
//                av_log(NULL, AV_LOG_ERROR, "pos: %d %d %d %d\n", pos, end_pos, end_pos2, s_index);
1505
                switch_buffer(s, &pos, &end_pos, &end_pos2);
1506 1507 1508 1509
//                av_log(NULL, AV_LOG_ERROR, "new pos: %d %d\n", pos, end_pos);
                if(pos >= end_pos)
                    break;
            }
1510
            y = get_vlc2(&s->gb, vlc->table, 7, 3);
1511 1512 1513 1514 1515 1516 1517 1518

            if(!y){
                g->sb_hybrid[s_index  ] =
                g->sb_hybrid[s_index+1] = 0;
                s_index += 2;
                continue;
            }

1519
            exponent= exponents[s_index];
1520

1521
            dprintf(s->avctx, "region=%d n=%d x=%d y=%d exp=%d\n",
1522
                    i, g->region_size[i] - j, x, y, exponent);
Michael Niedermayer's avatar
Michael Niedermayer committed
1523 1524 1525
            if(y&16){
                x = y >> 5;
                y = y & 0x0f;
1526
                if (x < 15){
1527 1528
                    v = expval_table[ exponent ][ x ];
//                      v = expval_table[ (exponent&3) ][ x ] >> FFMIN(0 - (exponent>>2), 31);
1529 1530
                }else{
                    x += get_bitsz(&s->gb, linbits);
1531
                    v = l3_unscale(x, exponent);
1532
                }
1533 1534
                if (get_bits1(&s->gb))
                    v = -v;
Michael Niedermayer's avatar
Michael Niedermayer committed
1535
                g->sb_hybrid[s_index] = v;
1536
                if (y < 15){
1537
                    v = expval_table[ exponent ][ y ];
1538 1539
                }else{
                    y += get_bitsz(&s->gb, linbits);
1540
                    v = l3_unscale(y, exponent);
1541
                }
1542 1543
                if (get_bits1(&s->gb))
                    v = -v;
Michael Niedermayer's avatar
Michael Niedermayer committed
1544 1545 1546 1547 1548 1549 1550 1551 1552 1553 1554 1555 1556 1557
                g->sb_hybrid[s_index+1] = v;
            }else{
                x = y >> 5;
                y = y & 0x0f;
                x += y;
                if (x < 15){
                    v = expval_table[ exponent ][ x ];
                }else{
                    x += get_bitsz(&s->gb, linbits);
                    v = l3_unscale(x, exponent);
                }
                if (get_bits1(&s->gb))
                    v = -v;
                g->sb_hybrid[s_index+!!y] = v;
1558
                g->sb_hybrid[s_index+ !y] = 0;
1559
            }
Michael Niedermayer's avatar
Michael Niedermayer committed
1560
            s_index+=2;
1561 1562
        }
    }
1563

1564 1565
    /* high frequencies */
    vlc = &huff_quad_vlc[g->count1table_select];
1566
    last_pos=0;
1567
    while (s_index <= 572) {
1568
        int pos, code;
1569 1570
        pos = get_bits_count(&s->gb);
        if (pos >= end_pos) {
1571 1572 1573 1574 1575 1576
            if (pos > end_pos2 && last_pos){
                /* some encoders generate an incorrect size for this
                   part. We must go back into the data */
                s_index -= 4;
                skip_bits_long(&s->gb, last_pos - pos);
                av_log(NULL, AV_LOG_INFO, "overread, skip %d enddists: %d %d\n", last_pos - pos, end_pos-pos, end_pos2-pos);
1577 1578
                if(s->error_resilience >= FF_ER_COMPLIANT)
                    s_index=0;
1579 1580
                break;
            }
1581
//                av_log(NULL, AV_LOG_ERROR, "pos2: %d %d %d %d\n", pos, end_pos, end_pos2, s_index);
1582
            switch_buffer(s, &pos, &end_pos, &end_pos2);
1583 1584 1585
//                av_log(NULL, AV_LOG_ERROR, "new pos2: %d %d %d\n", pos, end_pos, s_index);
            if(pos >= end_pos)
                break;
1586
        }
1587
        last_pos= pos;
1588

1589
        code = get_vlc2(&s->gb, vlc->table, vlc->bits, 1);
1590
        dprintf(s->avctx, "t=%d code=%d\n", g->count1table_select, code);
1591 1592 1593 1594 1595
        g->sb_hybrid[s_index+0]=
        g->sb_hybrid[s_index+1]=
        g->sb_hybrid[s_index+2]=
        g->sb_hybrid[s_index+3]= 0;
        while(code){
1596
            static const int idxtab[16]={3,3,2,2,1,1,1,1,0,0,0,0,0,0,0,0};
1597
            int v;
1598 1599
            int pos= s_index+idxtab[code];
            code ^= 8>>idxtab[code];
1600 1601
            v = exp_table[ exponents[pos] ];
//            v = exp_table[ (exponents[pos]&3) ] >> FFMIN(0 - (exponents[pos]>>2), 31);
1602 1603 1604
            if(get_bits1(&s->gb))
                v = -v;
            g->sb_hybrid[pos] = v;
1605
        }
1606
        s_index+=4;
1607
    }
1608
    /* skip extension bits */
1609
    bits_left = end_pos2 - get_bits_count(&s->gb);
1610
//av_log(NULL, AV_LOG_ERROR, "left:%d buf:%p\n", bits_left, s->in_gb.buffer);
1611
    if (bits_left < 0/* || bits_left > 500*/) {
1612
        av_log(NULL, AV_LOG_ERROR, "bits_left=%d\n", bits_left);
1613 1614 1615 1616
        s_index=0;
    }else if(bits_left > 0 && s->error_resilience >= FF_ER_AGGRESSIVE){
        av_log(NULL, AV_LOG_ERROR, "bits_left=%d\n", bits_left);
        s_index=0;
1617
    }
1618
    memset(&g->sb_hybrid[s_index], 0, sizeof(*g->sb_hybrid)*(576 - s_index));
1619 1620
    skip_bits_long(&s->gb, bits_left);

1621
    i= get_bits_count(&s->gb);
1622
    switch_buffer(s, &i, &end_pos, &end_pos2);
1623

Fabrice Bellard's avatar
Fabrice Bellard committed
1624 1625 1626
    return 0;
}

1627 1628 1629 1630 1631
/* Reorder short blocks from bitstream order to interleaved order. It
   would be faster to do it in parsing, but the code would be far more
   complicated */
static void reorder_block(MPADecodeContext *s, GranuleDef *g)
{
1632
    int i, j, len;
1633 1634
    int32_t *ptr, *dst, *ptr1;
    int32_t tmp[576];
1635 1636 1637 1638 1639 1640 1641 1642 1643 1644 1645 1646 1647

    if (g->block_type != 2)
        return;

    if (g->switch_point) {
        if (s->sample_rate_index != 8) {
            ptr = g->sb_hybrid + 36;
        } else {
            ptr = g->sb_hybrid + 48;
        }
    } else {
        ptr = g->sb_hybrid;
    }
1648

1649 1650 1651
    for(i=g->short_start;i<13;i++) {
        len = band_size_short[s->sample_rate_index][i];
        ptr1 = ptr;
1652 1653 1654 1655 1656 1657
        dst = tmp;
        for(j=len;j>0;j--) {
            *dst++ = ptr[0*len];
            *dst++ = ptr[1*len];
            *dst++ = ptr[2*len];
            ptr++;
1658
        }
1659 1660
        ptr+=2*len;
        memcpy(ptr1, tmp, len * 3 * sizeof(*ptr1));
1661 1662 1663 1664 1665 1666 1667 1668 1669
    }
}

#define ISQRT2 FIXR(0.70710678118654752440)

static void compute_stereo(MPADecodeContext *s,
                           GranuleDef *g0, GranuleDef *g1)
{
    int i, j, k, l;
1670
    int32_t v1, v2;
1671
    int sf_max, tmp0, tmp1, sf, len, non_zero_found;
1672 1673
    int32_t (*is_tab)[16];
    int32_t *tab0, *tab1;
1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684
    int non_zero_found_short[3];

    /* intensity stereo */
    if (s->mode_ext & MODE_EXT_I_STEREO) {
        if (!s->lsf) {
            is_tab = is_table;
            sf_max = 7;
        } else {
            is_tab = is_table_lsf[g1->scalefac_compress & 1];
            sf_max = 16;
        }
1685

1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705 1706 1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733 1734 1735
        tab0 = g0->sb_hybrid + 576;
        tab1 = g1->sb_hybrid + 576;

        non_zero_found_short[0] = 0;
        non_zero_found_short[1] = 0;
        non_zero_found_short[2] = 0;
        k = (13 - g1->short_start) * 3 + g1->long_end - 3;
        for(i = 12;i >= g1->short_start;i--) {
            /* for last band, use previous scale factor */
            if (i != 11)
                k -= 3;
            len = band_size_short[s->sample_rate_index][i];
            for(l=2;l>=0;l--) {
                tab0 -= len;
                tab1 -= len;
                if (!non_zero_found_short[l]) {
                    /* test if non zero band. if so, stop doing i-stereo */
                    for(j=0;j<len;j++) {
                        if (tab1[j] != 0) {
                            non_zero_found_short[l] = 1;
                            goto found1;
                        }
                    }
                    sf = g1->scale_factors[k + l];
                    if (sf >= sf_max)
                        goto found1;

                    v1 = is_tab[0][sf];
                    v2 = is_tab[1][sf];
                    for(j=0;j<len;j++) {
                        tmp0 = tab0[j];
                        tab0[j] = MULL(tmp0, v1);
                        tab1[j] = MULL(tmp0, v2);
                    }
                } else {
                found1:
                    if (s->mode_ext & MODE_EXT_MS_STEREO) {
                        /* lower part of the spectrum : do ms stereo
                           if enabled */
                        for(j=0;j<len;j++) {
                            tmp0 = tab0[j];
                            tmp1 = tab1[j];
                            tab0[j] = MULL(tmp0 + tmp1, ISQRT2);
                            tab1[j] = MULL(tmp0 - tmp1, ISQRT2);
                        }
                    }
                }
            }
        }

1736 1737
        non_zero_found = non_zero_found_short[0] |
            non_zero_found_short[1] |
1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753 1754 1755 1756 1757 1758 1759 1760 1761 1762 1763 1764 1765 1766 1767 1768 1769 1770 1771 1772 1773 1774 1775 1776 1777 1778 1779 1780 1781 1782 1783 1784 1785 1786 1787 1788 1789 1790 1791 1792
            non_zero_found_short[2];

        for(i = g1->long_end - 1;i >= 0;i--) {
            len = band_size_long[s->sample_rate_index][i];
            tab0 -= len;
            tab1 -= len;
            /* test if non zero band. if so, stop doing i-stereo */
            if (!non_zero_found) {
                for(j=0;j<len;j++) {
                    if (tab1[j] != 0) {
                        non_zero_found = 1;
                        goto found2;
                    }
                }
                /* for last band, use previous scale factor */
                k = (i == 21) ? 20 : i;
                sf = g1->scale_factors[k];
                if (sf >= sf_max)
                    goto found2;
                v1 = is_tab[0][sf];
                v2 = is_tab[1][sf];
                for(j=0;j<len;j++) {
                    tmp0 = tab0[j];
                    tab0[j] = MULL(tmp0, v1);
                    tab1[j] = MULL(tmp0, v2);
                }
            } else {
            found2:
                if (s->mode_ext & MODE_EXT_MS_STEREO) {
                    /* lower part of the spectrum : do ms stereo
                       if enabled */
                    for(j=0;j<len;j++) {
                        tmp0 = tab0[j];
                        tmp1 = tab1[j];
                        tab0[j] = MULL(tmp0 + tmp1, ISQRT2);
                        tab1[j] = MULL(tmp0 - tmp1, ISQRT2);
                    }
                }
            }
        }
    } else if (s->mode_ext & MODE_EXT_MS_STEREO) {
        /* ms stereo ONLY */
        /* NOTE: the 1/sqrt(2) normalization factor is included in the
           global gain */
        tab0 = g0->sb_hybrid;
        tab1 = g1->sb_hybrid;
        for(i=0;i<576;i++) {
            tmp0 = tab0[i];
            tmp1 = tab1[i];
            tab0[i] = tmp0 + tmp1;
            tab1[i] = tmp0 - tmp1;
        }
    }
}

1793
static void compute_antialias_integer(MPADecodeContext *s,
1794 1795
                              GranuleDef *g)
{
Michael Niedermayer's avatar
Michael Niedermayer committed
1796 1797
    int32_t *ptr, *csa;
    int n, i;
1798 1799 1800 1801 1802 1803 1804 1805 1806 1807

    /* we antialias only "long" bands */
    if (g->block_type == 2) {
        if (!g->switch_point)
            return;
        /* XXX: check this for 8000Hz case */
        n = 1;
    } else {
        n = SBLIMIT - 1;
    }
1808

1809 1810
    ptr = g->sb_hybrid + 18;
    for(i = n;i > 0;i--) {
Michael Niedermayer's avatar
Michael Niedermayer committed
1811 1812 1813
        int tmp0, tmp1, tmp2;
        csa = &csa_table[0][0];
#define INT_AA(j) \
1814 1815
            tmp0 = ptr[-1-j];\
            tmp1 = ptr[   j];\
Michael Niedermayer's avatar
Michael Niedermayer committed
1816
            tmp2= MULH(tmp0 + tmp1, csa[0+4*j]);\
1817 1818
            ptr[-1-j] = 4*(tmp2 - MULH(tmp1, csa[2+4*j]));\
            ptr[   j] = 4*(tmp2 + MULH(tmp0, csa[3+4*j]));
Michael Niedermayer's avatar
Michael Niedermayer committed
1819 1820 1821 1822 1823 1824 1825 1826 1827

        INT_AA(0)
        INT_AA(1)
        INT_AA(2)
        INT_AA(3)
        INT_AA(4)
        INT_AA(5)
        INT_AA(6)
        INT_AA(7)
1828 1829

        ptr += 18;
1830 1831 1832 1833 1834 1835
    }
}

static void compute_antialias_float(MPADecodeContext *s,
                              GranuleDef *g)
{
Michael Niedermayer's avatar
Michael Niedermayer committed
1836 1837
    int32_t *ptr;
    int n, i;
1838 1839 1840 1841 1842 1843 1844 1845 1846 1847

    /* we antialias only "long" bands */
    if (g->block_type == 2) {
        if (!g->switch_point)
            return;
        /* XXX: check this for 8000Hz case */
        n = 1;
    } else {
        n = SBLIMIT - 1;
    }
1848

1849 1850
    ptr = g->sb_hybrid + 18;
    for(i = n;i > 0;i--) {
Michael Niedermayer's avatar
Michael Niedermayer committed
1851
        float tmp0, tmp1;
1852
        float *csa = &csa_table_float[0][0];
Michael Niedermayer's avatar
Michael Niedermayer committed
1853 1854 1855 1856 1857
#define FLOAT_AA(j)\
        tmp0= ptr[-1-j];\
        tmp1= ptr[   j];\
        ptr[-1-j] = lrintf(tmp0 * csa[0+4*j] - tmp1 * csa[1+4*j]);\
        ptr[   j] = lrintf(tmp0 * csa[1+4*j] + tmp1 * csa[0+4*j]);
1858

Michael Niedermayer's avatar
Michael Niedermayer committed
1859 1860 1861 1862 1863 1864 1865 1866 1867
        FLOAT_AA(0)
        FLOAT_AA(1)
        FLOAT_AA(2)
        FLOAT_AA(3)
        FLOAT_AA(4)
        FLOAT_AA(5)
        FLOAT_AA(6)
        FLOAT_AA(7)

1868
        ptr += 18;
1869 1870 1871 1872
    }
}

static void compute_imdct(MPADecodeContext *s,
1873
                          GranuleDef *g,
1874 1875
                          int32_t *sb_samples,
                          int32_t *mdct_buf)
1876
{
Michael Niedermayer's avatar
Michael Niedermayer committed
1877
    int32_t *ptr, *win, *win1, *buf, *out_ptr, *ptr1;
1878
    int32_t out2[12];
Michael Niedermayer's avatar
Michael Niedermayer committed
1879
    int i, j, mdct_long_end, v, sblimit;
1880 1881 1882 1883 1884 1885 1886 1887 1888 1889 1890 1891 1892 1893 1894 1895 1896 1897 1898 1899 1900 1901 1902 1903 1904 1905 1906 1907 1908 1909 1910 1911 1912 1913

    /* find last non zero block */
    ptr = g->sb_hybrid + 576;
    ptr1 = g->sb_hybrid + 2 * 18;
    while (ptr >= ptr1) {
        ptr -= 6;
        v = ptr[0] | ptr[1] | ptr[2] | ptr[3] | ptr[4] | ptr[5];
        if (v != 0)
            break;
    }
    sblimit = ((ptr - g->sb_hybrid) / 18) + 1;

    if (g->block_type == 2) {
        /* XXX: check for 8000 Hz */
        if (g->switch_point)
            mdct_long_end = 2;
        else
            mdct_long_end = 0;
    } else {
        mdct_long_end = sblimit;
    }

    buf = mdct_buf;
    ptr = g->sb_hybrid;
    for(j=0;j<mdct_long_end;j++) {
        /* apply window & overlap with previous buffer */
        out_ptr = sb_samples + j;
        /* select window */
        if (g->switch_point && j < 2)
            win1 = mdct_win[0];
        else
            win1 = mdct_win[g->block_type];
        /* select frequency inversion */
        win = win1 + ((4 * 36) & -(j & 1));
1914 1915
        imdct36(out_ptr, buf, ptr, win);
        out_ptr += 18*SBLIMIT;
1916 1917 1918 1919 1920 1921 1922
        ptr += 18;
        buf += 18;
    }
    for(j=mdct_long_end;j<sblimit;j++) {
        /* select frequency inversion */
        win = mdct_win[2] + ((4 * 36) & -(j & 1));
        out_ptr = sb_samples + j;
1923

Michael Niedermayer's avatar
Michael Niedermayer committed
1924 1925 1926 1927 1928 1929 1930 1931
        for(i=0; i<6; i++){
            *out_ptr = buf[i];
            out_ptr += SBLIMIT;
        }
        imdct12(out2, ptr + 0);
        for(i=0;i<6;i++) {
            *out_ptr = MULH(out2[i], win[i]) + buf[i + 6*1];
            buf[i + 6*2] = MULH(out2[i + 6], win[i + 6]);
1932 1933
            out_ptr += SBLIMIT;
        }
Michael Niedermayer's avatar
Michael Niedermayer committed
1934 1935 1936 1937 1938 1939 1940 1941 1942 1943 1944 1945
        imdct12(out2, ptr + 1);
        for(i=0;i<6;i++) {
            *out_ptr = MULH(out2[i], win[i]) + buf[i + 6*2];
            buf[i + 6*0] = MULH(out2[i + 6], win[i + 6]);
            out_ptr += SBLIMIT;
        }
        imdct12(out2, ptr + 2);
        for(i=0;i<6;i++) {
            buf[i + 6*0] = MULH(out2[i], win[i]) + buf[i + 6*0];
            buf[i + 6*1] = MULH(out2[i + 6], win[i + 6]);
            buf[i + 6*2] = 0;
        }
1946 1947 1948 1949 1950 1951 1952 1953 1954 1955 1956 1957 1958 1959 1960 1961
        ptr += 18;
        buf += 18;
    }
    /* zero bands */
    for(j=sblimit;j<SBLIMIT;j++) {
        /* overlap */
        out_ptr = sb_samples + j;
        for(i=0;i<18;i++) {
            *out_ptr = buf[i];
            buf[i] = 0;
            out_ptr += SBLIMIT;
        }
        buf += 18;
    }
}

1962
#if defined(DEBUG)
1963
void sample_dump(int fnum, int32_t *tab, int n)
1964 1965 1966
{
    static FILE *files[16], *f;
    char buf[512];
1967
    int i;
1968
    int32_t v;
1969

1970 1971
    f = files[fnum];
    if (!f) {
1972 1973
        snprintf(buf, sizeof(buf), "/tmp/out%d.%s.pcm",
                fnum,
1974 1975 1976 1977 1978 1979
#ifdef USE_HIGHPRECISION
                "hp"
#else
                "lp"
#endif
                );
1980 1981 1982 1983 1984
        f = fopen(buf, "w");
        if (!f)
            return;
        files[fnum] = f;
    }
1985

1986 1987
    if (fnum == 0) {
        static int pos = 0;
1988
        av_log(NULL, AV_LOG_DEBUG, "pos=%d\n", pos);
1989
        for(i=0;i<n;i++) {
1990
            av_log(NULL, AV_LOG_DEBUG, " %0.4f", (double)tab[i] / FRAC_ONE);
1991
            if ((i % 18) == 17)
1992
                av_log(NULL, AV_LOG_DEBUG, "\n");
1993 1994 1995
        }
        pos += n;
    }
1996 1997 1998
    for(i=0;i<n;i++) {
        /* normalize to 23 frac bits */
        v = tab[i] << (23 - FRAC_BITS);
1999
        fwrite(&v, 1, sizeof(int32_t), f);
2000
    }
2001 2002 2003 2004 2005 2006 2007 2008
}
#endif


/* main layer3 decoding function */
static int mp_decode_layer3(MPADecodeContext *s)
{
    int nb_granules, main_data_begin, private_bits;
2009
    int gr, ch, blocksplit_flag, i, j, k, n, bits_pos;
2010
    GranuleDef granules[2][2], *g;
2011
    int16_t exponents[576];
2012 2013 2014 2015

    /* read side info */
    if (s->lsf) {
        main_data_begin = get_bits(&s->gb, 8);
Michael Niedermayer's avatar
Michael Niedermayer committed
2016
        private_bits = get_bits(&s->gb, s->nb_channels);
2017 2018 2019 2020 2021 2022 2023 2024 2025 2026 2027 2028 2029
        nb_granules = 1;
    } else {
        main_data_begin = get_bits(&s->gb, 9);
        if (s->nb_channels == 2)
            private_bits = get_bits(&s->gb, 3);
        else
            private_bits = get_bits(&s->gb, 5);
        nb_granules = 2;
        for(ch=0;ch<s->nb_channels;ch++) {
            granules[ch][0].scfsi = 0; /* all scale factors are transmitted */
            granules[ch][1].scfsi = get_bits(&s->gb, 4);
        }
    }
2030

2031 2032
    for(gr=0;gr<nb_granules;gr++) {
        for(ch=0;ch<s->nb_channels;ch++) {
2033
            dprintf(s->avctx, "gr=%d ch=%d: side_info\n", gr, ch);
2034 2035 2036
            g = &granules[ch][gr];
            g->part2_3_length = get_bits(&s->gb, 12);
            g->big_values = get_bits(&s->gb, 9);
2037
            if(g->big_values > 288){
2038
                av_log(s->avctx, AV_LOG_ERROR, "big_values too big\n");
2039 2040 2041
                return -1;
            }

2042 2043 2044
            g->global_gain = get_bits(&s->gb, 8);
            /* if MS stereo only is selected, we precompute the
               1/sqrt(2) renormalization factor */
2045
            if ((s->mode_ext & (MODE_EXT_MS_STEREO | MODE_EXT_I_STEREO)) ==
2046 2047 2048 2049 2050 2051
                MODE_EXT_MS_STEREO)
                g->global_gain -= 2;
            if (s->lsf)
                g->scalefac_compress = get_bits(&s->gb, 9);
            else
                g->scalefac_compress = get_bits(&s->gb, 4);
2052
            blocksplit_flag = get_bits1(&s->gb);
2053 2054
            if (blocksplit_flag) {
                g->block_type = get_bits(&s->gb, 2);
2055 2056
                if (g->block_type == 0){
                    av_log(NULL, AV_LOG_ERROR, "invalid block type\n");
2057
                    return -1;
2058
                }
2059
                g->switch_point = get_bits1(&s->gb);
2060 2061
                for(i=0;i<2;i++)
                    g->table_select[i] = get_bits(&s->gb, 5);
2062
                for(i=0;i<3;i++)
2063
                    g->subblock_gain[i] = get_bits(&s->gb, 3);
2064
                ff_init_short_region(s, g);
2065
            } else {
2066
                int region_address1, region_address2;
2067 2068 2069 2070 2071 2072 2073
                g->block_type = 0;
                g->switch_point = 0;
                for(i=0;i<3;i++)
                    g->table_select[i] = get_bits(&s->gb, 5);
                /* compute huffman coded region sizes */
                region_address1 = get_bits(&s->gb, 4);
                region_address2 = get_bits(&s->gb, 3);
2074
                dprintf(s->avctx, "region1=%d region2=%d\n",
2075
                        region_address1, region_address2);
2076
                ff_init_long_region(s, g, region_address1, region_address2);
2077
            }
2078 2079
            ff_region_offset2size(g);
            ff_compute_band_indexes(s, g);
2080

2081 2082
            g->preflag = 0;
            if (!s->lsf)
2083 2084 2085
                g->preflag = get_bits1(&s->gb);
            g->scalefac_scale = get_bits1(&s->gb);
            g->count1table_select = get_bits1(&s->gb);
2086
            dprintf(s->avctx, "block_type=%d switch_point=%d\n",
2087 2088 2089 2090
                    g->block_type, g->switch_point);
        }
    }

Roberto Togni's avatar
Roberto Togni committed
2091
  if (!s->adu_mode) {
2092
    const uint8_t *ptr = s->gb.buffer + (get_bits_count(&s->gb)>>3);
2093
    assert((get_bits_count(&s->gb) & 7) == 0);
2094
    /* now we get bits from the main_data_begin offset */
2095
    dprintf(s->avctx, "seekback: %d\n", main_data_begin);
2096 2097 2098 2099
//av_log(NULL, AV_LOG_ERROR, "backstep:%d, lastbuf:%d\n", main_data_begin, s->last_buf_size);

    memcpy(s->last_buf + s->last_buf_size, ptr, EXTRABYTES);
    s->in_gb= s->gb;
2100 2101
        init_get_bits(&s->gb, s->last_buf, s->last_buf_size*8);
        skip_bits_long(&s->gb, 8*(s->last_buf_size - main_data_begin));
Roberto Togni's avatar
Roberto Togni committed
2102
  }
2103 2104 2105 2106

    for(gr=0;gr<nb_granules;gr++) {
        for(ch=0;ch<s->nb_channels;ch++) {
            g = &granules[ch][gr];
2107
            if(get_bits_count(&s->gb)<0){
Diego Biurrun's avatar
Diego Biurrun committed
2108
                av_log(NULL, AV_LOG_ERROR, "mdb:%d, lastbuf:%d skipping granule %d\n",
2109 2110 2111 2112 2113 2114 2115 2116 2117 2118
                                            main_data_begin, s->last_buf_size, gr);
                skip_bits_long(&s->gb, g->part2_3_length);
                memset(g->sb_hybrid, 0, sizeof(g->sb_hybrid));
                if(get_bits_count(&s->gb) >= s->gb.size_in_bits && s->in_gb.buffer){
                    skip_bits_long(&s->in_gb, get_bits_count(&s->gb) - s->gb.size_in_bits);
                    s->gb= s->in_gb;
                    s->in_gb.buffer=NULL;
                }
                continue;
            }
2119

2120
            bits_pos = get_bits_count(&s->gb);
2121

2122
            if (!s->lsf) {
2123
                uint8_t *sc;
2124 2125 2126 2127 2128
                int slen, slen1, slen2;

                /* MPEG1 scale factors */
                slen1 = slen_table[0][g->scalefac_compress];
                slen2 = slen_table[1][g->scalefac_compress];
2129
                dprintf(s->avctx, "slen1=%d slen2=%d\n", slen1, slen2);
2130 2131 2132
                if (g->block_type == 2) {
                    n = g->switch_point ? 17 : 18;
                    j = 0;
2133 2134 2135 2136 2137 2138 2139 2140 2141 2142 2143 2144 2145 2146 2147 2148
                    if(slen1){
                        for(i=0;i<n;i++)
                            g->scale_factors[j++] = get_bits(&s->gb, slen1);
                    }else{
                        for(i=0;i<n;i++)
                            g->scale_factors[j++] = 0;
                    }
                    if(slen2){
                        for(i=0;i<18;i++)
                            g->scale_factors[j++] = get_bits(&s->gb, slen2);
                        for(i=0;i<3;i++)
                            g->scale_factors[j++] = 0;
                    }else{
                        for(i=0;i<21;i++)
                            g->scale_factors[j++] = 0;
                    }
2149 2150 2151 2152 2153 2154 2155
                } else {
                    sc = granules[ch][0].scale_factors;
                    j = 0;
                    for(k=0;k<4;k++) {
                        n = (k == 0 ? 6 : 5);
                        if ((g->scfsi & (0x8 >> k)) == 0) {
                            slen = (k < 2) ? slen1 : slen2;
2156 2157 2158 2159 2160 2161 2162
                            if(slen){
                                for(i=0;i<n;i++)
                                    g->scale_factors[j++] = get_bits(&s->gb, slen);
                            }else{
                                for(i=0;i<n;i++)
                                    g->scale_factors[j++] = 0;
                            }
2163 2164 2165 2166 2167 2168 2169 2170 2171 2172
                        } else {
                            /* simply copy from last granule */
                            for(i=0;i<n;i++) {
                                g->scale_factors[j] = sc[j];
                                j++;
                            }
                        }
                    }
                    g->scale_factors[j++] = 0;
                }
2173
#if defined(DEBUG)
2174
                {
2175
                    dprintf(s->avctx, "scfsi=%x gr=%d ch=%d scale_factors:\n",
2176 2177
                           g->scfsi, gr, ch);
                    for(i=0;i<j;i++)
2178 2179
                        dprintf(s->avctx, " %d", g->scale_factors[i]);
                    dprintf(s->avctx, "\n");
2180 2181 2182 2183 2184 2185 2186 2187 2188 2189 2190 2191 2192 2193 2194 2195 2196 2197 2198 2199 2200 2201 2202 2203 2204 2205 2206 2207 2208 2209 2210 2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221 2222 2223
                }
#endif
            } else {
                int tindex, tindex2, slen[4], sl, sf;

                /* LSF scale factors */
                if (g->block_type == 2) {
                    tindex = g->switch_point ? 2 : 1;
                } else {
                    tindex = 0;
                }
                sf = g->scalefac_compress;
                if ((s->mode_ext & MODE_EXT_I_STEREO) && ch == 1) {
                    /* intensity stereo case */
                    sf >>= 1;
                    if (sf < 180) {
                        lsf_sf_expand(slen, sf, 6, 6, 0);
                        tindex2 = 3;
                    } else if (sf < 244) {
                        lsf_sf_expand(slen, sf - 180, 4, 4, 0);
                        tindex2 = 4;
                    } else {
                        lsf_sf_expand(slen, sf - 244, 3, 0, 0);
                        tindex2 = 5;
                    }
                } else {
                    /* normal case */
                    if (sf < 400) {
                        lsf_sf_expand(slen, sf, 5, 4, 4);
                        tindex2 = 0;
                    } else if (sf < 500) {
                        lsf_sf_expand(slen, sf - 400, 5, 4, 0);
                        tindex2 = 1;
                    } else {
                        lsf_sf_expand(slen, sf - 500, 3, 0, 0);
                        tindex2 = 2;
                        g->preflag = 1;
                    }
                }

                j = 0;
                for(k=0;k<4;k++) {
                    n = lsf_nsf_table[tindex2][tindex][k];
                    sl = slen[k];
Michael Niedermayer's avatar
Michael Niedermayer committed
2224
                    if(sl){
2225 2226 2227 2228 2229 2230
                        for(i=0;i<n;i++)
                            g->scale_factors[j++] = get_bits(&s->gb, sl);
                    }else{
                        for(i=0;i<n;i++)
                            g->scale_factors[j++] = 0;
                    }
2231 2232 2233 2234
                }
                /* XXX: should compute exact size */
                for(;j<40;j++)
                    g->scale_factors[j] = 0;
2235
#if defined(DEBUG)
2236
                {
2237
                    dprintf(s->avctx, "gr=%d ch=%d scale_factors:\n",
2238 2239
                           gr, ch);
                    for(i=0;i<40;i++)
2240 2241
                        dprintf(s->avctx, " %d", g->scale_factors[i]);
                    dprintf(s->avctx, "\n");
2242 2243 2244 2245 2246 2247 2248
                }
#endif
            }

            exponents_from_scale_factors(s, g, exponents);

            /* read Huffman coded residue */
2249
            huffman_decode(s, g, exponents, bits_pos + g->part2_3_length);
2250 2251
#if defined(DEBUG)
            sample_dump(0, g->sb_hybrid, 576);
2252 2253 2254 2255 2256 2257 2258 2259 2260 2261
#endif
        } /* ch */

        if (s->nb_channels == 2)
            compute_stereo(s, &granules[0][gr], &granules[1][gr]);

        for(ch=0;ch<s->nb_channels;ch++) {
            g = &granules[ch][gr];

            reorder_block(s, g);
2262
#if defined(DEBUG)
2263 2264
            sample_dump(0, g->sb_hybrid, 576);
#endif
2265
            s->compute_antialias(s, g);
2266
#if defined(DEBUG)
2267 2268
            sample_dump(1, g->sb_hybrid, 576);
#endif
2269
            compute_imdct(s, g, &s->sb_samples[ch][18 * gr][0], s->mdct_buf[ch]);
2270
#if defined(DEBUG)
2271 2272 2273 2274
            sample_dump(2, &s->sb_samples[ch][18 * gr][0], 576);
#endif
        }
    } /* gr */
2275 2276
    if(get_bits_count(&s->gb)<0)
        skip_bits_long(&s->gb, -get_bits_count(&s->gb));
2277 2278 2279
    return nb_granules * 18;
}

2280
static int mp_decode_frame(MPADecodeContext *s,
2281
                           OUT_INT *samples, const uint8_t *buf, int buf_size)
2282 2283
{
    int i, nb_frames, ch;
2284
    OUT_INT *samples_ptr;
2285

2286
    init_get_bits(&s->gb, buf + HEADER_SIZE, (buf_size - HEADER_SIZE)*8);
2287

2288 2289
    /* skip error protection field */
    if (s->error_protection)
2290
        skip_bits(&s->gb, 16);
2291

2292
    dprintf(s->avctx, "frame %d:\n", s->frame_count);
2293 2294
    switch(s->layer) {
    case 1:
2295
        s->avctx->frame_size = 384;
2296 2297 2298
        nb_frames = mp_decode_layer1(s);
        break;
    case 2:
2299
        s->avctx->frame_size = 1152;
2300 2301 2302
        nb_frames = mp_decode_layer2(s);
        break;
    case 3:
2303
        s->avctx->frame_size = s->lsf ? 576 : 1152;
2304 2305
    default:
        nb_frames = mp_decode_layer3(s);
2306

2307 2308 2309 2310
        s->last_buf_size=0;
        if(s->in_gb.buffer){
            align_get_bits(&s->gb);
            i= (s->gb.size_in_bits - get_bits_count(&s->gb))>>3;
2311
            if(i >= 0 && i <= BACKSTEP_SIZE){
2312 2313
                memmove(s->last_buf, s->gb.buffer + (get_bits_count(&s->gb)>>3), i);
                s->last_buf_size=i;
2314 2315
            }else
                av_log(NULL, AV_LOG_ERROR, "invalid old backstep %d\n", i);
2316
            s->gb= s->in_gb;
2317
            s->in_gb.buffer= NULL;
2318 2319
        }

2320 2321
        align_get_bits(&s->gb);
        assert((get_bits_count(&s->gb) & 7) == 0);
2322 2323
        i= (s->gb.size_in_bits - get_bits_count(&s->gb))>>3;

2324 2325 2326 2327
        if(i<0 || i > BACKSTEP_SIZE || nb_frames<0){
            av_log(NULL, AV_LOG_ERROR, "invalid new backstep %d\n", i);
            i= FFMIN(BACKSTEP_SIZE, buf_size - HEADER_SIZE);
        }
2328
        assert(i <= buf_size - HEADER_SIZE && i>= 0);
2329
        memcpy(s->last_buf + s->last_buf_size, s->gb.buffer + buf_size - HEADER_SIZE - i, i);
2330
        s->last_buf_size += i;
2331

2332 2333 2334 2335 2336 2337
        break;
    }
#if defined(DEBUG)
    for(i=0;i<nb_frames;i++) {
        for(ch=0;ch<s->nb_channels;ch++) {
            int j;
2338
            dprintf(s->avctx, "%d-%d:", i, ch);
2339
            for(j=0;j<SBLIMIT;j++)
2340 2341
                dprintf(s->avctx, " %0.6f", (double)s->sb_samples[ch][i][j] / FRAC_ONE);
            dprintf(s->avctx, "\n");
2342 2343 2344 2345 2346 2347 2348
        }
    }
#endif
    /* apply the synthesis filter */
    for(ch=0;ch<s->nb_channels;ch++) {
        samples_ptr = samples + ch;
        for(i=0;i<nb_frames;i++) {
2349
            ff_mpa_synth_filter(s->synth_buf[ch], &(s->synth_buf_offset[ch]),
2350 2351
                         window, &s->dither_state,
                         samples_ptr, s->nb_channels,
2352 2353 2354 2355 2356
                         s->sb_samples[ch][i]);
            samples_ptr += 32 * s->nb_channels;
        }
    }
#ifdef DEBUG
2357
    s->frame_count++;
2358
#endif
2359
    return nb_frames * 32 * sizeof(OUT_INT) * s->nb_channels;
2360 2361
}

Fabrice Bellard's avatar
Fabrice Bellard committed
2362
static int decode_frame(AVCodecContext * avctx,
2363
                        void *data, int *data_size,
Michael Niedermayer's avatar
Michael Niedermayer committed
2364
                        const uint8_t * buf, int buf_size)
Fabrice Bellard's avatar
Fabrice Bellard committed
2365 2366
{
    MPADecodeContext *s = avctx->priv_data;
2367
    uint32_t header;
2368
    int out_size;
2369
    OUT_INT *out_samples = data;
Fabrice Bellard's avatar
Fabrice Bellard committed
2370

2371 2372 2373 2374
retry:
    if(buf_size < HEADER_SIZE)
        return -1;

2375
    header = AV_RB32(buf);
2376 2377 2378
    if(ff_mpa_check_header(header) < 0){
        buf++;
//        buf_size--;
Diego Biurrun's avatar
Diego Biurrun committed
2379
        av_log(avctx, AV_LOG_ERROR, "Header missing skipping one byte.\n");
2380 2381 2382
        goto retry;
    }

2383
    if (ff_mpegaudio_decode_header(s, header) == 1) {
2384 2385 2386 2387 2388 2389 2390 2391 2392
        /* free format: prepare to compute frame size */
        s->frame_size = -1;
        return -1;
    }
    /* update codec info */
    avctx->channels = s->nb_channels;
    avctx->bit_rate = s->bit_rate;
    avctx->sub_id = s->layer;

2393
    if(s->frame_size<=0 || s->frame_size > buf_size){
2394 2395
        av_log(avctx, AV_LOG_ERROR, "incomplete frame\n");
        return -1;
2396 2397
    }else if(s->frame_size < buf_size){
        av_log(avctx, AV_LOG_ERROR, "incorrect frame size\n");
2398
        buf_size= s->frame_size;
Fabrice Bellard's avatar
Fabrice Bellard committed
2399
    }
2400 2401

    out_size = mp_decode_frame(s, out_samples, buf, buf_size);
2402
    if(out_size>=0){
2403
        *data_size = out_size;
2404 2405 2406
        avctx->sample_rate = s->sample_rate;
        //FIXME maybe move the other codec info stuff from above here too
    }else
Diego Biurrun's avatar
Diego Biurrun committed
2407
        av_log(avctx, AV_LOG_DEBUG, "Error while decoding MPEG audio frame.\n"); //FIXME return -1 / but also return the number of bytes consumed
2408 2409
    s->frame_size = 0;
    return buf_size;
Fabrice Bellard's avatar
Fabrice Bellard committed
2410 2411
}

2412 2413
static void flush(AVCodecContext *avctx){
    MPADecodeContext *s = avctx->priv_data;
2414
    memset(s->synth_buf, 0, sizeof(s->synth_buf));
2415 2416 2417
    s->last_buf_size= 0;
}

2418
#ifdef CONFIG_MP3ADU_DECODER
Roberto Togni's avatar
Roberto Togni committed
2419
static int decode_frame_adu(AVCodecContext * avctx,
2420
                        void *data, int *data_size,
Michael Niedermayer's avatar
Michael Niedermayer committed
2421
                        const uint8_t * buf, int buf_size)
Roberto Togni's avatar
Roberto Togni committed
2422 2423 2424 2425
{
    MPADecodeContext *s = avctx->priv_data;
    uint32_t header;
    int len, out_size;
2426
    OUT_INT *out_samples = data;
Roberto Togni's avatar
Roberto Togni committed
2427 2428 2429 2430 2431 2432 2433 2434 2435 2436 2437 2438 2439 2440

    len = buf_size;

    // Discard too short frames
    if (buf_size < HEADER_SIZE) {
        *data_size = 0;
        return buf_size;
    }


    if (len > MPA_MAX_CODED_FRAME_SIZE)
        len = MPA_MAX_CODED_FRAME_SIZE;

    // Get header and restore sync word
2441
    header = AV_RB32(buf) | 0xffe00000;
Roberto Togni's avatar
Roberto Togni committed
2442

2443
    if (ff_mpa_check_header(header) < 0) { // Bad header, discard frame
Roberto Togni's avatar
Roberto Togni committed
2444 2445 2446 2447
        *data_size = 0;
        return buf_size;
    }

2448
    ff_mpegaudio_decode_header(s, header);
Roberto Togni's avatar
Roberto Togni committed
2449 2450 2451 2452 2453 2454
    /* update codec info */
    avctx->sample_rate = s->sample_rate;
    avctx->channels = s->nb_channels;
    avctx->bit_rate = s->bit_rate;
    avctx->sub_id = s->layer;

2455
    s->frame_size = len;
Roberto Togni's avatar
Roberto Togni committed
2456 2457

    if (avctx->parse_only) {
2458
        out_size = buf_size;
Roberto Togni's avatar
Roberto Togni committed
2459
    } else {
2460
        out_size = mp_decode_frame(s, out_samples, buf, buf_size);
Roberto Togni's avatar
Roberto Togni committed
2461 2462 2463 2464 2465
    }

    *data_size = out_size;
    return buf_size;
}
2466
#endif /* CONFIG_MP3ADU_DECODER */
Roberto Togni's avatar
Roberto Togni committed
2467

2468
#ifdef CONFIG_MP3ON4_DECODER
2469

2470 2471 2472 2473 2474 2475
/**
 * Context for MP3On4 decoder
 */
typedef struct MP3On4DecodeContext {
    int frames;   ///< number of mp3 frames per block (number of mp3 decoder instances)
    int syncword; ///< syncword patch
2476
    const uint8_t *coff; ///< channels offsets in output buffer
2477 2478 2479
    MPADecodeContext *mp3decctx[5]; ///< MPADecodeContext for every decoder instance
} MP3On4DecodeContext;

2480 2481
#include "mpeg4audio.h"

2482
/* Next 3 arrays are indexed by channel config number (passed via codecdata) */
2483
static const uint8_t mp3Frames[8] = {0,1,1,2,3,3,4,5};   /* number of mp3 decoder instances */
2484
/* offsets into output buffer, assume output order is FL FR BL BR C LFE */
2485
static const uint8_t chan_offset[8][5] = {
2486 2487 2488 2489 2490 2491 2492 2493 2494 2495 2496 2497 2498 2499
    {0},
    {0},            // C
    {0},            // FLR
    {2,0},          // C FLR
    {2,0,3},        // C FLR BS
    {4,0,2},        // C FLR BLRS
    {4,0,2,5},      // C FLR BLRS LFE
    {4,0,2,6,5},    // C FLR BLRS BLR LFE
};


static int decode_init_mp3on4(AVCodecContext * avctx)
{
    MP3On4DecodeContext *s = avctx->priv_data;
2500
    MPEG4AudioConfig cfg;
2501 2502 2503 2504 2505 2506 2507
    int i;

    if ((avctx->extradata_size < 2) || (avctx->extradata == NULL)) {
        av_log(avctx, AV_LOG_ERROR, "Codec extradata missing or too short.\n");
        return -1;
    }

2508 2509
    ff_mpeg4audio_get_config(&cfg, avctx->extradata, avctx->extradata_size);
    if (!cfg.chan_config || cfg.chan_config > 7) {
2510 2511 2512
        av_log(avctx, AV_LOG_ERROR, "Invalid channel config number.\n");
        return -1;
    }
2513 2514 2515
    s->frames = mp3Frames[cfg.chan_config];
    s->coff = chan_offset[cfg.chan_config];
    avctx->channels = ff_mpeg4audio_channels[cfg.chan_config];
2516

2517 2518 2519 2520 2521
    if (cfg.sample_rate < 16000)
        s->syncword = 0xffe00000;
    else
        s->syncword = 0xfff00000;

2522 2523 2524
    /* Init the first mp3 decoder in standard way, so that all tables get builded
     * We replace avctx->priv_data with the context of the first decoder so that
     * decode_init() does not have to be changed.
2525
     * Other decoders will be initialized here copying data from the first context
2526 2527 2528 2529 2530 2531 2532 2533 2534 2535 2536 2537 2538 2539 2540 2541 2542
     */
    // Allocate zeroed memory for the first decoder context
    s->mp3decctx[0] = av_mallocz(sizeof(MPADecodeContext));
    // Put decoder context in place to make init_decode() happy
    avctx->priv_data = s->mp3decctx[0];
    decode_init(avctx);
    // Restore mp3on4 context pointer
    avctx->priv_data = s;
    s->mp3decctx[0]->adu_mode = 1; // Set adu mode

    /* Create a separate codec/context for each frame (first is already ok).
     * Each frame is 1 or 2 channels - up to 5 frames allowed
     */
    for (i = 1; i < s->frames; i++) {
        s->mp3decctx[i] = av_mallocz(sizeof(MPADecodeContext));
        s->mp3decctx[i]->compute_antialias = s->mp3decctx[0]->compute_antialias;
        s->mp3decctx[i]->adu_mode = 1;
2543
        s->mp3decctx[i]->avctx = avctx;
2544 2545 2546 2547 2548 2549 2550 2551 2552 2553 2554 2555 2556 2557 2558 2559 2560 2561 2562 2563
    }

    return 0;
}


static int decode_close_mp3on4(AVCodecContext * avctx)
{
    MP3On4DecodeContext *s = avctx->priv_data;
    int i;

    for (i = 0; i < s->frames; i++)
        if (s->mp3decctx[i])
            av_free(s->mp3decctx[i]);

    return 0;
}


static int decode_frame_mp3on4(AVCodecContext * avctx,
2564
                        void *data, int *data_size,
Michael Niedermayer's avatar
Michael Niedermayer committed
2565
                        const uint8_t * buf, int buf_size)
2566 2567 2568
{
    MP3On4DecodeContext *s = avctx->priv_data;
    MPADecodeContext *m;
2569
    int fsize, len = buf_size, out_size = 0;
2570 2571 2572 2573
    uint32_t header;
    OUT_INT *out_samples = data;
    OUT_INT decoded_buf[MPA_FRAME_SIZE * MPA_MAX_CHANNELS];
    OUT_INT *outptr, *bp;
2574
    int fr, j, n;
2575

2576
    *data_size = 0;
2577
    // Discard too short frames
2578 2579
    if (buf_size < HEADER_SIZE)
        return -1;
2580 2581 2582 2583

    // If only one decoder interleave is not needed
    outptr = s->frames == 1 ? out_samples : decoded_buf;

2584 2585
    avctx->bit_rate = 0;

2586
    for (fr = 0; fr < s->frames; fr++) {
Baptiste Coudurier's avatar
Baptiste Coudurier committed
2587
        fsize = AV_RB16(buf) >> 4;
2588
        fsize = FFMIN3(fsize, len, MPA_MAX_CODED_FRAME_SIZE);
2589 2590 2591
        m = s->mp3decctx[fr];
        assert (m != NULL);

2592
        header = (AV_RB32(buf) & 0x000fffff) | s->syncword; // patch header
2593

2594 2595
        if (ff_mpa_check_header(header) < 0) // Bad header, discard block
            break;
2596

2597
        ff_mpegaudio_decode_header(m, header);
2598
        out_size += mp_decode_frame(m, outptr, buf, fsize);
Baptiste Coudurier's avatar
Baptiste Coudurier committed
2599 2600
        buf += fsize;
        len -= fsize;
2601 2602

        if(s->frames > 1) {
2603
            n = m->avctx->frame_size*m->nb_channels;
2604
            /* interleave output data */
2605
            bp = out_samples + s->coff[fr];
2606 2607 2608
            if(m->nb_channels == 1) {
                for(j = 0; j < n; j++) {
                    *bp = decoded_buf[j];
Baptiste Coudurier's avatar
Baptiste Coudurier committed
2609
                    bp += avctx->channels;
2610 2611 2612 2613 2614
                }
            } else {
                for(j = 0; j < n; j++) {
                    bp[0] = decoded_buf[j++];
                    bp[1] = decoded_buf[j];
Baptiste Coudurier's avatar
Baptiste Coudurier committed
2615
                    bp += avctx->channels;
2616 2617 2618
                }
            }
        }
2619
        avctx->bit_rate += m->bit_rate;
2620 2621 2622 2623 2624 2625 2626 2627
    }

    /* update codec info */
    avctx->sample_rate = s->mp3decctx[0]->sample_rate;

    *data_size = out_size;
    return buf_size;
}
2628
#endif /* CONFIG_MP3ON4_DECODER */
2629

2630
#ifdef CONFIG_MP2_DECODER
2631
AVCodec mp2_decoder =
Fabrice Bellard's avatar
Fabrice Bellard committed
2632
{
2633
    "mp2",
Fabrice Bellard's avatar
Fabrice Bellard committed
2634 2635 2636 2637 2638 2639 2640
    CODEC_TYPE_AUDIO,
    CODEC_ID_MP2,
    sizeof(MPADecodeContext),
    decode_init,
    NULL,
    NULL,
    decode_frame,
2641
    CODEC_CAP_PARSE_ONLY,
2642
    .flush= flush,
2643
    .long_name= "MP2 (MPEG audio layer 2)",
Fabrice Bellard's avatar
Fabrice Bellard committed
2644
};
2645 2646
#endif
#ifdef CONFIG_MP3_DECODER
2647 2648 2649 2650
AVCodec mp3_decoder =
{
    "mp3",
    CODEC_TYPE_AUDIO,
2651
    CODEC_ID_MP3,
2652 2653 2654 2655 2656
    sizeof(MPADecodeContext),
    decode_init,
    NULL,
    NULL,
    decode_frame,
2657
    CODEC_CAP_PARSE_ONLY,
2658
    .flush= flush,
2659
    .long_name= "MP3 (MPEG audio layer 3)",
2660
};
2661 2662
#endif
#ifdef CONFIG_MP3ADU_DECODER
Roberto Togni's avatar
Roberto Togni committed
2663 2664 2665 2666 2667 2668 2669 2670 2671 2672 2673
AVCodec mp3adu_decoder =
{
    "mp3adu",
    CODEC_TYPE_AUDIO,
    CODEC_ID_MP3ADU,
    sizeof(MPADecodeContext),
    decode_init,
    NULL,
    NULL,
    decode_frame_adu,
    CODEC_CAP_PARSE_ONLY,
2674
    .flush= flush,
2675
    .long_name= "ADU (Application Data Unit) MP3 (MPEG audio layer 3)",
Roberto Togni's avatar
Roberto Togni committed
2676
};
2677 2678
#endif
#ifdef CONFIG_MP3ON4_DECODER
2679 2680 2681 2682 2683 2684 2685 2686 2687 2688
AVCodec mp3on4_decoder =
{
    "mp3on4",
    CODEC_TYPE_AUDIO,
    CODEC_ID_MP3ON4,
    sizeof(MP3On4DecodeContext),
    decode_init_mp3on4,
    NULL,
    decode_close_mp3on4,
    decode_frame_mp3on4,
2689
    .flush= flush,
2690
    .long_name= "MP3onMP4",
2691
};
2692
#endif