dcaenc.c 41.4 KB
Newer Older
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
1 2
/*
 * DCA encoder
 * Copyright (C) 2008-2012 Alexander E. Patrakov
 *               2010 Benjamin Larsson
 *               2011 Xiang Wang
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

24 25 26
#define FFT_FLOAT 0
#define FFT_FIXED_32 1

Paul B Mahol's avatar
Paul B Mahol committed
27
#include "libavutil/avassert.h"
28
#include "libavutil/channel_layout.h"
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
29
#include "libavutil/common.h"
30
#include "libavutil/ffmath.h"
31
#include "libavutil/opt.h"
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
32
#include "avcodec.h"
Paul B Mahol's avatar
Paul B Mahol committed
33
#include "dca.h"
34 35 36
#include "dcaadpcm.h"
#include "dcamath.h"
#include "dca_core.h"
Paul B Mahol's avatar
Paul B Mahol committed
37 38
#include "dcadata.h"
#include "dcaenc.h"
39
#include "fft.h"
40
#include "internal.h"
41
#include "mathops.h"
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
42 43 44
#include "put_bits.h"

/* Upper bound on channels; sizes every per-channel array in DCAEncContext. */
#define MAX_CHANNELS 6
/* Largest frame accepted by encode_init(), in bytes (compared after << 3). */
#define DCA_MAX_FRAME_SIZE 16384
#define DCA_HEADER_SIZE 13
/* Number of decimated LFE samples produced per frame by lfe_downsample(). */
#define DCA_LFE_SAMPLES 8

/* Number of subbands produced by the analysis filterbank. */
#define DCAENC_SUBBANDS 32
#define SUBFRAMES 1
#define SUBSUBFRAMES 2
/* Samples per subband per frame (8 samples per subsubframe). */
#define SUBBAND_SAMPLES (SUBFRAMES * SUBSUBFRAMES * 8)
/* Number of auditory bands used by the masking model (second index of auf[]). */
#define AUBANDS 25

/* Fixed-point cosine lookup; requires a DCAEncContext pointer named `c` in
 * scope. The index wraps modulo 2048, i.e. one full period of the table. */
#define COS_T(x) (c->cos_table[(x) & 2047])

57 58 59 60
/* User-tunable encoder options, embedded in DCAEncContext as `options`. */
typedef struct CompressionOptions {
    int adpcm_mode; /* NOTE(review): presumably enables ADPCM subband prediction;
                     * the option table that sets it is outside this view */
} CompressionOptions;

61
typedef struct DCAEncContext {
62
    AVClass *class;
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
63
    PutBitContext pb;
64
    DCAADPCMEncContext adpcm_ctx;
65
    FFTContext mdct;
66
    CompressionOptions options;
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
67
    int frame_size;
Paul B Mahol's avatar
Paul B Mahol committed
68 69 70
    int frame_bits;
    int fullband_channels;
    int channels;
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
71
    int lfe_channel;
Paul B Mahol's avatar
Paul B Mahol committed
72 73 74 75 76
    int samplerate_index;
    int bitrate_index;
    int channel_config;
    const int32_t *band_interpolation;
    const int32_t *band_spectrum;
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
77
    int lfe_scale_factor;
Paul B Mahol's avatar
Paul B Mahol committed
78 79
    softfloat lfe_quant;
    int32_t lfe_peak_cb;
80
    const int8_t *channel_order_tab;  ///< channel reordering table, lfe and non lfe
Paul B Mahol's avatar
Paul B Mahol committed
81

82 83
    int32_t prediction_mode[MAX_CHANNELS][DCAENC_SUBBANDS];
    int32_t adpcm_history[MAX_CHANNELS][DCAENC_SUBBANDS][DCA_ADPCM_COEFFS * 2];
84
    int32_t history[MAX_CHANNELS][512]; /* This is a circular buffer */
85
    int32_t *subband[MAX_CHANNELS][DCAENC_SUBBANDS];
86 87
    int32_t quantized[MAX_CHANNELS][DCAENC_SUBBANDS][SUBBAND_SAMPLES];
    int32_t peak_cb[MAX_CHANNELS][DCAENC_SUBBANDS];
88
    int32_t diff_peak_cb[MAX_CHANNELS][DCAENC_SUBBANDS]; ///< expected peak of residual signal
Paul B Mahol's avatar
Paul B Mahol committed
89 90
    int32_t downsampled_lfe[DCA_LFE_SAMPLES];
    int32_t masking_curve_cb[SUBSUBFRAMES][256];
91
    int32_t bit_allocation_sel[MAX_CHANNELS];
92 93 94
    int abits[MAX_CHANNELS][DCAENC_SUBBANDS];
    int scale_factor[MAX_CHANNELS][DCAENC_SUBBANDS];
    softfloat quant[MAX_CHANNELS][DCAENC_SUBBANDS];
95
    int32_t quant_index_sel[MAX_CHANNELS][DCA_CODE_BOOKS];
Paul B Mahol's avatar
Paul B Mahol committed
96 97 98 99 100
    int32_t eff_masking_curve_cb[256];
    int32_t band_masking_cb[32];
    int32_t worst_quantization_noise;
    int32_t worst_noise_ever;
    int consumed_bits;
101
    int consumed_adpcm_bits; ///< Number of bits to transmit ADPCM related info
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
102

103 104 105 106 107 108 109 110
    int32_t cos_table[2048];
    int32_t band_interpolation_tab[2][512];
    int32_t band_spectrum_tab[2][8];
    int32_t auf[9][AUBANDS][256];
    int32_t cb_to_add[256];
    int32_t cb_to_level[2048];
    int32_t lfe_fir_64i[512];
} DCAEncContext;
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
111

Paul B Mahol's avatar
Paul B Mahol committed
112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131
/* Transfer function of outer and middle ear, Hz -> dB */
static double hom(double f)
{
    double f1 = f / 1000;

    return -3.64 * pow(f1, -0.8)
           + 6.8 * exp(-0.6 * (f1 - 3.4) * (f1 - 3.4))
           - 6.0 * exp(-0.15 * (f1 - 8.7) * (f1 - 8.7))
           - 0.0006 * (f1 * f1) * (f1 * f1);
}

/*
 * Response in dB of auditory filter i at frequency f.
 *
 * fc[i] and erb[i] are tables defined outside this block; the distance of f
 * from fc[i] is normalised by erb[i] before the response is evaluated.
 */
static double gammafilter(int i, double f)
{
    const double offset = (f - fc[i]) / erb[i];
    const double base   = 1 + offset * offset;
    const double gain   = 1 / (base * base);

    return 20 * log10(gain);
}

132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154
/*
 * Allocate one zero-initialised buffer holding the samples of every
 * channel/subband and point c->subband[ch][band] into it.
 *
 * Returns 0 on success, -1 if the allocation failed.
 */
static int subband_bufer_alloc(DCAEncContext *c)
{
    /* Each subband needs room for DCA_ADPCM_COEFFS samples of the previous
     * frame in front of the current ones, so that prediction coefficients
     * can be computed across the frame boundary. */
    const int band_stride = SUBBAND_SAMPLES + DCA_ADPCM_COEFFS;
    const int ch_stride   = DCAENC_SUBBANDS * band_stride;
    int32_t *base;
    int ch, band;

    base = av_calloc(MAX_CHANNELS * DCAENC_SUBBANDS * band_stride,
                     sizeof(int32_t));
    if (!base)
        return -1;

    for (ch = 0; ch < MAX_CHANNELS; ch++) {
        int32_t *ch_base = base + ch * ch_stride;

        /* Skip the head room so that index 0 is the first current sample */
        for (band = 0; band < DCAENC_SUBBANDS; band++)
            c->subband[ch][band] = ch_base + band * band_stride + DCA_ADPCM_COEFFS;
    }
    return 0;
}

/*
 * Release the buffer obtained by subband_bufer_alloc().
 *
 * c->subband[0][0] points DCA_ADPCM_COEFFS elements past the start of the
 * allocation; it is reset to NULL afterwards, so calling this again is a no-op.
 */
static void subband_bufer_free(DCAEncContext *c)
{
    int32_t *base;

    if (!c->subband[0][0])
        return;

    base = c->subband[0][0] - DCA_ADPCM_COEFFS;
    av_free(base);
    c->subband[0][0] = NULL;
}

Paul B Mahol's avatar
Paul B Mahol committed
162 163
/**
 * Set up the encoder: allocate the subband buffer and ADPCM context, derive
 * the stream parameters from avctx, and precompute all lookup tables.
 *
 * @param avctx codec context; channel_layout, channels, sample_rate and
 *              bit_rate are read, frame_size is written
 * @return 0 on success, a negative AVERROR code otherwise. On failure every
 *         resource acquired here is released again before returning.
 */
static int encode_init(AVCodecContext *avctx)
{
    DCAEncContext *c = avctx->priv_data;
    uint64_t layout = avctx->channel_layout;
    int i, j, k, min_frame_bits;
    int ret;

    if (subband_bufer_alloc(c))
        return AVERROR(ENOMEM);

    c->fullband_channels = c->channels = avctx->channels;
    c->lfe_channel = (avctx->channels == 3 || avctx->channels == 6);
    c->band_interpolation = c->band_interpolation_tab[1];
    c->band_spectrum = c->band_spectrum_tab[1];
    c->worst_quantization_noise = -2047;
    c->worst_noise_ever = -2047;
    c->consumed_adpcm_bits = 0;

    if (ff_dcaadpcm_init(&c->adpcm_ctx)) {
        ret = AVERROR(ENOMEM);
        goto fail_subband;
    }

    if (!layout) {
        av_log(avctx, AV_LOG_WARNING, "No channel layout specified. The "
                                      "encoder will guess the layout, but it "
                                      "might be incorrect.\n");
        layout = av_get_default_channel_layout(avctx->channels);
    }
    switch (layout) {
    case AV_CH_LAYOUT_MONO:         c->channel_config = 0; break;
    case AV_CH_LAYOUT_STEREO:       c->channel_config = 2; break;
    case AV_CH_LAYOUT_2_2:          c->channel_config = 8; break;
    case AV_CH_LAYOUT_5POINT0:      c->channel_config = 9; break;
    case AV_CH_LAYOUT_5POINT1:      c->channel_config = 9; break;
    default:
        av_log(avctx, AV_LOG_ERROR, "Unsupported channel layout!\n");
        ret = AVERROR_PATCHWELCOME;
        goto fail;
    }

    if (c->lfe_channel) {
        c->fullband_channels--;
        c->channel_order_tab = channel_reorder_lfe[c->channel_config];
    } else {
        c->channel_order_tab = channel_reorder_nolfe[c->channel_config];
    }

    for (i = 0; i < MAX_CHANNELS; i++) {
        for (j = 0; j < DCA_CODE_BOOKS; j++) {
            c->quant_index_sel[i][j] = ff_dca_quant_index_group_size[j];
        }
        /* 6 - no Huffman */
        c->bit_allocation_sel[i] = 6;

        for (j = 0; j < DCAENC_SUBBANDS; j++) {
            /* -1 - no ADPCM */
            c->prediction_mode[i][j] = -1;
            /* Clear the whole history row, not only its first half */
            memset(c->adpcm_history[i][j], 0, sizeof(c->adpcm_history[i][j]));
        }
    }

    for (i = 0; i < 9; i++) {
        if (sample_rates[i] == avctx->sample_rate)
            break;
    }
    if (i == 9) {
        ret = AVERROR(EINVAL);
        goto fail;
    }
    c->samplerate_index = i;

    if (avctx->bit_rate < 32000 || avctx->bit_rate > 3840000) {
        av_log(avctx, AV_LOG_ERROR, "Bit rate %"PRId64" not supported.\n", avctx->bit_rate);
        ret = AVERROR(EINVAL);
        goto fail;
    }
    /* First table entry that is not below the requested rate; the range
     * check above bounds the rate this search is run with. */
    for (i = 0; ff_dca_bit_rates[i] < avctx->bit_rate; i++)
        ;
    c->bitrate_index = i;
    /* Bits per 512-sample frame, rounded up, then aligned to 32 bits */
    c->frame_bits = FFALIGN((avctx->bit_rate * 512 + avctx->sample_rate - 1) / avctx->sample_rate, 32);
    min_frame_bits = 132 + (493 + 28 * 32) * c->fullband_channels + c->lfe_channel * 72;
    if (c->frame_bits < min_frame_bits || c->frame_bits > (DCA_MAX_FRAME_SIZE << 3)) {
        ret = AVERROR(EINVAL);
        goto fail;
    }

    c->frame_size = (c->frame_bits + 7) / 8;

    avctx->frame_size = 32 * SUBBAND_SAMPLES;

    if ((ret = ff_mdct_init(&c->mdct, 9, 0, 1.0)) < 0)
        goto fail;

    /* Init all tables */

    /* One full cosine period in 2048 steps, built from the first quadrant
     * by symmetry */
    c->cos_table[0] = 0x7fffffff;
    c->cos_table[512] = 0;
    c->cos_table[1024] = -c->cos_table[0];
    for (i = 1; i < 512; i++) {
        c->cos_table[i]   = (int32_t)(0x7fffffff * cos(M_PI * i / 1024));
        c->cos_table[1024-i] = -c->cos_table[i];
        c->cos_table[1024+i] = -c->cos_table[i];
        c->cos_table[2048-i] = +c->cos_table[i];
    }

    /* Index i is an attenuation of 0.1 * i dB relative to full scale */
    for (i = 0; i < 2048; i++)
        c->cb_to_level[i] = (int32_t)(0x7fffffff * ff_exp10(-0.005 * i));

    /* Each source coefficient is stored twice, at mirrored positions */
    for (k = 0; k < 32; k++) {
        for (j = 0; j < 8; j++) {
            c->lfe_fir_64i[64 * j + k] = (int32_t)(0xffffff800000ULL * ff_dca_lfe_fir_64[8 * k + j]);
            c->lfe_fir_64i[64 * (7-j) + (63 - k)] = (int32_t)(0xffffff800000ULL * ff_dca_lfe_fir_64[8 * k + j]);
        }
    }

    for (i = 0; i < 512; i++) {
        c->band_interpolation_tab[0][i] = (int32_t)(0x1000000000ULL * ff_dca_fir_32bands_perfect[i]);
        c->band_interpolation_tab[1][i] = (int32_t)(0x1000000000ULL * ff_dca_fir_32bands_nonperfect[i]);
    }

    /* Ear transfer function plus auditory filter response, in 0.1 dB units,
     * for every sample rate, auditory band and bin centre frequency */
    for (i = 0; i < 9; i++) {
        for (j = 0; j < AUBANDS; j++) {
            for (k = 0; k < 256; k++) {
                double freq = sample_rates[i] * (k + 0.5) / 512;

                c->auf[i][j][k] = (int32_t)(10 * (hom(freq) + gammafilter(j, freq)));
            }
        }
    }

    /* Increase, in 0.1 dB units, when a power i units lower is added */
    for (i = 0; i < 256; i++) {
        double add = 1 + ff_exp10(-0.01 * i);
        c->cb_to_add[i] = (int32_t)(100 * log10(add));
    }
    for (j = 0; j < 8; j++) {
        double accum = 0;
        for (i = 0; i < 512; i++) {
            double reconst = ff_dca_fir_32bands_perfect[i] * ((i & 64) ? (-1) : 1);
            accum += reconst * cos(2 * M_PI * (i + 0.5 - 256) * (j + 0.5) / 512);
        }
        c->band_spectrum_tab[0][j] = (int32_t)(200 * log10(accum));
    }
    for (j = 0; j < 8; j++) {
        double accum = 0;
        for (i = 0; i < 512; i++) {
            double reconst = ff_dca_fir_32bands_nonperfect[i] * ((i & 64) ? (-1) : 1);
            accum += reconst * cos(2 * M_PI * (i + 0.5 - 256) * (j + 0.5) / 512);
        }
        c->band_spectrum_tab[1][j] = (int32_t)(200 * log10(accum));
    }

    return 0;

fail:
    ff_dcaadpcm_free(&c->adpcm_ctx);
fail_subband:
    /* Resets c->subband[0][0] to NULL, so a later encode_close() is harmless */
    subband_bufer_free(c);
    return ret;
}

308 309
/**
 * Release everything encode_init() acquired: the MDCT context, the shared
 * subband buffer and the ADPCM context. Always returns 0.
 */
static av_cold int encode_close(AVCodecContext *avctx)
{
    DCAEncContext *enc = avctx->priv_data;

    ff_mdct_end(&enc->mdct);
    subband_bufer_free(enc);
    ff_dcaadpcm_free(&enc->adpcm_ctx);

    return 0;
}

318
/*
 * Split each fullband channel of one input frame into 32 subbands.
 *
 * input holds interleaved samples (c->channels per sample period); the
 * results are written to c->subband[ch][band][0 .. SUBBAND_SAMPLES-1].
 * c->history is read but not modified here.
 */
static void subband_transform(DCAEncContext *c, const int32_t *input)
{
    int ch;

    for (ch = 0; ch < c->fullband_channels; ch++) {
        /* Work on a private copy of the history: the original is also
         * needed for PSY */
        int32_t hist[512];
        int head = 0; /* position of the oldest sample in the circular copy */
        int blk;
        const int chi = c->channel_order_tab[ch];

        memcpy(hist, c->history[ch], sizeof(hist));

        for (blk = 0; blk < SUBBAND_SAMPLES; blk++) {
            int32_t accum[64] = { 0 };
            int tap, n, band;

            /* Calculate the convolutions at once: walk the circular history
             * from oldest to newest, folding the 512 products into 64 sums */
            for (tap = 0; tap < 512; tap++)
                accum[tap & 63] += mul32(hist[(head + tap) & 511],
                                         c->band_interpolation[tap]);

            for (n = 16; n < 32; n++)
                accum[n] = accum[n] - accum[31 - n];
            for (n = 32; n < 48; n++)
                accum[n] = accum[n] + accum[95 - n];

            /* Cosine modulation of the 32 folded sums into 32 subbands */
            for (band = 0; band < 32; band++) {
                int32_t resp = 0;

                for (n = 16; n < 48; n++) {
                    const int s = (2 * band + 1) * (2 * (n + 16) + 1);

                    resp += mul32(accum[n], COS_T(s << 3)) >> 3;
                }

                c->subband[ch][band][blk] = ((band + 1) & 2) ? -resp : resp;
            }

            /* Copy in 32 new samples from input, overwriting the oldest */
            for (n = 0; n < 32; n++)
                hist[head + n] = input[(blk * 32 + n) * c->channels + chi];

            head = (head + 32) & 511;
        }
    }
}

368
/*
 * Produce DCA_LFE_SAMPLES decimated LFE samples from one input frame.
 *
 * Each output is a 512-tap FIR over the LFE history; 64 new input samples
 * are shifted in between consecutive outputs. Results are stored in
 * c->downsampled_lfe[]; c->history is read but not modified here.
 */
static void lfe_downsample(DCAEncContext *c, const int32_t *input)
{
    /* FIXME: make 128x LFE downsampling possible */
    const int lfech = lfe_index[c->channel_config];
    int32_t hist[512];
    int head = 0; /* position of the oldest sample in the circular copy */
    int out, tap, n;

    memcpy(hist, c->history[c->channels - 1], sizeof(hist));

    for (out = 0; out < DCA_LFE_SAMPLES; out++) {
        int32_t accum = 0;

        /* Calculate the convolution, oldest history sample first */
        for (tap = 0; tap < 512; tap++)
            accum += mul32(hist[(head + tap) & 511], c->lfe_fir_64i[tap]);

        c->downsampled_lfe[out] = accum;

        /* Copy in 64 new samples from input */
        for (n = 0; n < 64; n++)
            hist[head + n] = input[(out * 64 + n) * c->channels + lfech];

        head = (head + 64) & 511;
    }
}

398
/*
 * Convert a linear sample value to a logarithmic level.
 *
 * Searches c->cb_to_level[] by successive halving of the step (1024 .. 1)
 * for the largest index whose entry is still >= |in| and returns that index
 * negated, i.e. a value in [-2047, 0].
 */
static int32_t get_cb(DCAEncContext *c, int32_t in)
{
    const int32_t magnitude = FFABS(in);
    int step = 1024;
    int idx = 0;

    while (step > 0) {
        if (c->cb_to_level[step + idx] >= magnitude)
            idx += step;
        step >>= 1;
    }
    return -idx;
}

410
/*
 * Add two logarithmic levels.
 *
 * The result is the larger operand plus a correction from c->cb_to_add[]
 * indexed by the difference; when the operands differ by 256 or more the
 * smaller one is ignored.
 */
static int32_t add_cb(DCAEncContext *c, int32_t a, int32_t b)
{
    int32_t larger  = a;
    int32_t smaller = b;
    int32_t gap;

    if (larger < smaller) {
        larger  = b;
        smaller = a;
    }

    gap = larger - smaller;
    return gap >= 256 ? larger : larger + c->cb_to_add[gap];
}

420 421 422 423 424 425 426
/*
 * Compute a 256-bin logarithmic power spectrum of 512 input samples.
 *
 * The samples are multiplied by a window derived from the cosine table,
 * passed through norm__(), and transformed with the context's MDCT. Each
 * coefficient is converted with get_cb() and added to itself with add_cb().
 */
static void calc_power(DCAEncContext *c,
                       const int32_t in[2 * 256], int32_t power[256])
{
    int n;
    LOCAL_ALIGNED_32(int32_t, data,  [512]);
    LOCAL_ALIGNED_32(int32_t, coeff, [256]);

    for (n = 0; n < 512; n++) {
        const int32_t window = 0x3fffffff - (COS_T(4 * n + 2) >> 1);

        data[n] = norm__(mul32(in[n], window), 4);
    }

    c->mdct.mdct_calc(&c->mdct, coeff, data);

    for (n = 0; n < 256; n++) {
        const int32_t level_cb = get_cb(c, coeff[n]);

        power[n] = add_cb(c, level_cb, level_cb);
    }
}

/*
 * Accumulate the contribution of one 512-sample block into out_cb[].
 *
 * The block's power spectrum is weighted per auditory band with
 * c->auf[samplerate_index]; the per-band totals normalise a per-bin sum,
 * which is then negated, offset by two constants and added (in the
 * add_cb() sense) to the existing contents of out_cb[].
 */
static void adjust_jnd(DCAEncContext *c,
                       const int32_t in[512], int32_t out_cb[256])
{
    const int32_t ca_cb = -1114;
    const int32_t cs_cb = 928;
    const int samplerate_index = c->samplerate_index;
    int32_t power[256];
    int32_t unnorm_cb[256];
    int aub, bin;

    calc_power(c, in, power);

    for (bin = 0; bin < 256; bin++)
        unnorm_cb[bin] = -2047; /* and can only grow */

    for (aub = 0; aub < AUBANDS; aub++) {
        const int32_t *weight = c->auf[samplerate_index][aub];
        int32_t denom = ca_cb; /* and can only grow */

        for (bin = 0; bin < 256; bin++)
            denom = add_cb(c, denom, power[bin] + weight[bin]);
        for (bin = 0; bin < 256; bin++)
            unnorm_cb[bin] = add_cb(c, unnorm_cb[bin], -denom + weight[bin]);
    }

    for (bin = 0; bin < 256; bin++)
        out_cb[bin] = add_cb(c, out_cb[bin], -unnorm_cb[bin] - ca_cb - cs_cb);
}

466
/*
 * Callback invoked by walk_band_low() / walk_band_high() once per frequency
 * bin f. band1 is the band being walked and band2 the band paired with it
 * (the same band at the spectrum edges); spectrum1 and spectrum2 are the
 * values passed for them. channel and arg are forwarded from the walker's
 * caller unchanged.
 */
typedef void (*walk_band_t)(DCAEncContext *c, int band1, int band2, int f,
                            int32_t spectrum1, int32_t spectrum2, int channel,
                            int32_t * arg);

470
static void walk_band_low(DCAEncContext *c, int band, int channel,
Paul B Mahol's avatar
Paul B Mahol committed
471
                          walk_band_t walk, int32_t *arg)
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
472
{
Paul B Mahol's avatar
Paul B Mahol committed
473
    int f;
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
474

Paul B Mahol's avatar
Paul B Mahol committed
475 476 477 478 479 480 481 482 483
    if (band == 0) {
        for (f = 0; f < 4; f++)
            walk(c, 0, 0, f, 0, -2047, channel, arg);
    } else {
        for (f = 0; f < 8; f++)
            walk(c, band, band - 1, 8 * band - 4 + f,
                    c->band_spectrum[7 - f], c->band_spectrum[f], channel, arg);
    }
}
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
484

485
static void walk_band_high(DCAEncContext *c, int band, int channel,
Paul B Mahol's avatar
Paul B Mahol committed
486 487 488
                           walk_band_t walk, int32_t *arg)
{
    int f;
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
489

Paul B Mahol's avatar
Paul B Mahol committed
490 491 492 493 494 495 496 497 498
    if (band == 31) {
        for (f = 0; f < 4; f++)
            walk(c, 31, 31, 256 - 4 + f, 0, -2047, channel, arg);
    } else {
        for (f = 0; f < 8; f++)
            walk(c, band, band + 1, 8 * band + 4 + f,
                    c->band_spectrum[f], c->band_spectrum[7 - f], channel, arg);
    }
}
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
499

500
/*
 * walk_band_t callback: lower c->band_masking_cb[band1] to the effective
 * masking level at bin f minus spectrum1, if that is smaller than the value
 * already stored. band2, spectrum2, channel and arg are unused.
 */
static void update_band_masking(DCAEncContext *c, int band1, int band2,
                                int f, int32_t spectrum1, int32_t spectrum2,
                                int channel, int32_t * arg)
{
    int32_t *slot = &c->band_masking_cb[band1];
    const int32_t candidate = c->eff_masking_curve_cb[f] - spectrum1;

    if (*slot > candidate)
        *slot = candidate;
}

510
/*
 * Compute the per-band masking thresholds for one frame.
 *
 * For every subsubframe a 512-sample block is assembled per channel from
 * the tail of c->history followed by the start of the interleaved input,
 * and fed to adjust_jnd(). The per-bin minimum over all subsubframes goes
 * to c->eff_masking_curve_cb[], from which c->band_masking_cb[] is derived.
 */
static void calc_masking(DCAEncContext *c, const int32_t *input)
{
    int32_t data[512];
    int bin, band, ch, ssf, n;

    for (ssf = 0; ssf < SUBSUBFRAMES; ssf++)
        for (bin = 0; bin < 256; bin++)
            c->masking_curve_cb[ssf][bin] = -2047;

    for (ssf = 0; ssf < SUBSUBFRAMES; ssf++) {
        /* First history sample used, and how many history samples follow */
        const int hist_pos = 128 + 256 * ssf;
        const int hist_len = 512 - hist_pos;

        for (ch = 0; ch < c->fullband_channels; ch++) {
            const int chi = c->channel_order_tab[ch];

            for (n = 0; n < hist_len; n++)
                data[n] = c->history[ch][hist_pos + n];
            for (; n < 512; n++)
                data[n] = input[(n - hist_len) * c->channels + chi];

            adjust_jnd(c, data, c->masking_curve_cb[ssf]);
        }
    }

    for (bin = 0; bin < 256; bin++) {
        int32_t lowest = 2048;

        for (ssf = 0; ssf < SUBSUBFRAMES; ssf++) {
            const int32_t v = c->masking_curve_cb[ssf][bin];

            if (v < lowest)
                lowest = v;
        }
        c->eff_masking_curve_cb[bin] = lowest;
    }

    for (band = 0; band < 32; band++) {
        c->band_masking_cb[band] = 2048;
        walk_band_low(c, band, 0, update_band_masking, NULL);
        walk_band_high(c, band, 0, update_band_masking, NULL);
    }
}

545 546
/*
 * Return the logarithmic level (see get_cb()) of the largest absolute value
 * among the first len entries of in. An empty range yields get_cb(c, 0).
 */
static inline int32_t find_peak(DCAEncContext *c, const int32_t *in, int len)
{
    int32_t peak = 0;
    int n;

    for (n = 0; n < len; n++) {
        const int32_t magnitude = abs(in[n]);

        peak = (peak < magnitude) ? magnitude : peak;
    }
    return get_cb(c, peak);
}

557
/*
 * Fill c->peak_cb[][] with the peak level of every subband of every
 * fullband channel and, when an LFE channel is present, c->lfe_peak_cb
 * with the peak level of the decimated LFE samples.
 */
static void find_peaks(DCAEncContext *c)
{
    int ch, band;

    for (ch = 0; ch < c->fullband_channels; ch++) {
        int32_t *peaks = c->peak_cb[ch];

        for (band = 0; band < 32; band++)
            peaks[band] = find_peak(c, c->subband[ch][band], SUBBAND_SAMPLES);
    }

    if (c->lfe_channel)
        c->lfe_peak_cb = find_peak(c, c->downsampled_lfe, DCA_LFE_SAMPLES);
}

/*
 * Decide for every subband of every fullband channel whether ADPCM
 * prediction is used.
 *
 * ff_dcaadpcm_subband_analysis() is given the subband samples, including
 * the DCA_ADPCM_COEFFS samples of head room that precede them. A
 * non-negative result is stored as the prediction mode, its side-info cost
 * is added to c->consumed_adpcm_bits, and the peak of the estimated
 * residual is stored in c->diff_peak_cb. Otherwise the mode is set to -1.
 */
static void adpcm_analysis(DCAEncContext *c)
{
    int ch, band;
    int pred_vq_id;
    int32_t *samples;
    int32_t estimated_diff[SUBBAND_SAMPLES];

    c->consumed_adpcm_bits = 0;
    for (ch = 0; ch < c->fullband_channels; ch++) {
        for (band = 0; band < 32; band++) {
            samples = c->subband[ch][band] - DCA_ADPCM_COEFFS;
            pred_vq_id = ff_dcaadpcm_subband_analysis(&c->adpcm_ctx, samples,
                                                      SUBBAND_SAMPLES, estimated_diff);
            if (pred_vq_id >= 0) {
                c->prediction_mode[ch][band] = pred_vq_id;
                c->consumed_adpcm_bits += 12; //12 bits to transmit prediction vq index
                /* Scan exactly the residual samples the analysis produced;
                 * the length is tied to the buffer size, not hard-coded */
                c->diff_peak_cb[ch][band] = find_peak(c, estimated_diff,
                                                      SUBBAND_SAMPLES);
            } else {
                c->prediction_mode[ch][band] = -1;
            }
        }
    }
}

Paul B Mahol's avatar
Paul B Mahol committed
595 596 597 598
/* NOTE(review): not referenced in the visible part of the file; presumably an
 * SNR offset used by the bit allocation further down - confirm */
static const int snr_fudge = 128;
/* Bit flags combined in the return value of init_quantization_noise() */
#define USED_1ABITS 1
#define USED_26ABITS 4

599
/*
 * Look up the quantizer step size for the bit allocation of (ch, band).
 * Bitrate index 3 selects the lossless table, any other index the lossy one.
 */
static inline int32_t get_step_size(DCAEncContext *c, int ch, int band)
{
    const int abits = c->abits[ch][band];

    if (c->bitrate_index == 3)
        return ff_dca_lossless_quant[abits];

    return ff_dca_lossy_quant[abits];
}

611 612
/*
 * Choose a scale factor index for a subband with the given peak level and
 * bit allocation, and store the matching combined quantizer in *quant.
 *
 * Starting from index 127, steps of 64, 32, ... 1 are subtracted as long as
 * the peak, quantized with the resulting candidate, still fits into the
 * available quantization levels. peak_cb must lie in [-2047, 0].
 *
 * Returns the chosen index, which is at most 124.
 */
static int calc_one_scale(DCAEncContext *c, int32_t peak_cb, int abits,
                          softfloat *quant)
{
    int32_t peak;
    int nscale = 127;
    int step;

    av_assert0(peak_cb <= 0);
    av_assert0(peak_cb >= -2047);

    peak = c->cb_to_level[-peak_cb];

    for (step = 64; step > 0; step >>= 1) {
        const int candidate = nscale - step;
        const int exp_sum = scalefactor_inv[candidate].e + stepsize_inv[abits].e;
        softfloat trial;

        /* The combined exponent must remain positive after the -17 bias */
        if (exp_sum <= 17)
            continue;

        trial.m = mul32(scalefactor_inv[candidate].m, stepsize_inv[abits].m);
        trial.e = exp_sum - 17;

        /* Accept the smaller index only if the peak still fits */
        if ((ff_dca_quant_levels[abits] - 1) / 2 >= quantize_value(peak, trial))
            nscale = candidate;
    }

    if (nscale >= 125)
        nscale = 124;

    quant->m = mul32(scalefactor_inv[nscale].m, stepsize_inv[abits].m);
    quant->e = scalefactor_inv[nscale].e + stepsize_inv[abits].e - 17;
    av_assert0((ff_dca_quant_levels[abits] - 1) / 2 >= quantize_value(peak, *quant));

    return nscale;
}

644 645 646 647
/*
 * Quantize one ADPCM-coded subband.
 *
 * The scale factor is chosen from the peak of the prediction residual
 * (c->diff_peak_cb), then ff_dcaadpcm_do_real() is called; it is passed the
 * subband's ADPCM history, the subband samples and c->quantized[ch][band]
 * as output buffer.
 */
static inline void quantize_adpcm_subband(DCAEncContext *c, int ch, int band)
{
    const int32_t diff_peak_cb = c->diff_peak_cb[ch][band];
    int32_t *hist = c->adpcm_history[ch][band];
    int32_t step_size;

    c->scale_factor[ch][band] = calc_one_scale(c, diff_peak_cb,
                                               c->abits[ch][band],
                                               &c->quant[ch][band]);
    step_size = get_step_size(c, ch, band);

    ff_dcaadpcm_do_real(c->prediction_mode[ch][band],
                        c->quant[ch][band],
                        ff_dca_scale_factor_quant7[c->scale_factor[ch][band]],
                        step_size, hist, c->subband[ch][band],
                        hist + 4, c->quantized[ch][band],
                        SUBBAND_SAMPLES, c->cb_to_level[-diff_peak_cb]);
}

/*
 * Quantize every subband whose prediction mode is non-negative, i.e. that
 * adpcm_analysis() selected for ADPCM coding.
 */
static void quantize_adpcm(DCAEncContext *c)
{
    int ch, band;

    for (ch = 0; ch < c->fullband_channels; ch++) {
        for (band = 0; band < 32; band++) {
            if (c->prediction_mode[ch][band] < 0)
                continue;
            quantize_adpcm_subband(c, ch, band);
        }
    }
}

/*
 * Quantize every subband that is not ADPCM coded (prediction mode -1) by
 * applying the subband's quantizer to each of its samples.
 */
static void quantize_pcm(DCAEncContext *c)
{
    int ch, band, n;

    for (ch = 0; ch < c->fullband_channels; ch++) {
        for (band = 0; band < 32; band++) {
            const int32_t *src = c->subband[ch][band];
            int32_t *dst = c->quantized[ch][band];

            if (c->prediction_mode[ch][band] != -1)
                continue;

            for (n = 0; n < SUBBAND_SAMPLES; n++)
                dst[n] = quantize_value(src[n], c->quant[ch][band]);
        }
    }
}

688 689
static void accumulate_huff_bit_consumption(int abits, int32_t *quantized,
                                            uint32_t *result)
690 691 692
{
    uint8_t sel, id = abits - 1;
    for (sel = 0; sel < ff_dca_quant_index_group_size[id]; sel++)
693 694
        result[sel] += ff_dca_vlc_calc_quant_bits(quantized, SUBBAND_SAMPLES,
                                                  sel, id);
695 696
}

697 698 699
static uint32_t set_best_code(uint32_t vlc_bits[DCA_CODE_BOOKS][7],
                              uint32_t clc_bits[DCA_CODE_BOOKS],
                              int32_t res[DCA_CODE_BOOKS])
700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737
{
    uint8_t i, sel;
    uint32_t best_sel_bits[DCA_CODE_BOOKS];
    int32_t best_sel_id[DCA_CODE_BOOKS];
    uint32_t t, bits = 0;

    for (i = 0; i < DCA_CODE_BOOKS; i++) {

        av_assert0(!((!!vlc_bits[i][0]) ^ (!!clc_bits[i])));
        if (vlc_bits[i][0] == 0) {
            /* do not transmit adjustment index for empty codebooks */
            res[i] = ff_dca_quant_index_group_size[i];
            /* and skip it */
            continue;
        }

        best_sel_bits[i] = vlc_bits[i][0];
        best_sel_id[i] = 0;
        for (sel = 0; sel < ff_dca_quant_index_group_size[i]; sel++) {
            if (best_sel_bits[i] > vlc_bits[i][sel] && vlc_bits[i][sel]) {
                best_sel_bits[i] = vlc_bits[i][sel];
                best_sel_id[i] = sel;
            }
        }

        /* 2 bits to transmit scale factor adjustment index */
        t = best_sel_bits[i] + 2;
        if (t < clc_bits[i]) {
            res[i] = best_sel_id[i];
            bits += t;
        } else {
            res[i] = ff_dca_quant_index_group_size[i];
            bits += clc_bits[i];
        }
    }
    return bits;
}

738 739
static uint32_t set_best_abits_code(int abits[DCAENC_SUBBANDS], int bands,
                                    int32_t *res)
740 741 742 743 744 745 746 747
{
    uint8_t i;
    uint32_t t;
    int32_t best_sel = 6;
    int32_t best_bits = bands * 5;

    /* Check do we have subband which cannot be encoded by Huffman tables */
    for (i = 0; i < bands; i++) {
748
        if (abits[i] > 12 || abits[i] == 0) {
749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765
            *res = best_sel;
            return best_bits;
        }
    }

    for (i = 0; i < DCA_BITALLOC_12_COUNT; i++) {
        t = ff_dca_vlc_calc_alloc_bits(abits, bands, i);
        if (t < best_bits) {
            best_bits = t;
            best_sel = i;
        }
    }

    *res = best_sel;
    return best_bits;
}

766
/**
 * Derive a bit allocation from a noise level, quantize with it and count
 * the bits the frame would need.
 *
 * Writes c->abits, c->bit_allocation_sel, c->scale_factor / c->quant (for
 * bands whose prediction_mode is -1), c->quant_index_sel and
 * c->consumed_bits, and runs quantize_adpcm() and quantize_pcm().
 *
 * @param c           encoder context
 * @param noise       noise level subtracted from each band's
 *                    peak-minus-masking value
 * @param forbid_zero when non-zero, bands that would get 0 bits get 1 instead
 * @return USED_26ABITS if every band got 26 bits, USED_1ABITS if every band
 *         got 1 bit, otherwise a value with the corresponding flags cleared
 */
static int init_quantization_noise(DCAEncContext *c, int noise, int forbid_zero)
{
    uint32_t huff_bit_count_accum[MAX_CHANNELS][DCA_CODE_BOOKS][7];
    uint32_t clc_bit_count_accum[MAX_CHANNELS][DCA_CODE_BOOKS];
    uint32_t sample_bits = 0;
    int usage = USED_26ABITS | USED_1ABITS;
    int ch, band;

    /* Costs that do not depend on the allocation chosen below. */
    c->consumed_bits  = 132 + 333 * c->fullband_channels;
    c->consumed_bits += c->consumed_adpcm_bits;
    if (c->lfe_channel)
        c->consumed_bits += 72;

    /* Map each band's signal-to-noise margin to a bit allocation index. */
    for (ch = 0; ch < c->fullband_channels; ch++) {
        for (band = 0; band < 32; band++) {
            const int snr_cb = c->peak_cb[ch][band] - c->band_masking_cb[band] - noise;
            int cleared = USED_26ABITS | USED_1ABITS;
            int abits;

            if (snr_cb >= 1312) {
                abits   = 26;
                cleared = USED_1ABITS;
            } else if (snr_cb >= 222) {
                abits = 8 + mul32(snr_cb - 222, 69000000);
            } else if (snr_cb >= 0) {
                abits = 2 + mul32(snr_cb, 106000000);
            } else if (forbid_zero || snr_cb >= -140) {
                abits   = 1;
                cleared = USED_26ABITS;
            } else {
                abits = 0;
            }

            c->abits[ch][band] = abits;
            usage &= ~cleared;
        }
        c->consumed_bits += set_best_abits_code(c->abits[ch], 32,
                                                &c->bit_allocation_sel[ch]);
    }

    /* Scale factors are recomputed on every call so that the quantized
     * values, and therefore the Huffman costs, match the allocation.
     * This is suboptimal. TODO: maybe cache the scaled values. */
    for (ch = 0; ch < c->fullband_channels; ch++) {
        for (band = 0; band < 32; band++) {
            if (c->prediction_mode[ch][band] != -1)
                continue;
            c->scale_factor[ch][band] = calc_one_scale(c, c->peak_cb[ch][band],
                                                       c->abits[ch][band],
                                                       &c->quant[ch][band]);
        }
    }
    quantize_adpcm(c);
    quantize_pcm(c);

    memset(huff_bit_count_accum, 0, sizeof(huff_bit_count_accum));
    memset(clc_bit_count_accum,  0, sizeof(clc_bit_count_accum));

    for (ch = 0; ch < c->fullband_channels; ch++) {
        for (band = 0; band < 32; band++) {
            const int abits = c->abits[ch][band];

            if (abits && abits <= DCA_CODE_BOOKS) {
                /* Huffman is possible: collect both costs, decide later. */
                accumulate_huff_bit_consumption(abits,
                                                c->quantized[ch][band],
                                                huff_bit_count_accum[ch][abits - 1]);
                clc_bit_count_accum[ch][abits - 1] += bit_consumption[abits];
            } else {
                sample_bits += bit_consumption[abits];
            }
        }
    }

    for (ch = 0; ch < c->fullband_channels; ch++)
        sample_bits += set_best_code(huff_bit_count_accum[ch],
                                     clc_bit_count_accum[ch],
                                     c->quant_index_sel[ch]);

    c->consumed_bits += sample_bits;

    return usage;
}

845
/**
 * Search for the lowest noise level whose bit allocation fits the frame.
 *
 * Starting from c->worst_quantization_noise, the level is moved in steps of
 * snr_fudge until the fit/no-fit boundary is bracketed, then refined by
 * halving the step. The result is stored in c->worst_quantization_noise and
 * c->worst_noise_ever is raised to it when it is higher.
 */
static void assign_bits(DCAEncContext *c)
{
    int lo_noise, hi_noise, step;
    int usage = 0;
    int forbid_zero = 1;

restart:
    init_quantization_noise(c, c->worst_quantization_noise, forbid_zero);
    lo_noise = hi_noise = c->worst_quantization_noise;

    if (c->consumed_bits > c->frame_bits) {
        /* Too many bits: raise the noise until the frame fits. */
        do {
            if (forbid_zero && usage == USED_1ABITS) {
                /* Every band is already at 1 bit; allow 0 bits and start over. */
                forbid_zero = 0;
                goto restart;
            }
            lo_noise  = hi_noise;
            hi_noise += snr_fudge;
            usage = init_quantization_noise(c, hi_noise, forbid_zero);
        } while (c->consumed_bits > c->frame_bits);
    } else {
        /* Bits to spare: lower the noise until the frame no longer fits. */
        do {
            hi_noise = lo_noise;
            if (usage == USED_26ABITS)
                goto out; /* The requested bitrate is too high, pad with zeros */
            lo_noise -= snr_fudge;
            usage = init_quantization_noise(c, lo_noise, forbid_zero);
        } while (c->consumed_bits <= c->frame_bits);
    }

    /* Binary search below hi_noise for the smallest level that still fits. */
    step = snr_fudge >> 1;
    while (step) {
        init_quantization_noise(c, hi_noise - step, forbid_zero);
        if (c->consumed_bits <= c->frame_bits)
            hi_noise -= step;
        step >>= 1;
    }

    /* Leave the context in the state matching the final noise level. */
    init_quantization_noise(c, hi_noise, forbid_zero);
out:
    c->worst_quantization_noise = hi_noise;
    if (hi_noise > c->worst_noise_ever)
        c->worst_noise_ever = hi_noise;
}

887
/**
 * Store 512 samples per channel from an interleaved input buffer.
 *
 * c->history[ch][k] receives the sample of frame position k taken from the
 * input channel c->channel_order_tab[ch].
 *
 * @param c     encoder context
 * @param input interleaved samples, c->channels values per frame position
 */
static void shift_history(DCAEncContext *c, const int32_t *input)
{
    int ch, pos;

    for (ch = 0; ch < c->channels; ch++) {
        const int src_ch = c->channel_order_tab[ch];

        for (pos = 0; pos < 512; pos++)
            c->history[ch][pos] = input[pos * c->channels + src_ch];
    }
}

899 900 901 902 903 904 905 906 907 908 909 910 911 912 913
/**
 * Refresh the ADPCM history and the samples used for the next LPC analysis.
 *
 * For bands that were not ADPCM coded in this frame (prediction_mode == -1)
 * the last four quantized samples are dequantized into c->adpcm_history,
 * because that data is needed if the band is ADPCM coded in the next frame.
 * For ADPCM coded bands the history is advanced by four entries instead.
 * In both cases the four history values, scaled by 128, are written
 * immediately before the band's subband samples.
 */
static void fill_in_adpcm_bufer(DCAEncContext *c)
{
    int ch, band, i;

    for (ch = 0; ch < c->channels; ch++) {
        for (band = 0; band < 32; band++) {
            int32_t *samples = c->subband[ch][band] - DCA_ADPCM_COEFFS;

            if (c->prediction_mode[ch][band] == -1) {
                int32_t step_size = get_step_size(c, ch, band);

                ff_dca_core_dequantize(c->adpcm_history[ch][band],
                                       c->quantized[ch][band] + 12, step_size,
                                       ff_dca_scale_factor_quant7[c->scale_factor[ch][band]], 0, 4);
            } else {
                AV_COPY128U(c->adpcm_history[ch][band], c->adpcm_history[ch][band] + 4);
            }

            /* Copy dequantized values for LPC analysis.
             * This reduces artifacts under extreme quantization. Example:
             * the current frame has abits == 1 and no prediction flag, but
             * ends in a sine-like signal. LPC analysis on the original
             * values would likely report a good prediction gain and set the
             * prediction flag, yet the decoder history holds no matching
             * values, so the result would be poor. The bitstream has a
             * "Predictor history flag switch", but it disables history for
             * all subbands at once.
             *
             * The scaling is a multiplication, not "<< 7": history values
             * may be negative and left-shifting a negative value is
             * undefined behaviour in C. */
            for (i = 0; i < 4; i++)
                samples[i] = c->adpcm_history[ch][band][i] * (1 << 7);
        }
    }
}

935
/**
 * Compute the LFE scale factor and quantizer from the LFE peak.
 *
 * Does nothing when there is no LFE channel. Otherwise calc_one_scale() is
 * called with a bit allocation index of 11; its result goes to
 * c->lfe_scale_factor and the quantizer to c->lfe_quant.
 */
static void calc_lfe_scales(DCAEncContext *c)
{
    if (!c->lfe_channel)
        return;

    c->lfe_scale_factor = calc_one_scale(c, c->lfe_peak_cb, 11, &c->lfe_quant);
}

941
/**
 * Write the frame header fields to c->pb.
 *
 * Most fields are constants; the frame size, channel arrangement, sample
 * rate code, bit rate index and LFE flag come from the encoder context.
 */
static void put_frame_header(DCAEncContext *c)
{
    PutBitContext *pb = &c->pb;

    /* Sync word, written as two 16-bit halves */
    put_bits(pb, 16, 0x7ffe);
    put_bits(pb, 16, 0x8001);

    put_bits(pb, 1, 1);                     /* frame type: normal */
    put_bits(pb, 5, 31);                    /* deficit sample count: none */
    put_bits(pb, 1, 0);                     /* CRC: not present */
    put_bits(pb, 7, SUBBAND_SAMPLES - 1);   /* number of PCM sample blocks */
    put_bits(pb, 14, c->frame_size - 1);    /* primary frame byte size */
    put_bits(pb, 6, c->channel_config);     /* audio channel arrangement */

    /* Core audio sampling frequency */
    put_bits(pb, 4, bitstream_sfreq[c->samplerate_index]);

    put_bits(pb, 5, c->bitrate_index);      /* transmission bit rate */

    put_bits(pb, 1, 0);                     /* embedded down mix: disabled */
    put_bits(pb, 1, 0);                     /* embedded dynamic range: not present */
    put_bits(pb, 1, 0);                     /* embedded time stamp: not present */
    put_bits(pb, 1, 0);                     /* auxiliary data: not present */
    put_bits(pb, 1, 0);                     /* HDCD source: no */
    put_bits(pb, 3, 0);                     /* extension audio ID: N/A */
    put_bits(pb, 1, 0);                     /* extended audio data: not present */
    put_bits(pb, 1, 0);                     /* audio sync word insertion: after each sub-frame */

    /* Low frequency effects flag: not present or 64x subsampling */
    put_bits(pb, 2, c->lfe_channel ? 2 : 0);

    put_bits(pb, 1, 1);                     /* predictor history switch: on */

    /* No header CRC word is written since the CRC flag above is 0. */

    put_bits(pb, 1, 0);                     /* multirate interpolator: non-perfect reconstruction */
    put_bits(pb, 4, 7);                     /* encoder software revision: 7 */
    put_bits(pb, 2, 0);                     /* copy history: 0 */
    put_bits(pb, 3, 0);                     /* source PCM resolution: 16 bits, not DTS ES */
    put_bits(pb, 1, 0);                     /* front sum/difference coding: no */
    put_bits(pb, 1, 0);                     /* surrounds sum/difference coding: no */
    put_bits(pb, 4, 0);                     /* dialog normalization: 0 dB */
}

1024
/**
 * Write the primary audio coding header to c->pb.
 *
 * Each per-channel field is written for all full-band channels before the
 * next field starts, so the loops below must stay separate.
 */
static void put_primary_audio_header(DCAEncContext *c)
{
    PutBitContext *pb = &c->pb;
    const int nch = c->fullband_channels;
    int ch, book;

    put_bits(pb, 4, SUBFRAMES - 1);         /* number of subframes */
    put_bits(pb, 3, nch - 1);               /* number of primary audio channels */

    /* Subband activity count */
    for (ch = 0; ch < nch; ch++)
        put_bits(pb, 5, DCAENC_SUBBANDS - 2);

    /* High frequency VQ start subband */
    for (ch = 0; ch < nch; ch++)
        put_bits(pb, 5, DCAENC_SUBBANDS - 1);

    /* Joint intensity coding index: 0 for every channel */
    for (ch = 0; ch < nch; ch++)
        put_bits(pb, 3, 0);

    /* Transient mode codebook: A4 (arbitrary) */
    for (ch = 0; ch < nch; ch++)
        put_bits(pb, 2, 0);

    /* Scale factor code book: 7 bit linear, 7-bit sqrt table */
    for (ch = 0; ch < nch; ch++)
        put_bits(pb, 3, 6);

    /* Bit allocation quantizer select: the selector chosen per channel */
    for (ch = 0; ch < nch; ch++)
        put_bits(pb, 3, c->bit_allocation_sel[ch]);

    /* Quantization index codebook select, codebook-major order */
    for (book = 0; book < DCA_CODE_BOOKS; book++)
        for (ch = 0; ch < nch; ch++)
            put_bits(pb, ff_dca_quant_index_sel_nbits[book],
                     c->quant_index_sel[ch][book]);

    /* Scale factor adjustment index: only sent for Huffman coded codebooks,
     * i.e. when the selector is below the group size; always 0 */
    for (book = 0; book < DCA_CODE_BOOKS; book++) {
        for (ch = 0; ch < nch; ch++) {
            if (c->quant_index_sel[ch][book] >= ff_dca_quant_index_group_size[book])
                continue;
            put_bits(pb, 2, 0);
        }
    }

    /* Audio header CRC check word: not transmitted */
}

1071
/**
 * Write the 8 quantized samples of one subsubframe of one band.
 *
 * Three encodings are used, depending on the band's bit allocation index:
 * Huffman codes when the index is within DCA_CODE_BOOKS and a Huffman
 * selector was chosen, block codes (4 samples per code word) when the index
 * is at most 7, and plain signed values otherwise.
 *
 * @param c    encoder context
 * @param ss   subsubframe index; samples ss * 8 .. ss * 8 + 7 are written
 * @param band subband index
 * @param ch   channel index
 */
static void put_subframe_samples(DCAEncContext *c, int ss, int band, int ch)
{
    const int abits = c->abits[ch][band];
    int32_t *block  = &c->quantized[ch][band][ss * 8];
    int first, k, width;

    if (abits <= DCA_CODE_BOOKS) {
        int sel;

        av_assert0(abits > 0);
        sel = c->quant_index_sel[ch][abits - 1];

        /* Huffman codes */
        if (sel < ff_dca_quant_index_group_size[abits - 1]) {
            ff_dca_vlc_enc_quant(&c->pb, block, 8, sel, abits - 1);
            return;
        }

        /* Block codes: four samples packed into one code word, last
         * sample in the most significant position */
        if (abits <= 7) {
            for (first = 0; first < 8; first += 4) {
                int packed = 0;

                for (k = 3; k >= 0; k--) {
                    packed *= ff_dca_quant_levels[abits];
                    packed += block[first + k];
                    packed += (ff_dca_quant_levels[abits] - 1) / 2;
                }
                put_bits(&c->pb, bit_consumption[abits] / 4, packed);
            }
            return;
        }
    }

    /* Fixed-width signed values */
    width = bit_consumption[abits] / 16;
    for (k = 0; k < 8; k++)
        put_sbits(&c->pb, width, block[k]);
}

1105
/**
 * Write one subframe to c->pb: side information, LFE data, audio samples
 * and the trailing DSYNC word.
 *
 * @param c        encoder context
 * @param subframe subframe index; not used by the body
 */
static void put_subframe(DCAEncContext *c, int subframe)
{
    PutBitContext *pb = &c->pb;
    const int nch = c->fullband_channels;
    int ch, band, ss, n;

    put_bits(pb, 2, SUBSUBFRAMES - 1);      /* subsubframes count */
    put_bits(pb, 3, 0);                     /* partial subsubframe sample count: dummy */

    /* Prediction mode: 1 when the band uses ADPCM, i.e. prediction_mode != -1 */
    for (ch = 0; ch < nch; ch++)
        for (band = 0; band < DCAENC_SUBBANDS; band++)
            put_bits(pb, 1, !(c->prediction_mode[ch][band] == -1));

    /* Prediction VQ address, only for bands with a non-negative prediction_mode */
    for (ch = 0; ch < nch; ch++) {
        for (band = 0; band < DCAENC_SUBBANDS; band++) {
            if (c->prediction_mode[ch][band] < 0)
                continue;
            put_bits(pb, 12, c->prediction_mode[ch][band]);
        }
    }

    /* Bit allocation index: 5 bits each for selector 6, table coded otherwise */
    for (ch = 0; ch < nch; ch++) {
        if (c->bit_allocation_sel[ch] != 6) {
            ff_dca_vlc_enc_alloc(pb, c->abits[ch], DCAENC_SUBBANDS,
                                 c->bit_allocation_sel[ch]);
            continue;
        }
        for (band = 0; band < DCAENC_SUBBANDS; band++)
            put_bits(pb, 5, c->abits[ch][band]);
    }

    /* Transition mode: none, sent only when there are several subsubframes */
    if (SUBSUBFRAMES > 1) {
        for (ch = 0; ch < nch; ch++)
            for (band = 0; band < DCAENC_SUBBANDS; band++)
                if (c->abits[ch][band])
                    put_bits(pb, 1, 0); /* codebook A4 */
    }

    /* Scale factors of bands that carry data */
    for (ch = 0; ch < nch; ch++)
        for (band = 0; band < DCAENC_SUBBANDS; band++)
            if (c->abits[ch][band])
                put_bits(pb, 7, c->scale_factor[ch][band]);

    /* Joint subband scale factor codebook select: not transmitted */
    /* Scale factors for joint subband coding: not transmitted */
    /* Stereo down-mix coefficients: not transmitted */
    /* Dynamic range coefficient: not transmitted */
    /* Side information CRC check word: not transmitted */
    /* VQ encoded high frequency subbands: not transmitted */

    /* LFE data: DCA_LFE_SAMPLES quantized samples followed by the scale factor */
    if (c->lfe_channel) {
        for (n = 0; n < DCA_LFE_SAMPLES; n++)
            put_bits(pb, 8, quantize_value(c->downsampled_lfe[n], c->lfe_quant) & 0xff);
        put_bits(pb, 8, c->lfe_scale_factor);
    }

    /* Audio data, one subsubframe at a time */
    for (ss = 0; ss < SUBSUBFRAMES; ss++)
        for (ch = 0; ch < nch; ch++)
            for (band = 0; band < DCAENC_SUBBANDS; band++)
                if (c->abits[ch][band])
                    put_subframe_samples(c, ss, band, ch);

    /* DSYNC */
    put_bits(pb, 16, 0xffff);
}

1177 1178
/**
 * Encode one frame of interleaved 32-bit samples into a packet of
 * c->frame_size bytes.
 *
 * @param avctx          codec context; priv_data is the DCAEncContext
 * @param avpkt          output packet, allocated here
 * @param frame          input frame; samples are read from data[0]
 * @param got_packet_ptr set to 1 on success
 * @return 0 on success, or the negative value returned by
 *         ff_alloc_packet2() on failure
 */
static int encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
                        const AVFrame *frame, int *got_packet_ptr)
{
    DCAEncContext *c = avctx->priv_data;
    const int32_t *samples;
    int err, n, bit;

    err = ff_alloc_packet2(avctx, avpkt, c->frame_size, 0);
    if (err < 0)
        return err;

    samples = (const int32_t *)frame->data[0];

    /* Analysis */
    subband_transform(c, samples);
    if (c->lfe_channel)
        lfe_downsample(c, samples);

    calc_masking(c, samples);
    if (c->options.adpcm_mode)
        adpcm_analysis(c);
    find_peaks(c);
    assign_bits(c);
    calc_lfe_scales(c);
    shift_history(c, samples);

    /* Bitstream */
    init_put_bits(&c->pb, avpkt->data, avpkt->size);
    fill_in_adpcm_bufer(c);
    put_frame_header(c);
    put_primary_audio_header(c);
    for (n = 0; n < SUBFRAMES; n++)
        put_subframe(c, n);

    /* Pad with zero bits up to the fixed frame size. */
    bit = put_bits_count(&c->pb);
    while (bit < 8 * c->frame_size) {
        put_bits(&c->pb, 1, 0);
        bit++;
    }

    flush_put_bits(&c->pb);

    avpkt->pts      = frame->pts;
    avpkt->duration = ff_samples_to_time_base(avctx, frame->nb_samples);
    avpkt->size     = put_bits_count(&c->pb) >> 3;
    *got_packet_ptr = 1;

    return 0;
}

1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234
/* Flags applied to the private options of this encoder. The replacement
 * list is parenthesized so that it stays a single operand when the macro is
 * used inside a larger expression. */
#define DCAENC_FLAGS (AV_OPT_FLAG_ENCODING_PARAM | AV_OPT_FLAG_AUDIO_PARAM)

/* Private options of the encoder, referenced from dcaenc_class. */
static const AVOption options[] = {
    /* "dca_adpcm": boolean stored in DCAEncContext.options.adpcm_mode,
     * default 0, allowed range 0..1 */
    { "dca_adpcm", "Use ADPCM encoding", offsetof(DCAEncContext, options.adpcm_mode), AV_OPT_TYPE_BOOL, {.i64 = 0}, 0, 1, DCAENC_FLAGS },
    /* list terminator */
    { NULL },
};

/* AVClass describing the encoder's private context; it ties the option
 * table above to the codec through ff_dca_encoder.priv_class. */
static const AVClass dcaenc_class = {
    .class_name = "DCA (DTS Coherent Acoustics)",
    .item_name = av_default_item_name,
    .option = options,
    .version = LIBAVUTIL_VERSION_INT,
};

Paul B Mahol's avatar
Paul B Mahol committed
1235 1236 1237 1238 1239
/* Codec-level default option values, referenced from ff_dca_encoder. */
static const AVCodecDefault defaults[] = {
    /* option "b" defaults to 1411200 */
    { "b",          "1411200" },
    /* list terminator */
    { NULL },
};

Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
1240
AVCodec ff_dca_encoder = {
Paul B Mahol's avatar
Paul B Mahol committed
1241
    .name                  = "dca",
1242
    .long_name             = NULL_IF_CONFIG_SMALL("DCA (DTS Coherent Acoustics)"),
Paul B Mahol's avatar
Paul B Mahol committed
1243 1244
    .type                  = AVMEDIA_TYPE_AUDIO,
    .id                    = AV_CODEC_ID_DTS,
1245
    .priv_data_size        = sizeof(DCAEncContext),
Paul B Mahol's avatar
Paul B Mahol committed
1246
    .init                  = encode_init,
1247
    .close                 = encode_close,
Paul B Mahol's avatar
Paul B Mahol committed
1248
    .encode2               = encode_frame,
1249
    .capabilities          = AV_CODEC_CAP_EXPERIMENTAL,
1250
    .caps_internal         = FF_CODEC_CAP_INIT_THREADSAFE | FF_CODEC_CAP_INIT_CLEANUP,
Paul B Mahol's avatar
Paul B Mahol committed
1251 1252 1253 1254 1255 1256 1257 1258 1259 1260
    .sample_fmts           = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_S32,
                                                            AV_SAMPLE_FMT_NONE },
    .supported_samplerates = sample_rates,
    .channel_layouts       = (const uint64_t[]) { AV_CH_LAYOUT_MONO,
                                                  AV_CH_LAYOUT_STEREO,
                                                  AV_CH_LAYOUT_2_2,
                                                  AV_CH_LAYOUT_5POINT0,
                                                  AV_CH_LAYOUT_5POINT1,
                                                  0 },
    .defaults              = defaults,
1261
    .priv_class            = &dcaenc_class,
Alexander E. Patrakov's avatar
Alexander E. Patrakov committed
1262
};