libopencore-amr.c 11.5 KB
Newer Older
1 2 3 4
/*
 * AMR Audio decoder stub
 * Copyright (c) 2003 the ffmpeg project
 *
5
 * This file is part of Libav.
6
 *
7
 * Libav is free software; you can redistribute it and/or
8 9 10 11
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
12
 * Libav is distributed in the hope that it will be useful,
13 14 15 16 17
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
18
 * License along with Libav; if not, write to the Free Software
19 20 21
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

22
#include "libavutil/avstring.h"
23
#include "libavutil/channel_layout.h"
24
#include "libavutil/common.h"
25
#include "libavutil/opt.h"
26
#include "avcodec.h"
27 28
#include "audio_frame_queue.h"
#include "internal.h"
29

30
static int amr_decode_fix_avctx(AVCodecContext *avctx)
31
{
32
    const int is_amr_wb = 1 + (avctx->codec_id == AV_CODEC_ID_AMR_WB);
33

34
    avctx->sample_rate = 8000 * is_amr_wb;
35

36
    if (avctx->channels > 1) {
37
        avpriv_report_missing_feature(avctx, "multi-channel AMR");
38 39
        return AVERROR_PATCHWELCOME;
    }
40

41 42 43
    avctx->channels       = 1;
    avctx->channel_layout = AV_CH_LAYOUT_MONO;
    avctx->sample_fmt     = AV_SAMPLE_FMT_S16;
44
    return 0;
45 46 47 48 49 50 51 52
}

#if CONFIG_LIBOPENCORE_AMRNB

#include <opencore-amrnb/interf_dec.h>
#include <opencore-amrnb/interf_enc.h>

typedef struct AMRContext {
53
    AVClass *av_class;
54 55
    void *dec_state;
    void *enc_state;
56
    int   enc_bitrate;
57
    int   enc_mode;
58
    int   enc_dtx;
59
    int   enc_last_frame;
60
    AudioFrameQueue afq;
61 62
} AMRContext;

63
#if CONFIG_LIBOPENCORE_AMRNB_DECODER
64 65
static av_cold int amr_nb_decode_init(AVCodecContext *avctx)
{
66
    AMRContext *s  = avctx->priv_data;
67 68 69 70
    int ret;

    if ((ret = amr_decode_fix_avctx(avctx)) < 0)
        return ret;
71

72 73
    s->dec_state   = Decoder_Interface_init();
    if (!s->dec_state) {
74
        av_log(avctx, AV_LOG_ERROR, "Decoder_Interface_init error\n");
75 76 77 78 79 80 81 82 83 84
        return -1;
    }

    return 0;
}

static av_cold int amr_nb_decode_close(AVCodecContext *avctx)
{
    AMRContext *s = avctx->priv_data;

85
    Decoder_Interface_exit(s->dec_state);
86

87 88 89 90
    return 0;
}

static int amr_nb_decode_frame(AVCodecContext *avctx, void *data,
91
                               int *got_frame_ptr, AVPacket *avpkt)
92
{
93
    AVFrame *frame     = data;
94 95
    const uint8_t *buf = avpkt->data;
    int buf_size       = avpkt->size;
96
    AMRContext *s      = avctx->priv_data;
97 98
    static const uint8_t block_size[16] = { 12, 13, 15, 17, 19, 20, 26, 31, 5, 0, 0, 0, 0, 0, 0, 0 };
    enum Mode dec_mode;
99
    int packet_size, ret;
100

101
    ff_dlog(avctx, "amr_decode_frame buf=%p buf_size=%d frame_count=%d!!\n",
102
            buf, buf_size, avctx->frame_number);
103

104
    /* get output buffer */
105
    frame->nb_samples = 160;
106
    if ((ret = ff_get_buffer(avctx, frame, 0)) < 0) {
107 108
        av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n");
        return ret;
109 110
    }

111
    dec_mode    = (buf[0] >> 3) & 0x000F;
112 113 114 115 116
    packet_size = block_size[dec_mode] + 1;

    if (packet_size > buf_size) {
        av_log(avctx, AV_LOG_ERROR, "amr frame too short (%u, should be %u)\n",
               buf_size, packet_size);
117
        return AVERROR_INVALIDDATA;
118 119
    }

120
    ff_dlog(avctx, "packet_size=%d buf= 0x%X %X %X %X\n",
121
              packet_size, buf[0], buf[1], buf[2], buf[3]);
122
    /* call decoder */
123
    Decoder_Interface_Decode(s->dec_state, buf, (short *)frame->data[0], 0);
124

125
    *got_frame_ptr = 1;
126 127 128 129

    return packet_size;
}

130
AVCodec ff_libopencore_amrnb_decoder = {
131
    .name           = "libopencore_amrnb",
132
    .long_name      = NULL_IF_CONFIG_SMALL("OpenCORE AMR-NB (Adaptive Multi-Rate Narrow-Band)"),
133
    .type           = AVMEDIA_TYPE_AUDIO,
134
    .id             = AV_CODEC_ID_AMR_NB,
135 136 137 138
    .priv_data_size = sizeof(AMRContext),
    .init           = amr_nb_decode_init,
    .close          = amr_nb_decode_close,
    .decode         = amr_nb_decode_frame,
139
    .capabilities   = CODEC_CAP_DR1,
140
};
141
#endif /* CONFIG_LIBOPENCORE_AMRNB_DECODER */
142

143
#if CONFIG_LIBOPENCORE_AMRNB_ENCODER
144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187
/* Common code for fixed and float version*/
typedef struct AMR_bitrates {
    int       rate;
    enum Mode mode;
} AMR_bitrates;

/* Match desired bitrate */
static int get_bitrate_mode(int bitrate, void *log_ctx)
{
    /* make the correspondance between bitrate and mode */
    static const AMR_bitrates rates[] = {
        { 4750, MR475 }, { 5150, MR515 }, {  5900, MR59  }, {  6700, MR67  },
        { 7400, MR74 },  { 7950, MR795 }, { 10200, MR102 }, { 12200, MR122 }
    };
    int i, best = -1, min_diff = 0;
    char log_buf[200];

    for (i = 0; i < 8; i++) {
        if (rates[i].rate == bitrate)
            return rates[i].mode;
        if (best < 0 || abs(rates[i].rate - bitrate) < min_diff) {
            best     = i;
            min_diff = abs(rates[i].rate - bitrate);
        }
    }
    /* no bitrate matching exactly, log a warning */
    snprintf(log_buf, sizeof(log_buf), "bitrate not supported: use one of ");
    for (i = 0; i < 8; i++)
        av_strlcatf(log_buf, sizeof(log_buf), "%.2fk, ", rates[i].rate    / 1000.f);
    av_strlcatf(log_buf, sizeof(log_buf), "using %.2fk", rates[best].rate / 1000.f);
    av_log(log_ctx, AV_LOG_WARNING, "%s\n", log_buf);

    return best;
}

static const AVOption options[] = {
    { "dtx", "Allow DTX (generate comfort noise)", offsetof(AMRContext, enc_dtx), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM },
    { NULL }
};

static const AVClass class = {
    "libopencore_amrnb", av_default_item_name, options, LIBAVUTIL_VERSION_INT
};

188 189 190 191 192 193
static av_cold int amr_nb_encode_init(AVCodecContext *avctx)
{
    AMRContext *s = avctx->priv_data;

    if (avctx->sample_rate != 8000) {
        av_log(avctx, AV_LOG_ERROR, "Only 8000Hz sample rate supported\n");
194
        return AVERROR(ENOSYS);
195 196 197 198
    }

    if (avctx->channels != 1) {
        av_log(avctx, AV_LOG_ERROR, "Only mono supported\n");
199
        return AVERROR(ENOSYS);
200 201 202
    }

    avctx->frame_size  = 160;
203
    avctx->initial_padding = 50;
204
    ff_af_queue_init(avctx, &s->afq);
205

206
    s->enc_state = Encoder_Interface_init(s->enc_dtx);
207
    if (!s->enc_state) {
208
        av_log(avctx, AV_LOG_ERROR, "Encoder_Interface_init error\n");
209
        av_freep(&avctx->coded_frame);
210 211 212
        return -1;
    }

213 214
    s->enc_mode    = get_bitrate_mode(avctx->bit_rate, avctx);
    s->enc_bitrate = avctx->bit_rate;
215 216 217 218 219 220 221 222

    return 0;
}

static av_cold int amr_nb_encode_close(AVCodecContext *avctx)
{
    AMRContext *s = avctx->priv_data;

223
    Encoder_Interface_exit(s->enc_state);
224
    ff_af_queue_close(&s->afq);
225 226 227
    return 0;
}

228 229
static int amr_nb_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
                               const AVFrame *frame, int *got_packet_ptr)
230 231
{
    AMRContext *s = avctx->priv_data;
232
    int written, ret;
233
    int16_t *flush_buf = NULL;
234
    const int16_t *samples = frame ? (const int16_t *)frame->data[0] : NULL;
235

236 237 238 239
    if (s->enc_bitrate != avctx->bit_rate) {
        s->enc_mode    = get_bitrate_mode(avctx->bit_rate, avctx);
        s->enc_bitrate = avctx->bit_rate;
    }
240

241 242 243 244 245 246 247 248
    if ((ret = ff_alloc_packet(avpkt, 32))) {
        av_log(avctx, AV_LOG_ERROR, "Error getting output packet\n");
        return ret;
    }

    if (frame) {
        if (frame->nb_samples < avctx->frame_size) {
            flush_buf = av_mallocz(avctx->frame_size * sizeof(*flush_buf));
249 250
            if (!flush_buf)
                return AVERROR(ENOMEM);
251
            memcpy(flush_buf, samples, frame->nb_samples * sizeof(*flush_buf));
252
            samples = flush_buf;
253
            if (frame->nb_samples < avctx->frame_size - avctx->initial_padding)
254 255
                s->enc_last_frame = -1;
        }
256
        if ((ret = ff_af_queue_add(&s->afq, frame)) < 0) {
257 258 259
            av_freep(&flush_buf);
            return ret;
        }
260 261 262
    } else {
        if (s->enc_last_frame < 0)
            return 0;
263
        flush_buf = av_mallocz(avctx->frame_size * sizeof(*flush_buf));
264 265 266 267 268 269 270
        if (!flush_buf)
            return AVERROR(ENOMEM);
        samples = flush_buf;
        s->enc_last_frame = -1;
    }

    written = Encoder_Interface_Encode(s->enc_state, s->enc_mode, samples,
271
                                       avpkt->data, 0);
272
    ff_dlog(avctx, "amr_nb_encode_frame encoded %u bytes, bitrate %u, first byte was %#02x\n",
273
            written, s->enc_mode, frame[0]);
274

275 276 277 278 279 280
    /* Get the next frame pts/duration */
    ff_af_queue_remove(&s->afq, avctx->frame_size, &avpkt->pts,
                       &avpkt->duration);

    avpkt->size = written;
    *got_packet_ptr = 1;
281
    av_freep(&flush_buf);
282
    return 0;
283 284
}

285
AVCodec ff_libopencore_amrnb_encoder = {
286
    .name           = "libopencore_amrnb",
287
    .long_name      = NULL_IF_CONFIG_SMALL("OpenCORE AMR-NB (Adaptive Multi-Rate Narrow-Band)"),
288
    .type           = AVMEDIA_TYPE_AUDIO,
289
    .id             = AV_CODEC_ID_AMR_NB,
290 291
    .priv_data_size = sizeof(AMRContext),
    .init           = amr_nb_encode_init,
292
    .encode2        = amr_nb_encode_frame,
293
    .close          = amr_nb_encode_close,
294
    .capabilities   = CODEC_CAP_DELAY | CODEC_CAP_SMALL_LAST_FRAME,
295 296 297
    .sample_fmts    = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_S16,
                                                     AV_SAMPLE_FMT_NONE },
    .priv_class     = &class,
298
};
299
#endif /* CONFIG_LIBOPENCORE_AMRNB_ENCODER */
300

301
#endif /* CONFIG_LIBOPENCORE_AMRNB */
302 303

/* -----------AMR wideband ------------*/
304
#if CONFIG_LIBOPENCORE_AMRWB_DECODER
305 306 307 308 309 310 311 312 313 314 315

#include <opencore-amrwb/dec_if.h>
#include <opencore-amrwb/if_rom.h>

typedef struct AMRWBContext {
    void  *state;
} AMRWBContext;

static av_cold int amr_wb_decode_init(AVCodecContext *avctx)
{
    AMRWBContext *s = avctx->priv_data;
316
    int ret;
317

318 319
    if ((ret = amr_decode_fix_avctx(avctx)) < 0)
        return ret;
320

321
    s->state        = D_IF_init();
322 323 324 325 326

    return 0;
}

static int amr_wb_decode_frame(AVCodecContext *avctx, void *data,
327
                               int *got_frame_ptr, AVPacket *avpkt)
328
{
329
    AVFrame *frame     = data;
330 331
    const uint8_t *buf = avpkt->data;
    int buf_size       = avpkt->size;
332
    AMRWBContext *s    = avctx->priv_data;
333 334
    int mode, ret;
    int packet_size;
335 336
    static const uint8_t block_size[16] = {18, 24, 33, 37, 41, 47, 51, 59, 61, 6, 6, 0, 0, 0, 1, 1};

337
    /* get output buffer */
338
    frame->nb_samples = 320;
339
    if ((ret = ff_get_buffer(avctx, frame, 0)) < 0) {
340 341
        av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n");
        return ret;
342 343
    }

344
    mode        = (buf[0] >> 3) & 0x000F;
345 346 347 348 349
    packet_size = block_size[mode];

    if (packet_size > buf_size) {
        av_log(avctx, AV_LOG_ERROR, "amr frame too short (%u, should be %u)\n",
               buf_size, packet_size + 1);
350
        return AVERROR_INVALIDDATA;
351 352
    }

353
    D_IF_decode(s->state, buf, (short *)frame->data[0], _good_frame);
354

355
    *got_frame_ptr = 1;
356

357 358 359 360 361 362 363 364 365 366 367
    return packet_size;
}

static int amr_wb_decode_close(AVCodecContext *avctx)
{
    AMRWBContext *s = avctx->priv_data;

    D_IF_exit(s->state);
    return 0;
}

368
AVCodec ff_libopencore_amrwb_decoder = {
369
    .name           = "libopencore_amrwb",
370
    .long_name      = NULL_IF_CONFIG_SMALL("OpenCORE AMR-WB (Adaptive Multi-Rate Wide-Band)"),
371
    .type           = AVMEDIA_TYPE_AUDIO,
372
    .id             = AV_CODEC_ID_AMR_WB,
373 374 375 376
    .priv_data_size = sizeof(AMRWBContext),
    .init           = amr_wb_decode_init,
    .close          = amr_wb_decode_close,
    .decode         = amr_wb_decode_frame,
377
    .capabilities   = CODEC_CAP_DR1,
378 379
};

380
#endif /* CONFIG_LIBOPENCORE_AMRWB_DECODER */