libvo-amrwbenc.c 5.02 KB
Newer Older
/*
 * AMR Audio encoder stub
 * Copyright (c) 2003 the ffmpeg project
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include <vo-amrwbenc/enc_if.h>
23 24
#include <stdio.h>
#include <stdlib.h>
25

26
#include "libavutil/avstring.h"
27 28
#include "libavutil/internal.h"
#include "libavutil/mem.h"
29
#include "libavutil/opt.h"
30 31 32 33
#include "avcodec.h"
#include "internal.h"

/*
 * Size in bytes of the buffer requested for one encoded frame, and the
 * upper bound accepted for the encoder's return value: one byte plus
 * 477 bits rounded up to whole bytes, i.e. 61.
 * NOTE(review): 477 is presumably the payload bit count of the largest
 * AMR-WB mode and the extra byte a frame header -- confirm against the
 * codec specification.
 */
#define MAX_PACKET_SIZE  (1 + (477 + 7) / 8)
34 35

typedef struct AMRWBContext {
36
    AVClass *av_class;
37 38
    void  *state;
    int    mode;
39
    int    last_bitrate;
40 41 42
    int    allow_dtx;
} AMRWBContext;

43
static const AVOption options[] = {
44
    { "dtx", "Allow DTX (generate comfort noise)", offsetof(AMRWBContext, allow_dtx), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM },
45 46 47 48 49 50 51
    { NULL }
};

static const AVClass class = {
    "libvo_amrwbenc", av_default_item_name, options, LIBAVUTIL_VERSION_INT
};

52
static int get_wb_bitrate_mode(int bitrate, void *log_ctx)
53 54
{
    /* make the correspondance between bitrate and mode */
55 56
    static const int rates[] = {  6600,  8850, 12650, 14250, 15850, 18250,
                                 19850, 23050, 23850 };
57 58
    int i, best = -1, min_diff = 0;
    char log_buf[200];
59

60
    for (i = 0; i < 9; i++) {
61 62
        if (rates[i] == bitrate)
            return i;
63 64 65 66 67 68 69 70 71 72 73 74 75
        if (best < 0 || abs(rates[i] - bitrate) < min_diff) {
            best     = i;
            min_diff = abs(rates[i] - bitrate);
        }
    }
    /* no bitrate matching exactly, log a warning */
    snprintf(log_buf, sizeof(log_buf), "bitrate not supported: use one of ");
    for (i = 0; i < 9; i++)
        av_strlcatf(log_buf, sizeof(log_buf), "%.2fk, ", rates[i]    / 1000.f);
    av_strlcatf(log_buf, sizeof(log_buf), "using %.2fk", rates[best] / 1000.f);
    av_log(log_ctx, AV_LOG_WARNING, "%s\n", log_buf);

    return best;
76 77 78 79 80 81
}

/**
 * Validate the stream parameters and create the encoder instance.
 *
 * Rejects sample rates other than 16000 Hz unless strict_std_compliance is
 * at or below FF_COMPLIANCE_UNOFFICIAL, and rejects anything but mono.
 * On success the private context holds the selected mode, the bitrate it
 * was derived from and the encoder handle, and avctx->frame_size and
 * avctx->delay are set.
 *
 * @param avctx  codec context; priv_data points to an AMRWBContext
 * @return 0 on success, AVERROR(ENOSYS) for unsupported parameters,
 *         AVERROR(ENOMEM) if the coded frame or the encoder instance
 *         cannot be created
 */
static av_cold int amr_wb_encode_init(AVCodecContext *avctx)
{
    AMRWBContext *s = avctx->priv_data;

    if (avctx->sample_rate != 16000 && avctx->strict_std_compliance > FF_COMPLIANCE_UNOFFICIAL) {
        av_log(avctx, AV_LOG_ERROR, "Only 16000Hz sample rate supported\n");
        return AVERROR(ENOSYS);
    }

    if (avctx->channels != 1) {
        av_log(avctx, AV_LOG_ERROR, "Only mono supported\n");
        return AVERROR(ENOSYS);
    }

    /* remember the bitrate so the frame encoder can detect later changes */
    s->mode            = get_wb_bitrate_mode(avctx->bit_rate, avctx);
    s->last_bitrate    = avctx->bit_rate;

    avctx->frame_size  = 320;
    avctx->delay       =  80;
#if FF_API_OLD_ENCODE_AUDIO
    avctx->coded_frame = avcodec_alloc_frame();
    if (!avctx->coded_frame)
        return AVERROR(ENOMEM);
#endif

    s->state     = E_IF_init();
    if (!s->state) {
        /* Without this check a NULL handle would be handed to E_IF_encode()
         * and E_IF_exit() later on. E_IF_init() only returns a pointer, so
         * no more specific cause than "could not be created" is available. */
        av_log(avctx, AV_LOG_ERROR, "Unable to create the AMR-WB encoder instance\n");
#if FF_API_OLD_ENCODE_AUDIO
        /* do not leave the frame allocated above behind on failure */
        av_freep(&avctx->coded_frame);
#endif
        return AVERROR(ENOMEM);
    }

    return 0;
}

/**
 * Release what the encoder holds: the encoder instance stored in the
 * private context and the frame referenced by avctx->coded_frame.
 *
 * @param avctx  codec context; priv_data points to an AMRWBContext
 * @return always 0
 */
static int amr_wb_encode_close(AVCodecContext *avctx)
{
    AMRWBContext *ctx = avctx->priv_data;
    void *encoder     = ctx->state;

    E_IF_exit(encoder);

    /* av_freep() takes the address of the pointer it frees */
    av_freep(&avctx->coded_frame);

    return 0;
}

117 118
/**
 * Encode one frame of 16-bit samples into a packet.
 *
 * @param avctx           codec context; priv_data points to an AMRWBContext
 * @param avpkt           output packet, requested with MAX_PACKET_SIZE bytes
 * @param frame           input frame; samples are read from data[0]
 * @param got_packet_ptr  set to 1 once a packet has been produced
 * @return 0 on success, the ff_alloc_packet2() result if it is non-zero,
 *         AVERROR(EINVAL) if the encoder returns a size outside
 *         1..MAX_PACKET_SIZE
 */
static int amr_wb_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
                               const AVFrame *frame, int *got_packet_ptr)
{
    AMRWBContext *ctx  = avctx->priv_data;
    const int16_t *pcm = (const int16_t *)frame->data[0];
    int nb_bytes;
    int err;

    err = ff_alloc_packet2(avctx, avpkt, MAX_PACKET_SIZE);
    if (err != 0)
        return err;

    /* the bitrate changed since the mode was last chosen: choose it again */
    if (ctx->last_bitrate != avctx->bit_rate) {
        ctx->mode         = get_wb_bitrate_mode(avctx->bit_rate, avctx);
        ctx->last_bitrate = avctx->bit_rate;
    }

    nb_bytes = E_IF_encode(ctx->state, ctx->mode, pcm, avpkt->data,
                           ctx->allow_dtx);
    if (!(nb_bytes > 0 && nb_bytes <= MAX_PACKET_SIZE)) {
        av_log(avctx, AV_LOG_ERROR, "Error encoding frame\n");
        return AVERROR(EINVAL);
    }

    /* shift the timestamp back by the delay set on the context */
    if (frame->pts != AV_NOPTS_VALUE)
        avpkt->pts = frame->pts - ff_samples_to_time_base(avctx, avctx->delay);

    avpkt->size     = nb_bytes;
    *got_packet_ptr = 1;

    return 0;
}

AVCodec ff_libvo_amrwbenc_encoder = {
146 147
    .name           = "libvo_amrwbenc",
    .type           = AVMEDIA_TYPE_AUDIO,
148
    .id             = AV_CODEC_ID_AMR_WB,
149 150
    .priv_data_size = sizeof(AMRWBContext),
    .init           = amr_wb_encode_init,
151
    .encode2        = amr_wb_encode_frame,
152
    .close          = amr_wb_encode_close,
153 154
    .sample_fmts    = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_S16,
                                                     AV_SAMPLE_FMT_NONE },
155 156
    .long_name      = NULL_IF_CONFIG_SMALL("Android VisualOn AMR-WB "
                                           "(Adaptive Multi-Rate Wide-Band)"),
157
    .priv_class     = &class,
158
};