Commit 88c0536a authored by Kostya Shishkov's avatar Kostya Shishkov

Add several vector functions used by Monkey's Audio decoder to dsputil

Originally committed as revision 14081 to svn://svn.ffmpeg.org/ffmpeg/trunk
parent fcc402b1
...@@ -161,29 +161,6 @@ typedef struct APEContext { ...@@ -161,29 +161,6 @@ typedef struct APEContext {
} APEContext; } APEContext;
// TODO: dsputilize // TODO: dsputilize
static inline void vector_add(int16_t * v1, int16_t * v2, int order)
{
while (order--)
*v1++ += *v2++;
}
// TODO: dsputilize
static inline void vector_sub(int16_t * v1, int16_t * v2, int order)
{
while (order--)
*v1++ -= *v2++;
}
// TODO: dsputilize
static inline int32_t scalarproduct(int16_t * v1, int16_t * v2, int order)
{
int res = 0;
while (order--)
res += *v1++ * *v2++;
return res;
}
static av_cold int ape_decode_init(AVCodecContext * avctx) static av_cold int ape_decode_init(AVCodecContext * avctx)
{ {
...@@ -672,19 +649,19 @@ static void init_filter(APEContext * ctx, APEFilter *f, int16_t * buf, int order ...@@ -672,19 +649,19 @@ static void init_filter(APEContext * ctx, APEFilter *f, int16_t * buf, int order
do_init_filter(&f[1], buf + order * 3 + HISTORY_SIZE, order); do_init_filter(&f[1], buf + order * 3 + HISTORY_SIZE, order);
} }
static inline void do_apply_filter(int version, APEFilter *f, int32_t *data, int count, int order, int fracbits) static inline void do_apply_filter(APEContext * ctx, int version, APEFilter *f, int32_t *data, int count, int order, int fracbits)
{ {
int res; int res;
int absres; int absres;
while (count--) { while (count--) {
/* round fixedpoint scalar product */ /* round fixedpoint scalar product */
res = (scalarproduct(f->delay - order, f->coeffs, order) + (1 << (fracbits - 1))) >> fracbits; res = (ctx->dsp.scalarproduct_int16(f->delay - order, f->coeffs, order, 0) + (1 << (fracbits - 1))) >> fracbits;
if (*data < 0) if (*data < 0)
vector_add(f->coeffs, f->adaptcoeffs - order, order); ctx->dsp.add_int16(f->coeffs, f->adaptcoeffs - order, order);
else if (*data > 0) else if (*data > 0)
vector_sub(f->coeffs, f->adaptcoeffs - order, order); ctx->dsp.sub_int16(f->coeffs, f->adaptcoeffs - order, order);
res += *data; res += *data;
...@@ -736,9 +713,9 @@ static void apply_filter(APEContext * ctx, APEFilter *f, ...@@ -736,9 +713,9 @@ static void apply_filter(APEContext * ctx, APEFilter *f,
int32_t * data0, int32_t * data1, int32_t * data0, int32_t * data1,
int count, int order, int fracbits) int count, int order, int fracbits)
{ {
do_apply_filter(ctx->fileversion, &f[0], data0, count, order, fracbits); do_apply_filter(ctx, ctx->fileversion, &f[0], data0, count, order, fracbits);
if (data1) if (data1)
do_apply_filter(ctx->fileversion, &f[1], data1, count, order, fracbits); do_apply_filter(ctx, ctx->fileversion, &f[1], data1, count, order, fracbits);
} }
static void ape_apply_filters(APEContext * ctx, int32_t * decoded0, static void ape_apply_filters(APEContext * ctx, int32_t * decoded0,
......
...@@ -3944,6 +3944,28 @@ void ff_float_to_int16_c(int16_t *dst, const float *src, int len){ ...@@ -3944,6 +3944,28 @@ void ff_float_to_int16_c(int16_t *dst, const float *src, int len){
} }
} }
static void add_int16_c(int16_t * v1, int16_t * v2, int order)
{
while (order--)
*v1++ += *v2++;
}
static void sub_int16_c(int16_t * v1, int16_t * v2, int order)
{
while (order--)
*v1++ -= *v2++;
}
static int32_t scalarproduct_int16_c(int16_t * v1, int16_t * v2, int order, int shift)
{
int res = 0;
while (order--)
res += (*v1++ * *v2++) >> shift;
return res;
}
#define W0 2048 #define W0 2048
#define W1 2841 /* 2048*sqrt (2)*cos (1*pi/16) */ #define W1 2841 /* 2048*sqrt (2)*cos (1*pi/16) */
#define W2 2676 /* 2048*sqrt (2)*cos (2*pi/16) */ #define W2 2676 /* 2048*sqrt (2)*cos (2*pi/16) */
...@@ -4429,6 +4451,9 @@ void dsputil_init(DSPContext* c, AVCodecContext *avctx) ...@@ -4429,6 +4451,9 @@ void dsputil_init(DSPContext* c, AVCodecContext *avctx)
c->vector_fmul_reverse = vector_fmul_reverse_c; c->vector_fmul_reverse = vector_fmul_reverse_c;
c->vector_fmul_add_add = ff_vector_fmul_add_add_c; c->vector_fmul_add_add = ff_vector_fmul_add_add_c;
c->float_to_int16 = ff_float_to_int16_c; c->float_to_int16 = ff_float_to_int16_c;
c->add_int16 = add_int16_c;
c->sub_int16 = sub_int16_c;
c->scalarproduct_int16 = scalarproduct_int16_c;
c->shrink[0]= ff_img_copy_plane; c->shrink[0]= ff_img_copy_plane;
c->shrink[1]= ff_shrink22; c->shrink[1]= ff_shrink22;
......
...@@ -451,6 +451,23 @@ typedef struct DSPContext { ...@@ -451,6 +451,23 @@ typedef struct DSPContext {
void (*x8_setup_spatial_compensation)(uint8_t *src, uint8_t *dst, int linesize, void (*x8_setup_spatial_compensation)(uint8_t *src, uint8_t *dst, int linesize,
int * range, int * sum, int edges); int * range, int * sum, int edges);
/* ape functions */
/**
* Add contents of the second vector to the first one.
* @param len length of vectors, should be multiple of 8
*/
void (*add_int16)(int16_t *v1/*align 16*/, int16_t *v2, int len);
/**
* Add contents of the second vector to the first one.
* @param len length of vectors, should be multiple of 8
*/
void (*sub_int16)(int16_t *v1/*align 16*/, int16_t *v2, int len);
/**
* Calculate scalar product of two vectors.
* @param len length of vectors, should be multiple of 8
* @param shift number of bits to discard from product
*/
int32_t (*scalarproduct_int16)(int16_t *v1, int16_t *v2/*align 16*/, int len, int shift);
} DSPContext; } DSPContext;
void dsputil_static_init(void); void dsputil_static_init(void);
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment