/*
 * Copyright (C) 2010 David Conrad
 * Copyright (C) 2010 Ronald S. Bultje
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * VP8 compatible video decoder
 */

#include "dsputil.h"
#include "vp8dsp.h"

// TODO: Maybe add dequant
/**
 * Inverse Walsh-Hadamard transform of the 16 luma DC coefficients.
 *
 * The first pass transforms dc[] in place, one column at a time. The second
 * pass works on rows, adds a rounding bias of 3 and shifts right by 3; each
 * result is stored in coefficient 0 of the matching sub-block.
 *
 * @param block destination; block[i][j][0] receives the value for row i,
 *              column j of the 4x4 DC grid
 * @param dc    the 16 input coefficients, addressed as dc[row*4+col];
 *              every entry is zeroed before returning
 */
static void vp8_luma_dc_wht_c(DCTELEM block[4][4][16], DCTELEM dc[16])
{
    int i, t0, t1, t2, t3;

    // column pass, in place
    for (i = 0; i < 4; i++) {
        t0 = dc[0*4+i] + dc[3*4+i];
        t1 = dc[1*4+i] + dc[2*4+i];
        t2 = dc[1*4+i] - dc[2*4+i];
        t3 = dc[0*4+i] - dc[3*4+i];

        dc[0*4+i] = t0 + t1;
        dc[1*4+i] = t3 + t2;
        dc[2*4+i] = t0 - t1;
        dc[3*4+i] = t3 - t2;
    }

    // row pass; the inputs are consumed, so clear them as we go
    for (i = 0; i < 4; i++) {
        t0 = dc[i*4+0] + dc[i*4+3] + 3; // rounding
        t1 = dc[i*4+1] + dc[i*4+2];
        t2 = dc[i*4+1] - dc[i*4+2];
        t3 = dc[i*4+0] - dc[i*4+3] + 3; // rounding
        dc[i*4+0] = 0;
        dc[i*4+1] = 0;
        dc[i*4+2] = 0;
        dc[i*4+3] = 0;

        block[i][0][0] = (t0 + t1) >> 3;
        block[i][1][0] = (t3 + t2) >> 3;
        block[i][2][0] = (t0 - t1) >> 3;
        block[i][3][0] = (t3 - t2) >> 3;
    }
}

64 65 66 67 68 69 70 71 72 73 74 75
/**
 * DC-only variant of the luma DC transform: only dc[0] is read.
 *
 * Every sub-block receives the same value, (dc[0] + 3) >> 3, in its
 * coefficient 0, and dc[0] is reset to zero.
 *
 * @param block destination; block[i][j][0] is written for all i, j in 0..3
 * @param dc    input coefficients; only dc[0] is read and cleared
 */
static void vp8_luma_dc_wht_dc_c(DCTELEM block[4][4][16], DCTELEM dc[16])
{
    const int val = (dc[0] + 3) >> 3;
    int row, col;

    dc[0] = 0;

    for (row = 0; row < 4; row++)
        for (col = 0; col < 4; col++)
            block[row][col][0] = val;
}
David Conrad's avatar
David Conrad committed
76 77 78 79

/*
 * Fixed-point multipliers (16 fractional bits) used by the 4x4 inverse DCT:
 *   MUL_35468(a) = a * 35468/65536        (about a * 0.5412)
 *   MUL_20091(a) = a * (1 + 20091/65536)  (about a * 1.3066)
 * MUL_20091 evaluates its argument twice, so pass side-effect-free
 * expressions only.
 */
#define MUL_35468(a) (((a) * 35468) >> 16)
#define MUL_20091(a) ((a) + (((a) * 20091) >> 16))

80
/**
 * 4x4 inverse DCT of block[], added to the 4x4 pixel area at dst.
 *
 * The first pass reads block[] column by column and stores each result as a
 * row of tmp[] (i.e. transposed); the second pass reads tmp[] column by
 * column, rounds with (+4) >> 3 and adds the result to one row of dst,
 * clipping to 0..255 via av_clip_uint8().
 *
 * @param dst    top-left pixel of the 4x4 destination area, updated in place
 * @param block  16 coefficients, addressed as block[row*4+col]; zeroed on return
 * @param stride distance between consecutive destination rows
 */
static void vp8_idct_add_c(uint8_t *dst, DCTELEM block[16], ptrdiff_t stride)
{
    int i, t0, t1, t2, t3;
    DCTELEM tmp[16];

    for (i = 0; i < 4; i++) {
        t0 = block[0*4+i] + block[2*4+i];
        t1 = block[0*4+i] - block[2*4+i];
        t2 = MUL_35468(block[1*4+i]) - MUL_20091(block[3*4+i]);
        t3 = MUL_20091(block[1*4+i]) + MUL_35468(block[3*4+i]);
        // coefficients are consumed here; leave the block cleared
        block[0*4+i] = 0;
        block[1*4+i] = 0;
        block[2*4+i] = 0;
        block[3*4+i] = 0;

        tmp[i*4+0] = t0 + t3;
        tmp[i*4+1] = t1 + t2;
        tmp[i*4+2] = t1 - t2;
        tmp[i*4+3] = t0 - t3;
    }

    for (i = 0; i < 4; i++) {
        t0 = tmp[0*4+i] + tmp[2*4+i];
        t1 = tmp[0*4+i] - tmp[2*4+i];
        t2 = MUL_35468(tmp[1*4+i]) - MUL_20091(tmp[3*4+i]);
        t3 = MUL_20091(tmp[1*4+i]) + MUL_35468(tmp[3*4+i]);

        dst[0] = av_clip_uint8(dst[0] + ((t0 + t3 + 4) >> 3));
        dst[1] = av_clip_uint8(dst[1] + ((t1 + t2 + 4) >> 3));
        dst[2] = av_clip_uint8(dst[2] + ((t1 - t2 + 4) >> 3));
        dst[3] = av_clip_uint8(dst[3] + ((t0 - t3 + 4) >> 3));
        dst += stride;
    }
}

115
/**
 * DC-only inverse transform: add (block[0] + 4) >> 3 to every pixel of the
 * 4x4 area at dst, clipping each result with av_clip_uint8().
 *
 * @param dst    top-left pixel of the 4x4 destination area, updated in place
 * @param block  coefficients; only block[0] is read, and it is zeroed
 * @param stride distance between consecutive destination rows
 */
static void vp8_idct_dc_add_c(uint8_t *dst, DCTELEM block[16], ptrdiff_t stride)
{
    int i, dc = (block[0] + 4) >> 3;
    block[0] = 0;

    for (i = 0; i < 4; i++) {
        dst[0] = av_clip_uint8(dst[0] + dc);
        dst[1] = av_clip_uint8(dst[1] + dc);
        dst[2] = av_clip_uint8(dst[2] + dc);
        dst[3] = av_clip_uint8(dst[3] + dc);
        dst += stride;
    }
}

129
/**
 * DC-only inverse transform for four 4x4 blocks laid out as a 2x2 grid
 * (an 8x8 pixel area): block[0] top-left, block[1] top-right,
 * block[2] bottom-left, block[3] bottom-right.
 *
 * @param dst    top-left pixel of the 8x8 destination area
 * @param block  four coefficient blocks; each block's DC is consumed and zeroed
 * @param stride distance between consecutive destination rows
 */
static void vp8_idct_dc_add4uv_c(uint8_t *dst, DCTELEM block[4][16], ptrdiff_t stride)
{
    vp8_idct_dc_add_c(dst+stride*0+0, block[0], stride);
    vp8_idct_dc_add_c(dst+stride*0+4, block[1], stride);
    vp8_idct_dc_add_c(dst+stride*4+0, block[2], stride);
    vp8_idct_dc_add_c(dst+stride*4+4, block[3], stride);
}

137
/**
 * DC-only inverse transform for four horizontally adjacent 4x4 blocks
 * (a 16x4 pixel area): block[n] covers columns 4*n .. 4*n+3.
 *
 * @param dst    top-left pixel of the 16x4 destination area
 * @param block  four coefficient blocks; each block's DC is consumed and zeroed
 * @param stride distance between consecutive destination rows
 */
static void vp8_idct_dc_add4y_c(uint8_t *dst, DCTELEM block[4][16], ptrdiff_t stride)
{
    vp8_idct_dc_add_c(dst+ 0, block[0], stride);
    vp8_idct_dc_add_c(dst+ 4, block[1], stride);
    vp8_idct_dc_add_c(dst+ 8, block[2], stride);
    vp8_idct_dc_add_c(dst+12, block[3], stride);
}
David Conrad's avatar
David Conrad committed
144 145 146 147 148 149 150 151 152 153 154 155

// Declares the locals p3..p0 and q0..q3, loaded from p[-4*stride] up to
// p[3*stride], i.e. the eight samples straddling the edge at p.
// It expects `p` and `stride` to be in scope where it is expanded, which lets
// the filter helpers take just a pointer and a stride ("because I like only
// having two parameters to pass functions...").
// Each local is tagged av_unused because not every helper reads all eight
// (presumably this silences unused-variable warnings).
#define LOAD_PIXELS\
    int av_unused p3 = p[-4*stride];\
    int av_unused p2 = p[-3*stride];\
    int av_unused p1 = p[-2*stride];\
    int av_unused p0 = p[-1*stride];\
    int av_unused q0 = p[ 0*stride];\
    int av_unused q1 = p[ 1*stride];\
    int av_unused q2 = p[ 2*stride];\
    int av_unused q3 = p[ 3*stride];

156 157
/*
 * Clamp n to the signed 8-bit range by biasing it by 0x80, looking it up in
 * the clipping table and removing the bias again.
 * Requires a local `cm` in scope; the callers in this file set it to
 * ff_cropTbl + MAX_NEG_CROP (assumed to map an index i to i clamped to
 * 0..255 -- confirm against the table's definition).
 * The argument is parenthesized so that low-precedence expressions
 * (e.g. a conditional) are biased as a whole.
 */
#define clip_int8(n) (cm[(n) + 0x80] - 0x80)

158
static av_always_inline void filter_common(uint8_t *p, ptrdiff_t stride, int is4tap)
David Conrad's avatar
David Conrad committed
159 160 161
{
    LOAD_PIXELS
    int a, f1, f2;
162
    uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;
David Conrad's avatar
David Conrad committed
163 164 165 166

    a = 3*(q0 - p0);

    if (is4tap)
167
        a += clip_int8(p1 - q1);
David Conrad's avatar
David Conrad committed
168

169
    a = clip_int8(a);
David Conrad's avatar
David Conrad committed
170 171 172 173 174 175 176 177

    // We deviate from the spec here with c(a+3) >> 3
    // since that's what libvpx does.
    f1 = FFMIN(a+4, 127) >> 3;
    f2 = FFMIN(a+3, 127) >> 3;

    // Despite what the spec says, we do need to clamp here to
    // be bitexact with libvpx.
178 179
    p[-1*stride] = cm[p0 + f2];
    p[ 0*stride] = cm[q0 - f1];
David Conrad's avatar
David Conrad committed
180 181 182 183

    // only used for _inner on blocks without high edge variance
    if (!is4tap) {
        a = (f1+1)>>1;
184 185
        p[-2*stride] = cm[p1 + a];
        p[ 1*stride] = cm[q1 - a];
David Conrad's avatar
David Conrad committed
186 187 188
    }
}

189
static av_always_inline int simple_limit(uint8_t *p, ptrdiff_t stride, int flim)
David Conrad's avatar
David Conrad committed
190 191 192 193 194 195 196 197 198
{
    LOAD_PIXELS
    return 2*FFABS(p0-q0) + (FFABS(p1-q1) >> 1) <= flim;
}

/**
 * E - limit at the macroblock edge
 * I - limit for interior difference
 */
199
static av_always_inline int normal_limit(uint8_t *p, ptrdiff_t stride, int E, int I)
David Conrad's avatar
David Conrad committed
200 201
{
    LOAD_PIXELS
202
    return simple_limit(p, stride, E)
David Conrad's avatar
David Conrad committed
203 204 205 206 207
        && FFABS(p3-p2) <= I && FFABS(p2-p1) <= I && FFABS(p1-p0) <= I
        && FFABS(q3-q2) <= I && FFABS(q2-q1) <= I && FFABS(q1-q0) <= I;
}

// high edge variance
208
static av_always_inline int hev(uint8_t *p, ptrdiff_t stride, int thresh)
David Conrad's avatar
David Conrad committed
209 210 211 212 213
{
    LOAD_PIXELS
    return FFABS(p1-p0) > thresh || FFABS(q1-q0) > thresh;
}

214
static av_always_inline void filter_mbedge(uint8_t *p, ptrdiff_t stride)
David Conrad's avatar
David Conrad committed
215 216
{
    int a0, a1, a2, w;
217
    uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;
David Conrad's avatar
David Conrad committed
218 219 220

    LOAD_PIXELS

221 222
    w = clip_int8(p1-q1);
    w = clip_int8(w + 3*(q0-p0));
David Conrad's avatar
David Conrad committed
223 224 225 226 227

    a0 = (27*w + 63) >> 7;
    a1 = (18*w + 63) >> 7;
    a2 = ( 9*w + 63) >> 7;

228 229 230 231 232 233
    p[-3*stride] = cm[p2 + a2];
    p[-2*stride] = cm[p1 + a1];
    p[-1*stride] = cm[p0 + a0];
    p[ 0*stride] = cm[q0 - a0];
    p[ 1*stride] = cm[q1 - a1];
    p[ 2*stride] = cm[q2 - a2];
David Conrad's avatar
David Conrad committed
234 235
}

236
/*
 * Generates the pair vp8_<dir>_loop_filter<size>_c and
 * vp8_<dir>_loop_filter<size>_inner_c.
 *
 * stridea is the step between the `size` positions along the edge, strideb
 * the step across the edge; exactly one of them is the function's `stride`
 * parameter and the other is 1. maybe_inline is an optional inlining
 * qualifier placed after `static`.
 *
 * Both variants filter only where normal_limit() passes. The plain variant
 * uses filter_common(.., 1) on high-edge-variance positions and
 * filter_mbedge() elsewhere; the inner variant uses filter_common() with
 * is4tap = 1 or 0 respectively. The inner variant calls filter_common() with
 * literal constants in each branch, presumably so that the always-inline
 * helper is specialised per branch.
 */
#define LOOP_FILTER(dir, size, stridea, strideb, maybe_inline) \
static maybe_inline void vp8_ ## dir ## _loop_filter ## size ## _c(uint8_t *dst, ptrdiff_t stride,\
                                     int flim_E, int flim_I, int hev_thresh)\
{\
    int i;\
\
    for (i = 0; i < size; i++)\
        if (normal_limit(dst+i*stridea, strideb, flim_E, flim_I)) {\
            if (hev(dst+i*stridea, strideb, hev_thresh))\
                filter_common(dst+i*stridea, strideb, 1);\
            else\
                filter_mbedge(dst+i*stridea, strideb);\
        }\
}\
\
static maybe_inline void vp8_ ## dir ## _loop_filter ## size ## _inner_c(uint8_t *dst, ptrdiff_t stride,\
                                      int flim_E, int flim_I, int hev_thresh)\
{\
    int i;\
\
    for (i = 0; i < size; i++)\
        if (normal_limit(dst+i*stridea, strideb, flim_E, flim_I)) {\
            int hv = hev(dst+i*stridea, strideb, hev_thresh);\
            if (hv) \
                filter_common(dst+i*stridea, strideb, 1);\
            else \
                filter_common(dst+i*stridea, strideb, 0);\
        }\
}

LOOP_FILTER(v, 16, 1, stride,)
LOOP_FILTER(h, 16, stride, 1,)

/*
 * Generates the 8-position loop filters via LOOP_FILTER (marked
 * av_always_inline) and wraps them in vp8_<dir>_loop_filter8uv_c and
 * vp8_<dir>_loop_filter8uv_inner_c, which apply the same filter with the same
 * limits first to the dstU plane and then to the dstV plane.
 */
#define UV_LOOP_FILTER(dir, stridea, strideb) \
LOOP_FILTER(dir, 8, stridea, strideb, av_always_inline) \
static void vp8_ ## dir ## _loop_filter8uv_c(uint8_t *dstU, uint8_t *dstV, ptrdiff_t stride,\
                                      int fE, int fI, int hev_thresh)\
{\
  vp8_ ## dir ## _loop_filter8_c(dstU, stride, fE, fI, hev_thresh);\
  vp8_ ## dir ## _loop_filter8_c(dstV, stride, fE, fI, hev_thresh);\
}\
static void vp8_ ## dir ## _loop_filter8uv_inner_c(uint8_t *dstU, uint8_t *dstV, ptrdiff_t stride,\
                                      int fE, int fI, int hev_thresh)\
{\
  vp8_ ## dir ## _loop_filter8_inner_c(dstU, stride, fE, fI, hev_thresh);\
  vp8_ ## dir ## _loop_filter8_inner_c(dstV, stride, fE, fI, hev_thresh);\
}

UV_LOOP_FILTER(v, 1, stride)
UV_LOOP_FILTER(h, stride, 1)
David Conrad's avatar
David Conrad committed
286

287
/**
 * Simple loop filter over 16 consecutive positions of one row: for each
 * column dst+i, samples are taken `stride` apart (across the edge between
 * row -1 and row 0) and filtered with filter_common(.., 1) where
 * simple_limit() passes.
 *
 * @param dst    first sample of the row just after the edge
 * @param stride distance between consecutive rows
 * @param flim   filter limit passed to simple_limit()
 */
static void vp8_v_loop_filter_simple_c(uint8_t *dst, ptrdiff_t stride, int flim)
{
    int i;

    for (i = 0; i < 16; i++)
        if (simple_limit(dst+i, stride, flim))
            filter_common(dst+i, stride, 1);
}

296
/**
 * Simple loop filter over 16 consecutive rows of one column: for each row
 * dst+i*stride, adjacent samples of that row (step 1, across the edge
 * between column -1 and column 0) are filtered with filter_common(.., 1)
 * where simple_limit() passes.
 *
 * @param dst    first sample of the column just after the edge
 * @param stride distance between consecutive rows
 * @param flim   filter limit passed to simple_limit()
 */
static void vp8_h_loop_filter_simple_c(uint8_t *dst, ptrdiff_t stride, int flim)
{
    int i;

    for (i = 0; i < 16; i++)
        if (simple_limit(dst+i*stride, 1, flim))
            filter_common(dst+i*stride, 1, 1);
}

/*
 * Sub-pixel interpolation taps, one row per fractional position; the EPEL
 * functions index this table with mx-1 / my-1.
 * All entries are stored as magnitudes: FILTER_6TAP / FILTER_4TAP subtract
 * the terms for taps [1] and [4] and add the others. With those signs each
 * row sums to 128, matching the (+64) >> 7 normalisation in the filters.
 * Rows whose outer taps [0] and [5] are zero need only the 4-tap filter.
 */
static const uint8_t subpel_filters[7][6] = {
    { 0,   6, 123,  12,   1,   0 },
    { 2,  11, 108,  36,   8,   1 },
    { 0,   9,  93,  50,   6,   0 },
    { 3,  16,  77,  77,  16,   3 },
    { 0,   6,  50,  93,   9,   0 },
    { 1,   8,  36, 108,  11,   2 },
    { 0,   1,  12, 123,   6,   0 },
};

315
/*
 * Generates put_vp8_pixels<WIDTH>_c: a plain block copy of h rows of WIDTH
 * bytes from src to dst, each with its own row stride. The trailing x/y
 * parameters are unused; they keep the signature in line with the
 * interpolating functions stored in the same tables.
 */
#define PUT_PIXELS(WIDTH) \
static void put_vp8_pixels ## WIDTH ##_c(uint8_t *dst, ptrdiff_t dststride, uint8_t *src, ptrdiff_t srcstride, int h, int x, int y) { \
    int i; \
    for (i = 0; i < h; i++, dst+= dststride, src+= srcstride) { \
        memcpy(dst, src, WIDTH); \
    } \
}

PUT_PIXELS(16)
PUT_PIXELS(8)
PUT_PIXELS(4)
David Conrad's avatar
David Conrad committed
326 327

/*
 * Sub-pixel filter kernels. Both expect `x` (current sample index) and `cm`
 * (clipping table pointer) to be in scope at the point of use.
 * F holds tap magnitudes; the terms for F[1] and F[4] are subtracted.
 * The sum is rounded with +64, shifted right by 7 and looked up in cm.
 * FILTER_6TAP reads src[x-2*stride] .. src[x+3*stride];
 * FILTER_4TAP reads src[x-1*stride] .. src[x+2*stride] and ignores
 * F[0] and F[5].
 */
#define FILTER_6TAP(src, F, stride) \
    cm[((F)[2]*(src)[x+0*(stride)] - (F)[1]*(src)[x-1*(stride)] + (F)[0]*(src)[x-2*(stride)] + \
        (F)[3]*(src)[x+1*(stride)] - (F)[4]*(src)[x+2*(stride)] + (F)[5]*(src)[x+3*(stride)] + 64) >> 7]

#define FILTER_4TAP(src, F, stride) \
    cm[((F)[2]*(src)[x+0*(stride)] - (F)[1]*(src)[x-1*(stride)] + \
        (F)[3]*(src)[x+1*(stride)] - (F)[4]*(src)[x+2*(stride)] + 64) >> 7]
David Conrad's avatar
David Conrad committed
334

335
/*
 * Generates put_vp8_epel<SIZE>_h<TAPS>_c: horizontal-only sub-pixel
 * interpolation of an h-row, SIZE-wide block using FILTER_<TAPS>TAP with a
 * sample step of 1 and the taps in subpel_filters[mx-1].
 * mx must be in 1..7 (it indexes the table as mx-1); my is unused.
 */
#define VP8_EPEL_H(SIZE, TAPS) \
static void put_vp8_epel ## SIZE ## _h ## TAPS ## _c(uint8_t *dst, ptrdiff_t dststride, uint8_t *src, ptrdiff_t srcstride, int h, int mx, int my) \
{ \
    const uint8_t *filter = subpel_filters[mx-1]; \
    uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; \
    int x, y; \
\
    for (y = 0; y < h; y++) { \
        for (x = 0; x < SIZE; x++) \
            dst[x] = FILTER_ ## TAPS ## TAP(src, filter, 1); \
        dst += dststride; \
        src += srcstride; \
    } \
}
349
/*
 * Generates put_vp8_epel<SIZE>_v<TAPS>_c: vertical-only sub-pixel
 * interpolation of an h-row, SIZE-wide block using FILTER_<TAPS>TAP with a
 * sample step of srcstride and the taps in subpel_filters[my-1].
 * my must be in 1..7 (it indexes the table as my-1); mx is unused.
 */
#define VP8_EPEL_V(SIZE, TAPS) \
static void put_vp8_epel ## SIZE ## _v ## TAPS ## _c(uint8_t *dst, ptrdiff_t dststride, uint8_t *src, ptrdiff_t srcstride, int h, int mx, int my) \
{ \
    const uint8_t *filter = subpel_filters[my-1]; \
    uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; \
    int x, y; \
\
    for (y = 0; y < h; y++) { \
        for (x = 0; x < SIZE; x++) \
            dst[x] = FILTER_ ## TAPS ## TAP(src, filter, srcstride); \
        dst += dststride; \
        src += srcstride; \
    } \
}
363
/*
 * Generates put_vp8_epel<SIZE>_h<HTAPS>v<VTAPS>_c: separable 2-D sub-pixel
 * interpolation.
 *
 * Pass 1 filters horizontally (taps subpel_filters[mx-1]) into tmp_array,
 * producing h + VTAPS - 1 rows of SIZE samples. It starts 2 source rows above
 * the block for a 6-tap vertical filter and 1 row above for a 4-tap one.
 * Pass 2 filters tmp_array vertically (taps subpel_filters[my-1], row step
 * SIZE) into dst.
 *
 * tmp_array holds 2*SIZE + VTAPS - 1 rows, so h must not exceed 2*SIZE.
 * mx and my must both be in 1..7.
 */
#define VP8_EPEL_HV(SIZE, HTAPS, VTAPS) \
static void put_vp8_epel ## SIZE ## _h ## HTAPS ## v ## VTAPS ## _c(uint8_t *dst, ptrdiff_t dststride, uint8_t *src, ptrdiff_t srcstride, int h, int mx, int my) \
{ \
    const uint8_t *filter = subpel_filters[mx-1]; \
    uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; \
    int x, y; \
    uint8_t tmp_array[(2*SIZE+VTAPS-1)*SIZE]; \
    uint8_t *tmp = tmp_array; \
    src -= (2-(VTAPS==4))*srcstride; \
\
    for (y = 0; y < h+VTAPS-1; y++) { \
        for (x = 0; x < SIZE; x++) \
            tmp[x] = FILTER_ ## HTAPS ## TAP(src, filter, 1); \
        tmp += SIZE; \
        src += srcstride; \
    } \
\
    tmp = tmp_array + (2-(VTAPS==4))*SIZE; \
    filter = subpel_filters[my-1]; \
\
    for (y = 0; y < h; y++) { \
        for (x = 0; x < SIZE; x++) \
            dst[x] = FILTER_ ## VTAPS ## TAP(tmp, filter, SIZE); \
        dst += dststride; \
        tmp += SIZE; \
    } \
}

391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414
/*
 * Instantiate the sub-pixel functions for block widths 16, 8 and 4:
 * horizontal-only and vertical-only with 4 or 6 taps, then every
 * horizontal/vertical tap combination of the 2-D variant.
 */
VP8_EPEL_H(16, 4)
VP8_EPEL_H(8,  4)
VP8_EPEL_H(4,  4)
VP8_EPEL_H(16, 6)
VP8_EPEL_H(8,  6)
VP8_EPEL_H(4,  6)
VP8_EPEL_V(16, 4)
VP8_EPEL_V(8,  4)
VP8_EPEL_V(4,  4)
VP8_EPEL_V(16, 6)
VP8_EPEL_V(8,  6)
VP8_EPEL_V(4,  6)
VP8_EPEL_HV(16, 4, 4)
VP8_EPEL_HV(8,  4, 4)
VP8_EPEL_HV(4,  4, 4)
VP8_EPEL_HV(16, 4, 6)
VP8_EPEL_HV(8,  4, 6)
VP8_EPEL_HV(4,  4, 6)
VP8_EPEL_HV(16, 6, 4)
VP8_EPEL_HV(8,  6, 4)
VP8_EPEL_HV(4,  6, 4)
VP8_EPEL_HV(16, 6, 6)
VP8_EPEL_HV(8,  6, 6)
VP8_EPEL_HV(4,  6, 6)
David Conrad's avatar
David Conrad committed
415

David Conrad's avatar
David Conrad committed
416
/*
 * Generates the bilinear interpolation functions for a SIZE-wide block:
 *   put_vp8_bilinear<SIZE>_h_c   horizontal, weights (8-mx, mx)
 *   put_vp8_bilinear<SIZE>_v_c   vertical,   weights (8-my, my)
 *   put_vp8_bilinear<SIZE>_hv_c  horizontal into a temporary of h+1 rows,
 *                                then vertical on that temporary
 * Each stage rounds with (+4) >> 3.
 *
 * `stride` is the destination row stride and `s2` the source row stride.
 * Source rows are always stepped by s2 (previously they were stepped by the
 * destination stride, which read the wrong rows whenever the two differed).
 * The hv temporary holds 2*SIZE + 1 rows, so h must not exceed 2*SIZE.
 */
#define VP8_BILINEAR(SIZE) \
static void put_vp8_bilinear ## SIZE ## _h_c(uint8_t *dst, ptrdiff_t stride, uint8_t *src, ptrdiff_t s2, int h, int mx, int my) \
{ \
    int a = 8-mx, b = mx; \
    int x, y; \
\
    for (y = 0; y < h; y++) { \
        for (x = 0; x < SIZE; x++) \
            dst[x] = (a*src[x] + b*src[x+1] + 4) >> 3; \
        dst += stride; \
        src += s2; \
    } \
} \
static void put_vp8_bilinear ## SIZE ## _v_c(uint8_t *dst, ptrdiff_t stride, uint8_t *src, ptrdiff_t s2, int h, int mx, int my) \
{ \
    int c = 8-my, d = my; \
    int x, y; \
\
    for (y = 0; y < h; y++) { \
        for (x = 0; x < SIZE; x++) \
            dst[x] = (c*src[x] + d*src[x+s2] + 4) >> 3; \
        dst += stride; \
        src += s2; \
    } \
} \
\
static void put_vp8_bilinear ## SIZE ## _hv_c(uint8_t *dst, ptrdiff_t stride, uint8_t *src, ptrdiff_t s2, int h, int mx, int my) \
{ \
    int a = 8-mx, b = mx; \
    int c = 8-my, d = my; \
    int x, y; \
    uint8_t tmp_array[(2*SIZE+1)*SIZE]; \
    uint8_t *tmp = tmp_array; \
\
    for (y = 0; y < h+1; y++) { \
        for (x = 0; x < SIZE; x++) \
            tmp[x] = (a*src[x] + b*src[x+1] + 4) >> 3; \
        tmp += SIZE; \
        src += s2; \
    } \
\
    tmp = tmp_array; \
\
    for (y = 0; y < h; y++) { \
        for (x = 0; x < SIZE; x++) \
            dst[x] = (c*tmp[x] + d*tmp[x+SIZE] + 4) >> 3; \
        dst += stride; \
        tmp += SIZE; \
    } \
}

VP8_BILINEAR(16)
VP8_BILINEAR(8)
VP8_BILINEAR(4)

David Conrad's avatar
David Conrad committed
471
/*
 * Fills dsp->put_vp8_epel_pixels_tab[IDX] with the SIZE-wide functions.
 * The table is indexed [IDX][v][h], where v and h select the vertical and
 * horizontal filter: 0 = none (plain copy when both are 0), 1 = 4-tap,
 * 2 = 6-tap. Expects a pointer named `dsp` in scope.
 * Wrapped in do { } while (0) so that an invocation followed by ';' is a
 * single statement in any context.
 */
#define VP8_MC_FUNC(IDX, SIZE) \
    do { \
        dsp->put_vp8_epel_pixels_tab[IDX][0][0] = put_vp8_pixels ## SIZE ## _c; \
        dsp->put_vp8_epel_pixels_tab[IDX][0][1] = put_vp8_epel ## SIZE ## _h4_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][0][2] = put_vp8_epel ## SIZE ## _h6_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][1][0] = put_vp8_epel ## SIZE ## _v4_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][1][1] = put_vp8_epel ## SIZE ## _h4v4_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][1][2] = put_vp8_epel ## SIZE ## _h6v4_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][2][0] = put_vp8_epel ## SIZE ## _v6_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][2][1] = put_vp8_epel ## SIZE ## _h4v6_c; \
        dsp->put_vp8_epel_pixels_tab[IDX][2][2] = put_vp8_epel ## SIZE ## _h6v6_c; \
    } while (0)

David Conrad's avatar
David Conrad committed
482 483 484 485 486 487 488 489 490 491 492
/*
 * Fills dsp->put_vp8_bilinear_pixels_tab[IDX] with the SIZE-wide functions.
 * The table is indexed [IDX][v][h] like the epel table, but the bilinear
 * filter has a single variant, so indices 1 and 2 select the same function
 * in each direction. Expects a pointer named `dsp` in scope.
 * Wrapped in do { } while (0) so that an invocation followed by ';' is a
 * single statement in any context.
 */
#define VP8_BILINEAR_MC_FUNC(IDX, SIZE) \
    do { \
        dsp->put_vp8_bilinear_pixels_tab[IDX][0][0] = put_vp8_pixels ## SIZE ## _c; \
        dsp->put_vp8_bilinear_pixels_tab[IDX][0][1] = put_vp8_bilinear ## SIZE ## _h_c; \
        dsp->put_vp8_bilinear_pixels_tab[IDX][0][2] = put_vp8_bilinear ## SIZE ## _h_c; \
        dsp->put_vp8_bilinear_pixels_tab[IDX][1][0] = put_vp8_bilinear ## SIZE ## _v_c; \
        dsp->put_vp8_bilinear_pixels_tab[IDX][1][1] = put_vp8_bilinear ## SIZE ## _hv_c; \
        dsp->put_vp8_bilinear_pixels_tab[IDX][1][2] = put_vp8_bilinear ## SIZE ## _hv_c; \
        dsp->put_vp8_bilinear_pixels_tab[IDX][2][0] = put_vp8_bilinear ## SIZE ## _v_c; \
        dsp->put_vp8_bilinear_pixels_tab[IDX][2][1] = put_vp8_bilinear ## SIZE ## _hv_c; \
        dsp->put_vp8_bilinear_pixels_tab[IDX][2][2] = put_vp8_bilinear ## SIZE ## _hv_c; \
    } while (0)

David Conrad's avatar
David Conrad committed
493 494
/**
 * Fill a VP8DSPContext with the C implementations from this file, then call
 * the architecture-specific init functions, which are handed the same
 * context (presumably to replace entries with optimised versions).
 *
 * @param dsp context to initialise
 */
av_cold void ff_vp8dsp_init(VP8DSPContext *dsp)
{
    dsp->vp8_luma_dc_wht    = vp8_luma_dc_wht_c;
    dsp->vp8_luma_dc_wht_dc = vp8_luma_dc_wht_dc_c;
    dsp->vp8_idct_add       = vp8_idct_add_c;
    dsp->vp8_idct_dc_add    = vp8_idct_dc_add_c;
    dsp->vp8_idct_dc_add4y  = vp8_idct_dc_add4y_c;
    dsp->vp8_idct_dc_add4uv = vp8_idct_dc_add4uv_c;

    dsp->vp8_v_loop_filter16y = vp8_v_loop_filter16_c;
    dsp->vp8_h_loop_filter16y = vp8_h_loop_filter16_c;
    dsp->vp8_v_loop_filter8uv = vp8_v_loop_filter8uv_c;
    dsp->vp8_h_loop_filter8uv = vp8_h_loop_filter8uv_c;

    dsp->vp8_v_loop_filter16y_inner = vp8_v_loop_filter16_inner_c;
    dsp->vp8_h_loop_filter16y_inner = vp8_h_loop_filter16_inner_c;
    dsp->vp8_v_loop_filter8uv_inner = vp8_v_loop_filter8uv_inner_c;
    dsp->vp8_h_loop_filter8uv_inner = vp8_h_loop_filter8uv_inner_c;

    dsp->vp8_v_loop_filter_simple = vp8_v_loop_filter_simple_c;
    dsp->vp8_h_loop_filter_simple = vp8_h_loop_filter_simple_c;

    // table index 0/1/2 <-> block width 16/8/4
    VP8_MC_FUNC(0, 16);
    VP8_MC_FUNC(1, 8);
    VP8_MC_FUNC(2, 4);

    VP8_BILINEAR_MC_FUNC(0, 16);
    VP8_BILINEAR_MC_FUNC(1, 8);
    VP8_BILINEAR_MC_FUNC(2, 4);

    if (HAVE_MMX)
        ff_vp8dsp_init_x86(dsp);
    if (HAVE_ALTIVEC)
        ff_vp8dsp_init_altivec(dsp);
    if (ARCH_ARM)
        ff_vp8dsp_init_arm(dsp);
}