Implement full horizontal chroma for rgb/bgr24/32 output.

Originally committed as revision 27580 to svn://svn.mplayerhq.hu/mplayer/trunk/libswscale

Implement full horizontal chroma for rgb/bgr24/32 output.
Originally committed as revision 27580 to svn://svn.mplayerhq.hu/mplayer/trunk/libswscale
f0faee4c · Michael Niedermayer · 36b3e36e · f0faee4c · f0faee4c
Commit f0faee4c authored Sep 11, 2008 by Michael Niedermayer
Show whitespace changes
Inline Side-by-side

Showing with 115 additions and 1 deletion

swscale.c libswscale/swscale.c +87 -1

swscale_template.c libswscale/swscale_template.c +28 -0

No files found.
--- a/libswscale/swscale.c
+++ b/libswscale/swscale.c
@@ -473,6 +473,43 @@ static inline void yuv2nv12XinC(int16_t *lumFilter, int16_t **lumSrc, int lumFil
            else if (V<0) V=0;    \
        }

+#define YSCALE_YUV_2_PACKEDX_FULL_C /* opens a per-pixel loop that the macro's user must close with '}' */ \
+    for (i=0; i<dstW; i++){\
+        int j;\
+        int Y = 0;\
+        int U = -(128<<19); /* written as -(128<<19): left-shifting a negative value is undefined in C */\
+        int V = -(128<<19); /* multiple of 1<<10, so it becomes exactly -(128<<9) after the >>10 below */\
+        int R,G,B; /* declared here, assigned by the code that follows this macro */\
+        \
+        for (j=0; j<lumFilterSize; j++){ /* vertical luma filter: one tap per source line */\
+            Y += lumSrc[j][i     ] * lumFilter[j];\
+        }\
+        for (j=0; j<chrFilterSize; j++){ /* chroma is read at index i, i.e. one U/V pair per output pixel */\
+            U += chrSrc[j][i     ] * chrFilter[j];\
+            V += chrSrc[j][i+VOFW] * chrFilter[j]; /* V samples sit VOFW entries after U in the same row */\
+        }\
+        Y >>=10; /* drop 10 fractional bits from each accumulator */\
+        U >>=10;\
+        V >>=10;\
+
+#define YSCALE_YUV_2_RGBX_FULL_C(rnd) /* rnd is added to the scaled luma, so it offsets R, G and B equally */ \
+    YSCALE_YUV_2_PACKEDX_FULL_C /* opens the per-pixel loop and yields Y, U, V; the loop is still open after this macro */\
+        Y-= c->oy;\
+        Y*= c->cy;\
+        Y+= rnd;\
+        R= Y + V*c->cvr;\
+        G= Y + V*c->cvg + U*c->cug;\
+        B= Y +            U*c->cub;\
+        if ((R|G|B)&(0xC0000000)){ /* bit 30 or 31 set in any component: negative or >= 256<<22, so clip */\
+            if (R>=(256<<22))   R=(256<<22)-1; \
+            else if (R<0)R=0;   \
+            if (G>=(256<<22))   G=(256<<22)-1; \
+            else if (G<0)G=0;   \
+            if (B>=(256<<22))   B=(256<<22)-1; \
+            else if (B<0)B=0;   \
+        } /* after clipping each component is in 0..(256<<22)-1, so value>>22 is in 0..255 */\
+
+
 #define YSCALE_YUV_2_GRAY16_C \
    for (i=0; i<(dstW>>1); i++){\
        int j;\
@@ -756,6 +793,42 @@ static inline void yuv2packedXinC(SwsContext *c, int16_t *lumFilter, int16_t **l
    YSCALE_YUV_2_ANYRGB_C(YSCALE_YUV_2_RGBX_C, YSCALE_YUV_2_PACKEDX_C(void), YSCALE_YUV_2_GRAY16_C, YSCALE_YUV_2_MONOBLACKX_C)
 }

+static inline void yuv2rgbXinC_full(SwsContext *c, int16_t *lumFilter, int16_t **lumSrc, int lumFilterSize,
+                                    int16_t *chrFilter, int16_t **chrSrc, int chrFilterSize,
+                                    uint8_t *dest, int dstW, int y)
+{   /* Writes dstW packed RGB/BGR pixels to dest, reading one chroma pair per output pixel; y is not used here. */
+    int i;
+    int step= fmt_depth(c->dstFormat)/8; /* bytes dest advances per pixel; presumably depth in bits / 8 - confirm */
+    int aidx= (c->dstFormat==PIX_FMT_ARGB || c->dstFormat==PIX_FMT_ABGR) ? -1 : step-1; /* alpha slot relative to dest: the byte skipped by dest++ for A-first layouts, else the pixel's last byte, so no store leaves the pixel */
+    switch(c->dstFormat){
+    case PIX_FMT_ARGB:
+        dest++; /* step over the leading alpha byte, then fall through */
+    case PIX_FMT_RGB24:
+    case PIX_FMT_RGBA:
+        YSCALE_YUV_2_RGBX_FULL_C(1<<21) /* opens the per-pixel loop; 1<<21 is half of the 1<<22 unit removed by >>22 */
+            dest[aidx]= 0; /* stored first: for 3-byte pixels aidx==2 and the dest[2] store below overwrites it */
+            dest[0]= R>>22;
+            dest[1]= G>>22;
+            dest[2]= B>>22;
+            dest+= step;
+        } /* closes the loop opened inside the macro */
+        break;
+    case PIX_FMT_ABGR:
+        dest++; /* step over the leading alpha byte, then fall through */
+    case PIX_FMT_BGR24:
+    case PIX_FMT_BGRA:
+        YSCALE_YUV_2_RGBX_FULL_C(1<<21) /* same conversion as above, channels stored in B,G,R order */
+            dest[aidx]= 0; /* stored first: for 3-byte pixels aidx==2 and the dest[2] store below overwrites it */
+            dest[0]= B>>22;
+            dest[1]= G>>22;
+            dest[2]= R>>22;
+            dest+= step;
+        } /* closes the loop opened inside the macro */
+        break;
+    default:
+        assert(0); /* any other destination format is not handled by this function */
+    }
+}

 //Note: we have C, X86, MMX, MMX2, 3DNOW version therse no 3DNOW+MMX2 one
 //Plain C versions
@@ -1880,6 +1953,13 @@ int sws_setColorspaceDetails(SwsContext *c, const int inv_table[4], int srcRange
    c->ugCoeff=   roundToInt16(cgu*8192) * 0x0001000100010001ULL;
    c->yOffset=   roundToInt16(oy *   8) * 0x0001000100010001ULL;

+    c->cy = (int16_t)roundToInt16(cy <<13);
+    c->oy = (int16_t)roundToInt16(oy <<9);
+    c->cvr= (int16_t)roundToInt16(crv<<13);
+    c->cvg= (int16_t)roundToInt16(cgv<<13);
+    c->cug= (int16_t)roundToInt16(cgu<<13);
+    c->cub= (int16_t)roundToInt16(cbu<<13);
+
    yuv2rgb_c_init_tables(c, inv_table, srcRange, brightness, contrast, saturation);
    //FIXME factorize

@@ -1993,7 +2073,13 @@ SwsContext *sws_getContext(int srcW, int srcH, int srcFormat, int dstW, int dstH
        av_log(NULL, AV_LOG_ERROR, "swScaler: Exactly one scaler algorithm must be choosen\n");
        return NULL;
    }
-
+if(   dstFormat != PIX_FMT_RGB32 //HACK
+   && dstFormat != PIX_FMT_RGB32_1
+   && dstFormat != PIX_FMT_RGB24
+   && dstFormat != PIX_FMT_BGR24
+   && dstFormat != PIX_FMT_BGR32
+   && dstFormat != PIX_FMT_BGR32_1)
+    flags &= ~SWS_FULL_CHR_H_INT;

    /* sanity check */
    if (srcW<4 || srcH<1 || dstW<8 || dstH<1) //FIXME check if these are enough and try to lowwer them after fixing the relevant parts of the code

--- a/libswscale/swscale_template.c
+++ b/libswscale/swscale_template.c
@@ -3132,9 +3132,16 @@ static int RENAME(swScale)(SwsContext *c, uint8_t* src[], int srcStride[], int s
                if (vLumFilterSize == 1 && vChrFilterSize == 2) //unscaled RGB
                {
                    int chrAlpha= vChrFilter[2*dstY+1];
+                    if(flags & SWS_FULL_CHR_H_INT){
+                        yuv2rgbXinC_full(c, //FIXME write a packed1_full function
+                            vLumFilter+dstY*vLumFilterSize, lumSrcPtr, vLumFilterSize,
+                            vChrFilter+dstY*vChrFilterSize, chrSrcPtr, vChrFilterSize,
+                            dest, dstW, dstY);
+                    }else{
                    RENAME(yuv2packed1)(c, *lumSrcPtr, *chrSrcPtr, *(chrSrcPtr+1),
                        dest, dstW, chrAlpha, dstFormat, flags, dstY);
                    }
+                }
                else if (vLumFilterSize == 2 && vChrFilterSize == 2) //bilinear upscale RGB
                {
                    int lumAlpha= vLumFilter[2*dstY+1];
@@ -3143,11 +3150,24 @@ static int RENAME(swScale)(SwsContext *c, uint8_t* src[], int srcStride[], int s
                    lumMmxFilter[3]= vLumFilter[2*dstY   ]*0x10001;
                    chrMmxFilter[2]=
                    chrMmxFilter[3]= vChrFilter[2*chrDstY]*0x10001;
+                    if(flags & SWS_FULL_CHR_H_INT){
+                        yuv2rgbXinC_full(c, //FIXME write a packed2_full function
+                            vLumFilter+dstY*vLumFilterSize, lumSrcPtr, vLumFilterSize,
+                            vChrFilter+dstY*vChrFilterSize, chrSrcPtr, vChrFilterSize,
+                            dest, dstW, dstY);
+                    }else{
                    RENAME(yuv2packed2)(c, *lumSrcPtr, *(lumSrcPtr+1), *chrSrcPtr, *(chrSrcPtr+1),
                        dest, dstW, lumAlpha, chrAlpha, dstY);
                    }
+                }
                else //general RGB
                {
+                    if(flags & SWS_FULL_CHR_H_INT){
+                        yuv2rgbXinC_full(c,
+                            vLumFilter+dstY*vLumFilterSize, lumSrcPtr, vLumFilterSize,
+                            vChrFilter+dstY*vChrFilterSize, chrSrcPtr, vChrFilterSize,
+                            dest, dstW, dstY);
+                    }else{
                    RENAME(yuv2packedX)(c,
                        vLumFilter+dstY*vLumFilterSize, lumSrcPtr, vLumFilterSize,
                        vChrFilter+dstY*vChrFilterSize, chrSrcPtr, vChrFilterSize,
@@ -3155,6 +3175,7 @@ static int RENAME(swScale)(SwsContext *c, uint8_t* src[], int srcStride[], int s
                    }
                }
            }
+        }
        else // hmm looks like we can't use MMX here without overwriting this array's tail
        {
            int16_t **lumSrcPtr= lumPixBuf + lumBufIndex + firstLumSrcY - lastInLumBuf + vLumBufSize;
@@ -3180,6 +3201,12 @@ static int RENAME(swScale)(SwsContext *c, uint8_t* src[], int srcStride[], int s
            {
                assert(lumSrcPtr + vLumFilterSize - 1 < lumPixBuf + vLumBufSize*2);
                assert(chrSrcPtr + vChrFilterSize - 1 < chrPixBuf + vChrBufSize*2);
+                if(flags & SWS_FULL_CHR_H_INT){
+                    yuv2rgbXinC_full(c,
+                        vLumFilter+dstY*vLumFilterSize, lumSrcPtr, vLumFilterSize,
+                        vChrFilter+dstY*vChrFilterSize, chrSrcPtr, vChrFilterSize,
+                        dest, dstW, dstY);
+                }else{
                yuv2packedXinC(c,
                    vLumFilter+dstY*vLumFilterSize, lumSrcPtr, vLumFilterSize,
                    vChrFilter+dstY*vChrFilterSize, chrSrcPtr, vChrFilterSize,
@@ -3187,6 +3214,7 @@ static int RENAME(swScale)(SwsContext *c, uint8_t* src[], int srcStride[], int s
                }
            }
        }
+    }

 #ifdef HAVE_MMX
    asm volatile(SFENCE:::"memory");