Commit 4596673c authored by Michael Niedermayer

-fPIC compilable

Originally committed as revision 9395 to svn://svn.mplayerhq.hu/mplayer/trunk/postproc
parent b3b8bf64
...@@ -1409,7 +1409,7 @@ static inline void RENAME(yuvPlanartoyuy2)(const uint8_t *ysrc, const uint8_t *u ...@@ -1409,7 +1409,7 @@ static inline void RENAME(yuvPlanartoyuy2)(const uint8_t *ysrc, const uint8_t *u
"addl $8, %%eax \n\t" "addl $8, %%eax \n\t"
"cmpl %4, %%eax \n\t" "cmpl %4, %%eax \n\t"
" jb 1b \n\t" " jb 1b \n\t"
::"r"(dst), "r"(ysrc), "r"(usrc), "r"(vsrc), "r" (chromWidth) ::"r"(dst), "r"(ysrc), "r"(usrc), "r"(vsrc), "g" (chromWidth)
: "%eax" : "%eax"
); );
#else #else
...@@ -1590,7 +1590,7 @@ static inline void RENAME(yuy2toyv12)(const uint8_t *src, uint8_t *ydst, uint8_t ...@@ -1590,7 +1590,7 @@ static inline void RENAME(yuy2toyv12)(const uint8_t *src, uint8_t *ydst, uint8_t
"addl $8, %%eax \n\t" "addl $8, %%eax \n\t"
"cmpl %4, %%eax \n\t" "cmpl %4, %%eax \n\t"
" jb 1b \n\t" " jb 1b \n\t"
::"r"(src), "r"(ydst), "r"(udst), "r"(vdst), "r" (chromWidth) ::"r"(src), "r"(ydst), "r"(udst), "r"(vdst), "g" (chromWidth)
: "memory", "%eax" : "memory", "%eax"
); );
...@@ -1620,7 +1620,7 @@ static inline void RENAME(yuy2toyv12)(const uint8_t *src, uint8_t *ydst, uint8_t ...@@ -1620,7 +1620,7 @@ static inline void RENAME(yuy2toyv12)(const uint8_t *src, uint8_t *ydst, uint8_t
"cmpl %4, %%eax \n\t" "cmpl %4, %%eax \n\t"
" jb 1b \n\t" " jb 1b \n\t"
::"r"(src), "r"(ydst), "r"(udst), "r"(vdst), "r" (chromWidth) ::"r"(src), "r"(ydst), "r"(udst), "r"(vdst), "g" (chromWidth)
: "memory", "%eax" : "memory", "%eax"
); );
#else #else
...@@ -1828,7 +1828,7 @@ static inline void RENAME(uyvytoyv12)(const uint8_t *src, uint8_t *ydst, uint8_t ...@@ -1828,7 +1828,7 @@ static inline void RENAME(uyvytoyv12)(const uint8_t *src, uint8_t *ydst, uint8_t
"addl $8, %%eax \n\t" "addl $8, %%eax \n\t"
"cmpl %4, %%eax \n\t" "cmpl %4, %%eax \n\t"
" jb 1b \n\t" " jb 1b \n\t"
::"r"(src), "r"(ydst), "r"(udst), "r"(vdst), "r" (chromWidth) ::"r"(src), "r"(ydst), "r"(udst), "r"(vdst), "g" (chromWidth)
: "memory", "%eax" : "memory", "%eax"
); );
...@@ -1858,7 +1858,7 @@ static inline void RENAME(uyvytoyv12)(const uint8_t *src, uint8_t *ydst, uint8_t ...@@ -1858,7 +1858,7 @@ static inline void RENAME(uyvytoyv12)(const uint8_t *src, uint8_t *ydst, uint8_t
"cmpl %4, %%eax \n\t" "cmpl %4, %%eax \n\t"
" jb 1b \n\t" " jb 1b \n\t"
::"r"(src), "r"(ydst), "r"(udst), "r"(vdst), "r" (chromWidth) ::"r"(src), "r"(ydst), "r"(udst), "r"(vdst), "g" (chromWidth)
: "memory", "%eax" : "memory", "%eax"
); );
#else #else
...@@ -2385,32 +2385,24 @@ static inline void RENAME(yvu9_to_yuy2)(const uint8_t *src1, const uint8_t *src2 ...@@ -2385,32 +2385,24 @@ static inline void RENAME(yvu9_to_yuy2)(const uint8_t *src1, const uint8_t *src2
int srcStride1, int srcStride2, int srcStride1, int srcStride2,
int srcStride3, int dstStride) int srcStride3, int dstStride)
{ {
unsigned y,x,x2,w,h; unsigned y,x,w,h;
w=width/2; h=height; w=width/2; h=height;
#ifdef HAVE_MMX
asm volatile(
PREFETCH" %0\n\t"
PREFETCH" %1\n\t"
PREFETCH" %2\n\t"
::"m"(*(src1+srcStride1)),"m"(*(src2+srcStride2)),"m"(*(src3+srcStride3)):"memory");
#endif
for(y=0;y<h;y++){ for(y=0;y<h;y++){
const uint8_t* yp=src1+srcStride1*y; const uint8_t* yp=src1+srcStride1*y;
const uint8_t* up=src2+srcStride2*(y>>2); const uint8_t* up=src2+srcStride2*(y>>2);
const uint8_t* vp=src3+srcStride3*(y>>2); const uint8_t* vp=src3+srcStride3*(y>>2);
uint8_t* d=dst+dstStride*y; uint8_t* d=dst+dstStride*y;
x2=0;
x=0; x=0;
#ifdef HAVE_MMX #ifdef HAVE_MMX
for(;x<w-7;x+=8,x2+=32) for(;x<w-7;x+=8)
{ {
asm volatile( asm volatile(
PREFETCH" 32%1\n\t" PREFETCH" 32(%1, %0)\n\t"
PREFETCH" 32%2\n\t" PREFETCH" 32(%2, %0)\n\t"
PREFETCH" 32%3\n\t" PREFETCH" 32(%3, %0)\n\t"
"movq %1, %%mm0\n\t" /* Y0Y1Y2Y3Y4Y5Y6Y7 */ "movq (%1, %0, 4), %%mm0\n\t" /* Y0Y1Y2Y3Y4Y5Y6Y7 */
"movq %2, %%mm1\n\t" /* U0U1U2U3U4U5U6U7 */ "movq (%2, %0), %%mm1\n\t" /* U0U1U2U3U4U5U6U7 */
"movq %3, %%mm2\n\t" /* V0V1V2V3V4V5V6V7 */ "movq (%3, %0), %%mm2\n\t" /* V0V1V2V3V4V5V6V7 */
"movq %%mm0, %%mm3\n\t" /* Y0Y1Y2Y3Y4Y5Y6Y7 */ "movq %%mm0, %%mm3\n\t" /* Y0Y1Y2Y3Y4Y5Y6Y7 */
"movq %%mm1, %%mm4\n\t" /* U0U1U2U3U4U5U6U7 */ "movq %%mm1, %%mm4\n\t" /* U0U1U2U3U4U5U6U7 */
"movq %%mm2, %%mm5\n\t" /* V0V1V2V3V4V5V6V7 */ "movq %%mm2, %%mm5\n\t" /* V0V1V2V3V4V5V6V7 */
...@@ -2423,41 +2415,42 @@ static inline void RENAME(yvu9_to_yuy2)(const uint8_t *src1, const uint8_t *src2 ...@@ -2423,41 +2415,42 @@ static inline void RENAME(yvu9_to_yuy2)(const uint8_t *src1, const uint8_t *src2
"punpcklbw %%mm2, %%mm1\n\t" /* U0V0 U0V0 U1V1 U1V1*/ "punpcklbw %%mm2, %%mm1\n\t" /* U0V0 U0V0 U1V1 U1V1*/
"punpcklbw %%mm1, %%mm0\n\t" /* Y0U0 Y1V0 Y2U0 Y3V0*/ "punpcklbw %%mm1, %%mm0\n\t" /* Y0U0 Y1V0 Y2U0 Y3V0*/
"punpckhbw %%mm1, %%mm3\n\t" /* Y4U1 Y5V1 Y6U1 Y7V1*/ "punpckhbw %%mm1, %%mm3\n\t" /* Y4U1 Y5V1 Y6U1 Y7V1*/
MOVNTQ" %%mm0, %0\n\t" MOVNTQ" %%mm0, (%4, %0, 8)\n\t"
MOVNTQ" %%mm3, 8%0\n\t" MOVNTQ" %%mm3, 8(%4, %0, 8)\n\t"
"punpckhbw %%mm2, %%mm6\n\t" /* U2V2 U2V2 U3V3 U3V3*/ "punpckhbw %%mm2, %%mm6\n\t" /* U2V2 U2V2 U3V3 U3V3*/
"movq 8%1, %%mm0\n\t" "movq 8(%1, %0, 4), %%mm0\n\t"
"movq %%mm0, %%mm3\n\t" "movq %%mm0, %%mm3\n\t"
"punpcklbw %%mm6, %%mm0\n\t" /* Y U2 Y V2 Y U2 Y V2*/ "punpcklbw %%mm6, %%mm0\n\t" /* Y U2 Y V2 Y U2 Y V2*/
"punpckhbw %%mm6, %%mm3\n\t" /* Y U3 Y V3 Y U3 Y V3*/ "punpckhbw %%mm6, %%mm3\n\t" /* Y U3 Y V3 Y U3 Y V3*/
MOVNTQ" %%mm0, 16%0\n\t" MOVNTQ" %%mm0, 16(%4, %0, 8)\n\t"
MOVNTQ" %%mm3, 24%0\n\t" MOVNTQ" %%mm3, 24(%4, %0, 8)\n\t"
"movq %%mm4, %%mm6\n\t" "movq %%mm4, %%mm6\n\t"
"movq 16%1, %%mm0\n\t" "movq 16(%1, %0, 4), %%mm0\n\t"
"movq %%mm0, %%mm3\n\t" "movq %%mm0, %%mm3\n\t"
"punpcklbw %%mm5, %%mm4\n\t" "punpcklbw %%mm5, %%mm4\n\t"
"punpcklbw %%mm4, %%mm0\n\t" /* Y U4 Y V4 Y U4 Y V4*/ "punpcklbw %%mm4, %%mm0\n\t" /* Y U4 Y V4 Y U4 Y V4*/
"punpckhbw %%mm4, %%mm3\n\t" /* Y U5 Y V5 Y U5 Y V5*/ "punpckhbw %%mm4, %%mm3\n\t" /* Y U5 Y V5 Y U5 Y V5*/
MOVNTQ" %%mm0, 32%0\n\t" MOVNTQ" %%mm0, 32(%4, %0, 8)\n\t"
MOVNTQ" %%mm3, 40%0\n\t" MOVNTQ" %%mm3, 40(%4, %0, 8)\n\t"
"punpckhbw %%mm5, %%mm6\n\t" "punpckhbw %%mm5, %%mm6\n\t"
"movq 24%1, %%mm0\n\t" "movq 24(%1, %0, 4), %%mm0\n\t"
"movq %%mm0, %%mm3\n\t" "movq %%mm0, %%mm3\n\t"
"punpcklbw %%mm6, %%mm0\n\t" /* Y U6 Y V6 Y U6 Y V6*/ "punpcklbw %%mm6, %%mm0\n\t" /* Y U6 Y V6 Y U6 Y V6*/
"punpckhbw %%mm6, %%mm3\n\t" /* Y U7 Y V7 Y U7 Y V7*/ "punpckhbw %%mm6, %%mm3\n\t" /* Y U7 Y V7 Y U7 Y V7*/
MOVNTQ" %%mm0, 48%0\n\t" MOVNTQ" %%mm0, 48(%4, %0, 8)\n\t"
MOVNTQ" %%mm3, 56%0\n\t" MOVNTQ" %%mm3, 56(%4, %0, 8)\n\t"
:"=m"(d[8*x]) : "+r" (x)
:"m"(yp[x2]),"m"(up[x]),"m"(vp[x]) : "r"(yp), "r" (up), "r"(vp), "r"(d)
:"memory"); :"memory");
} }
#endif #endif
for(;x<w;x++,x2+=4) for(; x<w; x++)
{ {
const int x2= x<<2;
d[8*x+0]=yp[x2]; d[8*x+0]=yp[x2];
d[8*x+1]=up[x]; d[8*x+1]=up[x];
d[8*x+2]=yp[x2+1]; d[8*x+2]=yp[x2+1];
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment