Commit e42a152b authored by Michael Niedermayer

x86 cpu capabilities detection rewrite / cleanup

Originally committed as revision 3750 to svn://svn.ffmpeg.org/ffmpeg/trunk
parent 74679f5c
...@@ -1169,6 +1169,7 @@ typedef struct AVCodecContext { ...@@ -1169,6 +1169,7 @@ typedef struct AVCodecContext {
#define FF_MM_MMXEXT 0x0002 /* SSE integer functions or AMD MMX ext */ #define FF_MM_MMXEXT 0x0002 /* SSE integer functions or AMD MMX ext */
#define FF_MM_SSE 0x0008 /* SSE functions */ #define FF_MM_SSE 0x0008 /* SSE functions */
#define FF_MM_SSE2 0x0010 /* PIV SSE2 functions */ #define FF_MM_SSE2 0x0010 /* PIV SSE2 functions */
#define FF_MM_3DNOWEXT 0x0020 /* AMD 3DNowExt */
#endif /* HAVE_MMX */ #endif /* HAVE_MMX */
/** /**
......
...@@ -408,6 +408,7 @@ int mm_support(void); ...@@ -408,6 +408,7 @@ int mm_support(void);
#define MM_MMXEXT 0x0002 /* SSE integer functions or AMD MMX ext */ #define MM_MMXEXT 0x0002 /* SSE integer functions or AMD MMX ext */
#define MM_SSE 0x0008 /* SSE functions */ #define MM_SSE 0x0008 /* SSE functions */
#define MM_SSE2 0x0010 /* PIV SSE2 functions */ #define MM_SSE2 0x0010 /* PIV SSE2 functions */
#define MM_3DNOWEXT 0x0020 /* AMD 3DNowExt */
extern int mm_flags; extern int mm_flags;
......
...@@ -27,6 +27,7 @@ int mm_support(void) ...@@ -27,6 +27,7 @@ int mm_support(void)
{ {
int rval = 0; int rval = 0;
int eax, ebx, ecx, edx; int eax, ebx, ecx, edx;
int max_std_level, max_ext_level, std_caps=0, ext_caps=0;
long a, c; long a, c;
__asm__ __volatile__ ( __asm__ __volatile__ (
...@@ -53,57 +54,43 @@ int mm_support(void) ...@@ -53,57 +54,43 @@ int mm_support(void)
if (a == c) if (a == c)
return 0; /* CPUID not supported */ return 0; /* CPUID not supported */
cpuid(0, eax, ebx, ecx, edx); cpuid(0, max_std_level, ebx, ecx, edx);
if (ebx == 0x756e6547 &&
edx == 0x49656e69 &&
ecx == 0x6c65746e) {
/* intel */ if(max_std_level >= 1){
inteltest: cpuid(1, eax, ebx, ecx, std_caps);
cpuid(1, eax, ebx, ecx, edx); if (std_caps & (1<<23))
if ((edx & 0x00800000) == 0)
return 0;
rval |= MM_MMX; rval |= MM_MMX;
if (edx & 0x02000000) if (std_caps & (1<<25))
rval |= MM_MMXEXT | MM_SSE; rval |= MM_MMXEXT | MM_SSE;
if (edx & 0x04000000) if (std_caps & (1<<26))
rval |= MM_SSE2; rval |= MM_SSE2;
return rval; }
} else if (ebx == 0x68747541 &&
cpuid(0x80000000, max_ext_level, ebx, ecx, edx);
if(max_ext_level >= 0x80000001){
cpuid(0x80000001, eax, ebx, ecx, ext_caps);
if (ext_caps & (1<<31))
rval |= MM_3DNOW;
if (ext_caps & (1<<30))
rval |= MM_3DNOWEXT;
if (ext_caps & (1<<23))
rval |= MM_MMX;
}
cpuid(0, eax, ebx, ecx, edx);
if ( ebx == 0x68747541 &&
edx == 0x69746e65 && edx == 0x69746e65 &&
ecx == 0x444d4163) { ecx == 0x444d4163) {
/* AMD */ /* AMD */
cpuid(0x80000000, eax, ebx, ecx, edx); if(ext_caps & (1<<22))
if ((unsigned)eax < 0x80000001)
goto inteltest;
cpuid(0x80000001, eax, ebx, ecx, edx);
if ((edx & 0x00800000) == 0)
return 0;
rval = MM_MMX;
if (edx & 0x80000000)
rval |= MM_3DNOW;
if (edx & 0x00400000)
rval |= MM_MMXEXT; rval |= MM_MMXEXT;
goto inteltest;
} else if (ebx == 0x746e6543 && } else if (ebx == 0x746e6543 &&
edx == 0x48727561 && edx == 0x48727561 &&
ecx == 0x736c7561) { /* "CentaurHauls" */ ecx == 0x736c7561) { /* "CentaurHauls" */
/* VIA C3 */ /* VIA C3 */
cpuid(0x80000000, eax, ebx, ecx, edx); if(ext_caps & (1<<24))
if ((unsigned)eax < 0x80000001)
goto inteltest;
cpuid(0x80000001, eax, ebx, ecx, edx);
rval = 0;
if( edx & ( 1 << 31) )
rval |= MM_3DNOW;
if( edx & ( 1 << 23) )
rval |= MM_MMX;
if( edx & ( 1 << 24) )
rval |= MM_MMXEXT; rval |= MM_MMXEXT;
if(rval==0)
goto inteltest;
return rval;
} else if (ebx == 0x69727943 && } else if (ebx == 0x69727943 &&
edx == 0x736e4978 && edx == 0x736e4978 &&
ecx == 0x64616574) { ecx == 0x64616574) {
...@@ -116,29 +103,21 @@ int mm_support(void) ...@@ -116,29 +103,21 @@ int mm_support(void)
According to the table, the only CPU which supports level According to the table, the only CPU which supports level
2 is also the only one which supports extended CPUID levels. 2 is also the only one which supports extended CPUID levels.
*/ */
if (eax != 2) if (eax < 2)
goto inteltest;
cpuid(0x80000001, eax, ebx, ecx, edx);
if ((eax & 0x00800000) == 0)
return 0;
rval = MM_MMX;
if (eax & 0x01000000)
rval |= MM_MMXEXT;
return rval; return rval;
} else if (ebx == 0x756e6547 && if (ext_caps & (1<<24))
edx == 0x54656e69 && rval |= MM_MMXEXT;
ecx == 0x3638784d) {
/* Tranmeta Crusoe */
cpuid(0x80000000, eax, ebx, ecx, edx);
if ((unsigned)eax < 0x80000001)
return 0;
cpuid(0x80000001, eax, ebx, ecx, edx);
if ((edx & 0x00800000) == 0)
return 0;
return MM_MMX;
} else {
return 0;
} }
#if 0
av_log(NULL, AV_LOG_DEBUG, "%s%s%s%s%s%s\n",
(rval&MM_MMX) ? "MMX ":"",
(rval&MM_MMXEXT) ? "MMX2 ":"",
(rval&MM_SSE) ? "SSE ":"",
(rval&MM_SSE2) ? "SSE2 ":"",
(rval&MM_3DNOW) ? "3DNow ":"",
(rval&MM_3DNOWEXT) ? "3DNowExt ":"");
#endif
return rval;
} }
#ifdef __TEST__ #ifdef __TEST__
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment