Mercurial > libavcodec.hg
annotate x86/cpuid.c @ 9976:e52cd349e708 libavcodec
Only compile in NEON optimizations for H.264 when the H.264 decoder is enabled.
| author | diego |
|---|---|
| date | Wed, 22 Jul 2009 22:33:33 +0000 |
| parents | 7f594601d5e9 |
| children | fbf4d5b1b664 |
| rev | line source |
|---|---|
| 8430 | 1 /* |
| 2 * CPU detection code, extracted from mmx.h | |
| 3 * (c)1997-99 by H. Dietz and R. Fisher | |
| 4 * Converted to C and improved by Fabrice Bellard. | |
| 5 * | |
| 6 * This file is part of FFmpeg. | |
| 7 * | |
| 8 * FFmpeg is free software; you can redistribute it and/or | |
| 9 * modify it under the terms of the GNU Lesser General Public | |
| 10 * License as published by the Free Software Foundation; either | |
| 11 * version 2.1 of the License, or (at your option) any later version. | |
| 12 * | |
| 13 * FFmpeg is distributed in the hope that it will be useful, | |
| 14 * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
| 15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
| 16 * Lesser General Public License for more details. | |
| 17 * | |
| 18 * You should have received a copy of the GNU Lesser General Public | |
| 19 * License along with FFmpeg; if not, write to the Free Software | |
| 20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | |
| 21 */ | |
| 22 | |
| 23 #include <stdlib.h> | |
| 24 #include "libavutil/x86_cpu.h" | |
| 25 #include "libavcodec/dsputil.h" | |
| 26 | |
| 27 #undef printf | |
| 28 | |
| 29 /* ebx saving is necessary for PIC. gcc seems unable to see it alone */ | |
| 30 #define cpuid(index,eax,ebx,ecx,edx)\ | |
| 31 __asm__ volatile\ | |
| 32 ("mov %%"REG_b", %%"REG_S"\n\t"\ | |
| 33 "cpuid\n\t"\ | |
| 34 "xchg %%"REG_b", %%"REG_S\ | |
| 35 : "=a" (eax), "=S" (ebx),\ | |
| 36 "=c" (ecx), "=d" (edx)\ | |
| 37 : "0" (index)); | |
| 38 | |
| 39 /* Function to test if multimedia instructions are supported... */ | |
| 40 int mm_support(void) | |
| 41 { | |
| 42 int rval = 0; | |
| 43 int eax, ebx, ecx, edx; | |
| 44 int max_std_level, max_ext_level, std_caps=0, ext_caps=0; | |
|
9015
a50419dcda53
Remove CPUID availability check on AMD64 as it's architectural.
zuxy
parents:
8590
diff
changeset
|
45 |
|
a50419dcda53
Remove CPUID availability check on AMD64 as it's architectural.
zuxy
parents:
8590
diff
changeset
|
46 #if ARCH_X86_32 |
| 8430 | 47 x86_reg a, c; |
| 48 __asm__ volatile ( | |
| 49 /* See if CPUID instruction is supported ... */ | |
| 50 /* ... Get copies of EFLAGS into eax and ecx */ | |
|
9015
a50419dcda53
Remove CPUID availability check on AMD64 as it's architectural.
zuxy
parents:
8590
diff
changeset
|
51 "pushfl\n\t" |
| 8430 | 52 "pop %0\n\t" |
| 53 "mov %0, %1\n\t" | |
| 54 | |
| 55 /* ... Toggle the ID bit in one copy and store */ | |
| 56 /* to the EFLAGS reg */ | |
| 57 "xor $0x200000, %0\n\t" | |
| 58 "push %0\n\t" | |
|
9015
a50419dcda53
Remove CPUID availability check on AMD64 as it's architectural.
zuxy
parents:
8590
diff
changeset
|
59 "popfl\n\t" |
| 8430 | 60 |
| 61 /* ... Get the (hopefully modified) EFLAGS */ | |
|
9015
a50419dcda53
Remove CPUID availability check on AMD64 as it's architectural.
zuxy
parents:
8590
diff
changeset
|
62 "pushfl\n\t" |
| 8430 | 63 "pop %0\n\t" |
| 64 : "=a" (a), "=c" (c) | |
| 65 : | |
| 66 : "cc" | |
| 67 ); | |
| 68 | |
| 69 if (a == c) | |
| 70 return 0; /* CPUID not supported */ | |
|
9015
a50419dcda53
Remove CPUID availability check on AMD64 as it's architectural.
zuxy
parents:
8590
diff
changeset
|
71 #endif |
| 8430 | 72 |
| 73 cpuid(0, max_std_level, ebx, ecx, edx); | |
| 74 | |
| 75 if(max_std_level >= 1){ | |
| 76 cpuid(1, eax, ebx, ecx, std_caps); | |
| 77 if (std_caps & (1<<23)) | |
| 78 rval |= FF_MM_MMX; | |
| 79 if (std_caps & (1<<25)) | |
|
9342
7f594601d5e9
Rename FF_MM_MMXEXT to FF_MM_MMX2, for both clarity and consistency
stefano
parents:
9329
diff
changeset
|
80 rval |= FF_MM_MMX2 |
| 8590 | 81 #if HAVE_SSE |
| 8430 | 82 | FF_MM_SSE; |
| 83 if (std_caps & (1<<26)) | |
| 84 rval |= FF_MM_SSE2; | |
| 85 if (ecx & 1) | |
| 86 rval |= FF_MM_SSE3; | |
| 87 if (ecx & 0x00000200 ) | |
| 9329 | 88 rval |= FF_MM_SSSE3; |
| 89 if (ecx & 0x00080000 ) | |
| 90 rval |= FF_MM_SSE4; | |
| 91 if (ecx & 0x00100000 ) | |
| 92 rval |= FF_MM_SSE42; | |
| 8430 | 93 #endif |
| 94 ; | |
| 95 } | |
| 96 | |
| 97 cpuid(0x80000000, max_ext_level, ebx, ecx, edx); | |
| 98 | |
| 99 if(max_ext_level >= 0x80000001){ | |
| 100 cpuid(0x80000001, eax, ebx, ecx, ext_caps); | |
| 101 if (ext_caps & (1<<31)) | |
| 102 rval |= FF_MM_3DNOW; | |
| 103 if (ext_caps & (1<<30)) | |
| 104 rval |= FF_MM_3DNOWEXT; | |
| 105 if (ext_caps & (1<<23)) | |
| 106 rval |= FF_MM_MMX; | |
| 107 if (ext_caps & (1<<22)) | |
|
9342
7f594601d5e9
Rename FF_MM_MMXEXT to FF_MM_MMX2, for both clarity and consistency
stefano
parents:
9329
diff
changeset
|
108 rval |= FF_MM_MMX2; |
| 8430 | 109 } |
| 110 | |
| 111 #if 0 | |
| 9329 | 112 av_log(NULL, AV_LOG_DEBUG, "%s%s%s%s%s%s%s%s%s%s\n", |
| 8430 | 113 (rval&FF_MM_MMX) ? "MMX ":"", |
|
9342
7f594601d5e9
Rename FF_MM_MMXEXT to FF_MM_MMX2, for both clarity and consistency
stefano
parents:
9329
diff
changeset
|
114 (rval&FF_MM_MMX2) ? "MMX2 ":"", |
| 8430 | 115 (rval&FF_MM_SSE) ? "SSE ":"", |
| 116 (rval&FF_MM_SSE2) ? "SSE2 ":"", | |
| 117 (rval&FF_MM_SSE3) ? "SSE3 ":"", | |
| 118 (rval&FF_MM_SSSE3) ? "SSSE3 ":"", | |
| 9329 | 119 (rval&FF_MM_SSE4) ? "SSE4.1 ":"", |
| 120 (rval&FF_MM_SSE42) ? "SSE4.2 ":"", | |
| 8430 | 121 (rval&FF_MM_3DNOW) ? "3DNow ":"", |
| 122 (rval&FF_MM_3DNOWEXT) ? "3DNowExt ":""); | |
| 123 #endif | |
| 124 return rval; | |
| 125 } | |
| 126 | |
| 127 #ifdef TEST | |
| 128 int main ( void ) | |
| 129 { | |
| 130 int mm_flags; | |
| 131 mm_flags = mm_support(); | |
| 132 printf("mm_support = 0x%08X\n",mm_flags); | |
| 133 return 0; | |
| 134 } | |
| 135 #endif |
