1 /*****************************************************************************
2 * cpu.c: CPU detection code
3 *****************************************************************************
4 * Copyright (C) 1998-2004 the VideoLAN team
7 * Authors: Samuel Hocevar <sam@zoy.org>
8 * Christophe Massiot <massiot@via.ecp.fr>
9 * Eugenio Jarosiewicz <ej0@cise.ufl.edu>
11 * This program is free software; you can redistribute it and/or modify
12 * it under the terms of the GNU General Public License as published by
13 * the Free Software Foundation; either version 2 of the License, or
14 * (at your option) any later version.
16 * This program is distributed in the hope that it will be useful,
17 * but WITHOUT ANY WARRANTY; without even the implied warranty of
18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19 * GNU General Public License for more details.
21 * You should have received a copy of the GNU General Public License
22 * along with this program; if not, write to the Free Software
23 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
24 *****************************************************************************/
26 /*****************************************************************************
28 *****************************************************************************/
#include <vlc_common.h>

#include <errno.h>
#include <sys/types.h>
45 #define PF_SSE3_INSTRUCTIONS_AVAILABLE 13
50 #if defined(__APPLE__) && (defined(__ppc__) || defined(__ppc64__))
51 #include <sys/sysctl.h>
54 #if defined( __i386__ ) || defined( __x86_64__ ) || defined( __powerpc__ ) \
55 || defined( __ppc__ ) || defined( __ppc64__ ) || defined( __powerpc64__ )
/**
 * Waits for the process that executed a test instruction and reports
 * whether that process terminated successfully.
 *
 * @param psz_capability name of the instruction set; only used in the
 *                       warning printed when the test failed
 * @param pid            process to wait for, or -1 if there is none
 *
 * @return true if the process exited normally with status 0; false if it
 *         did not, if there is no process, or if it cannot be waited for.
 */
static bool check_OS_capability( const char *psz_capability, pid_t pid )
{
    int status;
    pid_t reaped;

    /* NOTE(review): guard reconstructed from the "fail safe" return below;
     * -1 is presumably what the caller passes when no child was created. */
    if( pid == -1 )
        return false; /* fail safe :-/ */

    /* Retry only when a signal interrupted the wait. Any other failure
     * (e.g. ECHILD) is permanent, and retrying would spin forever. */
    do
        reaped = waitpid( pid, &status, 0 );
    while( reaped == -1 && errno == EINTR );

    if( reaped == -1 )
        return false;

    if( WIFEXITED( status ) && WEXITSTATUS( status ) == 0 )
        return true;

    fprintf( stderr, "warning: your CPU has %s instructions, but not your "
                     "operating system.\n", psz_capability );
    fprintf( stderr, " some optimizations will be disabled unless "
                     "you upgrade your OS\n" );
    return false;
}
/*
 * check_capability(name, flag, code): probe helper used by CPUCapabilities().
 * Two alternative definitions are visible below (the preprocessor conditional
 * that selects between them is not part of this listing):
 *  - the first restores the default SIGILL disposition, executes `code` as
 *    inline assembly and ORs `flag` into i_capabilities only when
 *    check_OS_capability(name, pid) returns true;
 *  - the second ORs `flag` into i_capabilities with no visible test.
 * Both expand in a scope that provides i_capabilities (and, for the first
 * one, pid).
 * NOTE(review): several continuation lines of both macros are missing here;
 * presumably the first one runs `code` in a fork()ed child - confirm against
 * the complete file.
 */
76 # define check_capability(name, flag, code) \
81 signal(SIGILL, SIG_DFL); \
82 __asm__ __volatile__ ( code : : ); \
85 if( check_OS_capability((name), pid )) \
86 i_capabilities |= (flag); \
90 # define check_capability(name, flag, code) \
92 i_capabilities |= (flag); \
97 /*****************************************************************************
98 * CPUCapabilities: get the CPU capabilities
99 *****************************************************************************
100 * This function is called to list extensions the CPU may have.
101 *****************************************************************************/
/*
 * Returns a bit mask of CPU_CAPABILITY_* flags accumulated in i_capabilities.
 * The visible preprocessor branches cover three families: x86 (i386/x86_64),
 * ARM and PowerPC.
 * NOTE(review): this listing shows only part of the function (braces, the
 * cpuid() invocations and most #else/#endif lines are not visible), so the
 * comments added below describe only what the visible lines establish.
 */
102 uint32_t CPUCapabilities( void )
104 uint32_t i_capabilities
= 0;
106 #if defined( __i386__ ) || defined( __x86_64__ )
107 unsigned int i_eax
, i_ebx
, i_ecx
, i_edx
;
/*
 * Bit masks tested further down. The bit positions follow from the
 * constants; the cpuid() calls that load the registers are not visible in
 * this listing, so which CPUID leaf each test refers to is an assumption to
 * confirm.
 *   i_edx & 0x00800000  bit 23  MMX
 *   i_edx & 0x02000000  bit 25  MMXEXT, then the SSE test
 *   i_edx & 0x04000000  bit 26  SSE2
 *   i_ecx & 0x00000001  bit  0  SSE3
 *   i_ecx & 0x00000200  bit  9  SSSE3
 *   i_ecx & 0x00080000  bit 19  SSE4.1
 *   i_ecx & 0x00100000  bit 20  SSE4.2
 *   i_edx & 0x80000000  bit 31  3D Now!
 *   i_edx & 0x00400000  bit 22  MMXEXT, only when b_amd is set
 */
110 /* Needed for x86 CPU capabilities detection */
111 # if defined( __x86_64__ )
112 # define cpuid( reg ) \
113 asm volatile ( "cpuid\n\t" \
114 "movl %%ebx,%1\n\t" \
122 # define cpuid( reg ) \
123 asm volatile ( "push %%ebx\n\t" \
125 "movl %%ebx,%1\n\t" \
134 /* Check if the OS really supports the requested instructions */
135 # if defined (__i386__) && !defined (__i486__) && !defined (__i586__) \
136 && !defined (__i686__) && !defined (__pentium4__) \
137 && !defined (__k6__) && !defined (__athlon__) && !defined (__k8__)
138 /* check if cpuid instruction is supported */
139 asm volatile ( "push %%ebx\n\t"
142 "movl %%eax, %%ebx\n\t"
143 "xorl $0x200000, %%eax\n\t"
159 /* the CPU supports the CPUID instruction - get its level */
162 # if defined (__i386__) && !defined (__i586__) \
163 && !defined (__i686__) && !defined (__pentium4__) \
164 && !defined (__k6__) && !defined (__athlon__) && !defined (__k8__)
169 /* borrowed from mpeg2dec */
/* The three constants are the little-endian ASCII words "Auth", "cAMD" and
 * "enti", i.e. the pieces of the CPUID vendor string "AuthenticAMD". */
170 b_amd
= ( i_ebx
== 0x68747541 ) && ( i_ecx
== 0x444d4163 )
171 && ( i_edx
== 0x69746e65 );
173 /* test for the MMX flag */
176 # if !defined (__MMX__)
177 if( ! (i_edx
& 0x00800000) )
180 i_capabilities
|= CPU_CAPABILITY_MMX
;
181 # if defined (__SSE__)
182 i_capabilities
|= CPU_CAPABILITY_MMXEXT
| CPU_CAPABILITY_SSE
;
184 if( i_edx
& 0x02000000 )
186 i_capabilities
|= CPU_CAPABILITY_MMXEXT
;
188 # ifdef CAN_COMPILE_SSE
190 if( IsProcessorFeaturePresent( PF_XMMI_INSTRUCTIONS_AVAILABLE
) )
191 i_capabilities
|= CPU_CAPABILITY_SSE
;
193 check_capability( "SSE", CPU_CAPABILITY_SSE
,
194 "xorps %%xmm0,%%xmm0\n" );
200 # if defined (__SSE2__)
201 i_capabilities
|= CPU_CAPABILITY_SSE2
;
202 # elif defined (CAN_COMPILE_SSE2)
203 if( i_edx
& 0x04000000 )
206 if( IsProcessorFeaturePresent( PF_XMMI64_INSTRUCTIONS_AVAILABLE
) )
207 i_capabilities
|= CPU_CAPABILITY_SSE2
;
209 check_capability( "SSE2", CPU_CAPABILITY_SSE2
,
210 "movupd %%xmm0, %%xmm0\n" );
215 # if defined (__SSE3__)
216 i_capabilities
|= CPU_CAPABILITY_SSE3
;
217 # elif defined (CAN_COMPILE_SSE3)
218 if( i_ecx
& 0x00000001 )
221 if( IsProcessorFeaturePresent( PF_SSE3_INSTRUCTIONS_AVAILABLE
) )
222 i_capabilities
|= CPU_CAPABILITY_SSE3
;
224 check_capability( "SSE3", CPU_CAPABILITY_SSE3
,
225 "movsldup %%xmm1, %%xmm0\n" );
230 # if defined (__SSSE3__)
231 i_capabilities
|= CPU_CAPABILITY_SSSE3
;
232 # elif defined (CAN_COMPILE_SSSE3)
234 /* FIXME: IsProcessorFeaturePresent can't check for SSSE3 */
236 if( i_ecx
& 0x00000200 )
237 check_capability( "SSSE3", CPU_CAPABILITY_SSSE3
,
238 "pabsw %%xmm1, %%xmm0\n" );
242 # if defined (__SSE4_1__)
243 i_capabilities
|= CPU_CAPABILITY_SSE4_1
;
244 # elif defined (CAN_COMPILE_SSE4_1)
246 /* FIXME: IsProcessorFeaturePresent can't check for SSE4.1 */
248 if( i_ecx
& 0x00080000 )
249 check_capability( "SSE4.1", CPU_CAPABILITY_SSE4_1
,
250 "pmaxsb %%xmm1, %%xmm0\n" );
254 # if defined (__SSE4_2__)
255 i_capabilities
|= CPU_CAPABILITY_SSE4_2
;
256 # elif defined (CAN_COMPILE_SSE4_2)
258 /* FIXME: IsProcessorFeaturePresent can't check for SSE4.2 */
260 if( i_ecx
& 0x00100000 )
261 check_capability( "SSE4.2", CPU_CAPABILITY_SSE4_2
,
262 "pcmpgtq %%xmm1, %%xmm0\n" );
266 /* test for additional capabilities */
269 if( i_eax
< 0x80000001 )
272 /* list these additional capabilities */
275 # if defined (__3dNOW__)
276 i_capabilities
|= CPU_CAPABILITY_3DNOW
;
277 # elif defined (CAN_COMPILE_3DNOW)
279 if( i_edx
& 0x80000000 )
282 if( IsProcessorFeaturePresent( PF_3DNOW_INSTRUCTIONS_AVAILABLE
) )
283 i_capabilities
|= CPU_CAPABILITY_3DNOW
;
285 check_capability( "3D Now!", CPU_CAPABILITY_3DNOW
,
286 "pfadd %%mm0,%%mm0\n" "femms\n" );
291 if( b_amd
&& ( i_edx
& 0x00400000 ) )
293 i_capabilities
|= CPU_CAPABILITY_MMXEXT
;
297 #elif defined( __arm__ )
298 # if defined( __ARM_NEON__ )
299 i_capabilities
|= CPU_CAPABILITY_NEON
;
302 #elif defined( __powerpc__ ) || defined( __ppc__ ) || defined( __powerpc64__ ) \
303 || defined( __ppc64__ )
305 # if defined(__APPLE__)
/* Query sysctl { CTL_HW, HW_VECTORUNIT }; a successful call that yields a
 * non-zero value sets the AltiVec flag. */
306 int selectors
[2] = { CTL_HW
, HW_VECTORUNIT
};
307 int i_has_altivec
= 0;
308 size_t i_length
= sizeof( i_has_altivec
);
309 int i_error
= sysctl( selectors
, 2, &i_has_altivec
, &i_length
, NULL
, 0);
311 if( i_error
== 0 && i_has_altivec
!= 0 )
312 i_capabilities
|= CPU_CAPABILITY_ALTIVEC
;
314 # elif defined( CAN_COMPILE_ALTIVEC )
/* Restores the default SIGILL disposition and executes an AltiVec `vand`;
 * the flag is set only if check_OS_capability() accepts the outcome.
 * NOTE(review): the lines that create `pid` are not visible in this listing. */
318 signal(SIGILL
, SIG_DFL
);
319 asm volatile ("mtspr 256, %0\n\t"
320 "vand %%v0, %%v0, %%v0"
326 if( check_OS_capability( "Altivec", pid
) )
327 i_capabilities
|= CPU_CAPABILITY_ALTIVEC
;
332 return i_capabilities
;
335 uint32_t cpu_flags
= 0;
338 /*****************************************************************************
339 * vlc_CPU: get pre-computed CPU capability flags
340 ****************************************************************************/
341 unsigned vlc_CPU (void)
/* Each entry pairs a CPU_CAPABILITY_* flag with a plugin directory name.
 * Presumably these are the elements of the cap_dirs table (its declaration
 * is not visible here) that vlc_CPU_CheckPluginDir() scans by name before
 * testing the flag. Entries are compiled in per target architecture. */
/* NOTE(review): the PowerPC guard below does not test __powerpc64__, whereas
 * the AltiVec detection guards earlier in this file do - confirm whether the
 * difference is intentional. */
351 #if defined ( __i386__ ) || defined ( __x86_64__ )
352 { CPU_CAPABILITY_MMX
, "mmx" },
353 { CPU_CAPABILITY_MMXEXT
, "mmxext" },
354 { CPU_CAPABILITY_3DNOW
, "3dnow" },
355 { CPU_CAPABILITY_SSE
, "sse" },
357 #if defined (__ppc__) || defined (__ppc64__) || defined (__powerpc__)
358 { CPU_CAPABILITY_ALTIVEC
, "altivec" },
360 #if defined (__arm__)
361 { CPU_CAPABILITY_NEON
, "arm_neon" },
366 * Check if a directory name contains usable plugins w.r.t. the hardware
367 * capabilities. Loading a plugin when the hardware has insufficient
368 * capabilities may lead to illegal instructions (SIGILL) and must be avoided.
370 * @param name the name of the directory (<b>not</b> the path)
372 * @return true if the hardware has sufficient capabilities or the directory
373 * does not require any special capability; false if the running hardware has
374 * insufficient capabilities.
376 bool vlc_CPU_CheckPluginDir (const char *name
)
378 const unsigned flags
= vlc_CPU ();
379 for (size_t i
= 0; i
< sizeof (cap_dirs
) / sizeof (cap_dirs
[0]); i
++)
381 if (strcmp (name
, cap_dirs
[i
].name
))
383 return (flags
& cap_dirs
[i
].value
) != 0;
388 static vlc_memcpy_t pf_vlc_memcpy
= memcpy
;
389 static vlc_memset_t pf_vlc_memset
= memset
;
391 void vlc_fastmem_register (vlc_memcpy_t cpy
, vlc_memset_t set
)
/**
 * vlc_memcpy: fast CPU-dependent memcpy
 *
 * Forwards the call unchanged to the routine held in pf_vlc_memcpy, which
 * this file initialises to memcpy.
 *
 * @param tgt first argument passed to the routine (destination for memcpy)
 * @param src second argument passed to the routine (source for memcpy)
 * @param n   third argument passed to the routine (byte count for memcpy)
 * @return whatever the routine returns
 */
void *vlc_memcpy (void *tgt, const void *src, size_t n)
{
    return pf_vlc_memcpy (tgt, src, n);
}
/**
 * vlc_memset: fast CPU-dependent memset
 *
 * Forwards the call unchanged to the routine held in pf_vlc_memset, which
 * this file initialises to memset.
 *
 * @param tgt first argument passed to the routine (buffer for memset)
 * @param c   second argument passed to the routine (fill value for memset)
 * @param n   third argument passed to the routine (byte count for memset)
 * @return whatever the routine returns
 */
void *vlc_memset (void *tgt, int c, size_t n)
{
    return pf_vlc_memset (tgt, c, n);
}