/*****************************************************************************
* cpu.c: CPU detection code
*****************************************************************************
- * Copyright (C) 1998-2004 VideoLAN
+ * Copyright (C) 1998-2004 VLC authors and VideoLAN
* $Id$
*
* Authors: Samuel Hocevar <sam@zoy.org>
* Christophe Massiot <massiot@via.ecp.fr>
* Eugenio Jarosiewicz <ej0@cise.ufl.eduEujenio>
*
- * This program is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 2 of the License, or
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms of the GNU Lesser General Public License as published by
+ * the Free Software Foundation; either version 2.1 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU Lesser General Public License for more details.
*
- * You should have received a copy of the GNU General Public License
- * along with this program; if not, write to the Free Software
- * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111, USA.
+ * You should have received a copy of the GNU Lesser General Public License
+ * along with this program; if not, write to the Free Software Foundation,
+ * Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
*****************************************************************************/
/*****************************************************************************
* Preamble
*****************************************************************************/
-#include <vlc/vlc.h>
-
-#ifdef HAVE_SIGNAL_H
-# include <signal.h> /* SIGHUP, SIGINT, SIGKILL */
-# include <setjmp.h> /* longjmp, setjmp */
+#ifdef HAVE_CONFIG_H
+# include "config.h"
#endif
-#ifdef SYS_DARWIN
-#include <sys/sysctl.h>
-#endif
+#include <vlc_common.h>
+#include <vlc_cpu.h>
+#include "libvlc.h"
-#include "vlc_cpu.h"
+#include <assert.h>
-/*****************************************************************************
- * Local prototypes
- *****************************************************************************/
-#ifdef HAVE_SIGNAL_H
-static void SigHandler ( int );
+#ifndef __linux__
+#include <sys/types.h>
+#ifndef WIN32
+#include <errno.h>
+#include <unistd.h>
+#include <sys/wait.h>
+#include <signal.h>
+#else
+#include <errno.h>
#endif
-/*****************************************************************************
- * Global variables - they're needed for signal handling
- *****************************************************************************/
-#ifdef HAVE_SIGNAL_H
-static jmp_buf env;
-static int i_illegal;
-#if defined( __i386__ ) || defined( __x86_64__ )
-static char *psz_capability;
+#ifdef __APPLE__
+#include <sys/sysctl.h>
#endif
+
+#if defined(__OpenBSD__) && defined(__powerpc__)
+#include <sys/param.h>
+#include <sys/sysctl.h>
+#include <machine/cpu.h>
#endif
-/*****************************************************************************
- * CPUCapabilities: get the CPU capabilities
- *****************************************************************************
- * This function is called to list extensions the CPU may have.
- *****************************************************************************/
-uint32_t CPUCapabilities( void )
+static uint32_t cpu_flags;
+
+#if defined (__i386__) || defined (__x86_64__) || defined (__powerpc__) \
+ || defined (__ppc__) || defined (__ppc64__) || defined (__powerpc64__)
+# if !defined (WIN32) && !defined (__OS2__)
+/**
+ * Checks whether the operating system lets a process execute instructions
+ * from a given CPU extension.
+ *
+ * The probe function runs in a forked child process, so that a fatal signal
+ * raised by the instruction (e.g. SIGILL) only terminates the child. The
+ * parent then inspects the exit status of the child.
+ *
+ * @param name name of the instruction set, only used in the warning message
+ * @param func function executing one instruction from the set
+ * @return true if the child ran func() and exited with status 0;
+ *         false if fork() or waitpid() failed, or if the child did not
+ *         exit normally with status 0
+ */
+static bool vlc_CPU_check (const char *name, void (*func) (void))
{
- volatile uint32_t i_capabilities = CPU_CAPABILITY_NONE;
+    pid_t pid = fork();
-#if defined( SYS_DARWIN )
- int selectors[2] = { CTL_HW, HW_VECTORUNIT };
- int i_has_altivec = 0;
- size_t i_length = sizeof( i_has_altivec );
- int i_error = sysctl( selectors, 2, &i_has_altivec, &i_length, NULL, 0);
+    switch (pid)
+    {
+        case 0:
+            /* Child: make sure SIGILL has its default (fatal) action rather
+             * than a disposition inherited from the parent process. */
+            signal (SIGILL, SIG_DFL);
+            func ();
+            _exit (0);
+        case -1:
+            return false;
+        default:
+            break;
+    }
- i_capabilities |= CPU_CAPABILITY_FPU;
+    int status;
+    pid_t ret;
+
+    /* Retry only when the wait was interrupted by a signal. Any other
+     * failure (e.g. ECHILD when the process ignores SIGCHLD) is permanent:
+     * retrying would spin forever, so report the check as failed. */
+    do
+        ret = waitpid (pid, &status, 0);
+    while (ret == -1 && errno == EINTR);
+
+    if (ret == -1)
+        return false;
- if( i_error == 0 && i_has_altivec != 0 )
- i_capabilities |= CPU_CAPABILITY_ALTIVEC;
+    if( WIFEXITED( status ) && WEXITSTATUS( status ) == 0 )
+        return true;
- return i_capabilities;
+    fprintf (stderr, "Warning: your CPU has %s instructions, but not your "
+                     "operating system.\n", name);
+    fprintf( stderr, " some optimizations will be disabled unless "
+                     "you upgrade your OS\n" );
+    return false;
+}
-#elif defined( __i386__ ) || defined( __x86_64__ )
- volatile unsigned int i_eax, i_ebx, i_ecx, i_edx;
- volatile vlc_bool_t b_amd;
+#if defined (CAN_COMPILE_SSE) && !defined (__SSE__) /* probe is only built when SSE is not already enabled at compile time */
+VLC_SSE static void SSE_test (void) /* probe passed to vlc_CPU_check(): executes one SSE instruction */
+{
+ asm volatile ("xorps %%xmm0,%%xmm0\n" : : : "xmm0", "xmm1"); /* xorps is the SSE instruction under test */
+}
+#endif
+#if defined (CAN_COMPILE_SSE2) && !defined (__SSE2__) /* probe is only built when SSE2 is not already enabled at compile time */
+VLC_SSE static void SSE2_test (void) /* probe passed to vlc_CPU_check(): executes one SSE2 instruction */
+{
+ asm volatile ("movupd %%xmm0, %%xmm0\n" : : : "xmm0", "xmm1"); /* movupd is the SSE2 instruction under test */
+}
+#endif
+#if defined (CAN_COMPILE_SSE3) && !defined (__SSE3__) /* probe is only built when SSE3 is not already enabled at compile time */
+VLC_SSE static void SSE3_test (void) /* probe passed to vlc_CPU_check(): executes one SSE3 instruction */
+{
+ asm volatile ("movsldup %%xmm1, %%xmm0\n" : : : "xmm0", "xmm1"); /* movsldup is the SSE3 instruction under test */
+}
+#endif
+#if defined (CAN_COMPILE_SSSE3) && !defined (__SSSE3__) /* probe is only built when SSSE3 is not already enabled at compile time */
+VLC_SSE static void SSSE3_test (void) /* probe passed to vlc_CPU_check(): executes one SSSE3 instruction */
+{
+ asm volatile ("pabsw %%xmm1, %%xmm0\n" : : : "xmm0", "xmm1"); /* pabsw (xmm form) is the SSSE3 instruction under test */
+}
+#endif
+#if defined (CAN_COMPILE_SSE4_1) && !defined (__SSE4_1__) /* probe is only built when SSE4.1 is not already enabled at compile time */
+VLC_SSE static void SSE4_1_test (void) /* probe passed to vlc_CPU_check(): executes one SSE4.1 instruction */
+{
+ asm volatile ("pmaxsb %%xmm1, %%xmm0\n" : : : "xmm0", "xmm1"); /* pmaxsb is the SSE4.1 instruction under test */
+}
+#endif
+#if defined (CAN_COMPILE_SSE4_2) && !defined (__SSE4_2__) /* probe is only built when SSE4.2 is not already enabled at compile time */
+VLC_SSE static void SSE4_2_test (void) /* probe passed to vlc_CPU_check(): executes one SSE4.2 instruction */
+{
+ asm volatile ("pcmpgtq %%xmm1, %%xmm0\n" : : : "xmm0", "xmm1"); /* pcmpgtq is the SSE4.2 instruction under test */
+}
+#endif
+#if defined (CAN_COMPILE_3DNOW) && !defined (__3dNOW__) /* probe is only built when 3DNow! is not already enabled at compile time */
+VLC_MMX static void ThreeD_Now_test (void) /* probe passed to vlc_CPU_check(): executes 3DNow! instructions */
+{
+ asm volatile ("pfadd %%mm0,%%mm0\n" "femms\n" : : : "mm0"); /* pfadd is the instruction under test; femms then leaves MMX state */
+}
+#endif
- /* Needed for x86 CPU capabilities detection */
-# define cpuid( reg ) \
- asm volatile ( "push %%ebx\n\t" \
- "cpuid\n\t" \
- "movl %%ebx,%1\n\t" \
- "pop %%ebx\n\t" \
- : "=a" ( i_eax ), \
- "=r" ( i_ebx ), \
- "=c" ( i_ecx ), \
- "=d" ( i_edx ) \
- : "a" ( reg ) \
- : "cc" );
-
-# if defined( CAN_COMPILE_SSE ) || defined ( CAN_COMPILE_3DNOW ) \
- && defined( HAVE_SIGNAL_H )
- void (*pf_sigill) (int) = signal( SIGILL, SigHandler );
-# endif
+#if defined (CAN_COMPILE_ALTIVEC)
+static void Altivec_test (void) /* probe passed to vlc_CPU_check(): executes one AltiVec instruction */
+{
+ asm volatile ("mtspr 256, %0\n" "vand %%v0, %%v0, %%v0\n" : : "r" (-1)); /* writes -1 to SPR 256 (presumably VRSAVE - confirm), then runs vand as the instruction under test */
+}
+#endif
+
+#else /* WIN32 || __OS2__ */
+# define vlc_CPU_check(name, func) (1)
+#endif
+#endif
- i_capabilities |= CPU_CAPABILITY_FPU;
+/**
+ * Determines the CPU capabilities and stores them in cpu_flags.
+ * The result can be retrieved with vlc_CPU().
+ */
+void vlc_CPU_init (void)
+{
+ uint32_t i_capabilities = 0;
+
+#if defined( __i386__ ) || defined( __x86_64__ )
+ unsigned int i_eax, i_ebx, i_ecx, i_edx;
+ bool b_amd;
+ /* Needed for x86 CPU capabilities detection */
+# if defined (__i386__) && defined (__PIC__)
+# define cpuid(reg) \
+ asm volatile ("xchgl %%ebx,%1\n\t" \
+ "cpuid\n\t" \
+ "xchgl %%ebx,%1\n\t" \
+ : "=a" (i_eax), "=r" (i_ebx), "=c" (i_ecx), "=d" (i_edx) \
+ : "a" (reg) \
+ : "cc");
+# else
+# define cpuid(reg) \
+ asm volatile ("cpuid\n\t" \
+ : "=a" (i_eax), "=b" (i_ebx), "=c" (i_ecx), "=d" (i_edx) \
+ : "a" (reg) \
+ : "cc");
+# endif
+ /* Check if the OS really supports the requested instructions */
+# if defined (__i386__) && !defined (__i486__) && !defined (__i586__) \
+ && !defined (__i686__) && !defined (__pentium4__) \
+ && !defined (__k6__) && !defined (__athlon__) && !defined (__k8__)
+ /* check if cpuid instruction is supported */
asm volatile ( "push %%ebx\n\t"
"pushf\n\t"
"pop %%eax\n\t"
: "cc" );
if( i_eax == i_ebx )
- {
-# if defined( CAN_COMPILE_SSE ) || defined ( CAN_COMPILE_3DNOW ) \
- && defined( HAVE_SIGNAL_H )
- signal( SIGILL, pf_sigill );
-# endif
- return i_capabilities;
- }
-
- i_capabilities |= CPU_CAPABILITY_486;
+ goto out;
+# endif
/* the CPU supports the CPUID instruction - get its level */
cpuid( 0x00000000 );
+# if defined (__i386__) && !defined (__i586__) \
+ && !defined (__i686__) && !defined (__pentium4__) \
+ && !defined (__k6__) && !defined (__athlon__) && !defined (__k8__)
if( !i_eax )
- {
-# if defined( CAN_COMPILE_SSE ) || defined ( CAN_COMPILE_3DNOW ) \
- && defined( HAVE_SIGNAL_H )
- signal( SIGILL, pf_sigill );
-# endif
- return i_capabilities;
- }
-
- /* FIXME: this isn't correct, since some 486s have cpuid */
- i_capabilities |= CPU_CAPABILITY_586;
+ goto out;
+#endif
/* borrowed from mpeg2dec */
b_amd = ( i_ebx == 0x68747541 ) && ( i_ecx == 0x444d4163 )
/* test for the MMX flag */
cpuid( 0x00000001 );
-
+# if !defined (__MMX__)
if( ! (i_edx & 0x00800000) )
- {
-# if defined( CAN_COMPILE_SSE ) || defined ( CAN_COMPILE_3DNOW ) \
- && defined( HAVE_SIGNAL_H )
- signal( SIGILL, pf_sigill );
-# endif
- return i_capabilities;
- }
-
+ goto out;
+# endif
i_capabilities |= CPU_CAPABILITY_MMX;
+# if defined (__SSE__)
+ i_capabilities |= CPU_CAPABILITY_MMXEXT | CPU_CAPABILITY_SSE;
+# else
if( i_edx & 0x02000000 )
{
i_capabilities |= CPU_CAPABILITY_MMXEXT;
# ifdef CAN_COMPILE_SSE
- /* We test if OS supports the SSE instructions */
- psz_capability = "SSE";
- i_illegal = 0;
-
- if( setjmp( env ) == 0 )
- {
- /* Test a SSE instruction */
- __asm__ __volatile__ ( "xorps %%xmm0,%%xmm0\n" : : );
- }
-
- if( i_illegal == 0 )
- {
+ if (vlc_CPU_check ("SSE", SSE_test))
i_capabilities |= CPU_CAPABILITY_SSE;
- }
-# endif
- }
-
- if( i_edx & 0x04000000 )
- {
-# if defined(CAN_COMPILE_SSE)
- /* We test if OS supports the SSE instructions */
- psz_capability = "SSE2";
- i_illegal = 0;
-
- if( setjmp( env ) == 0 )
- {
- /* Test a SSE2 instruction */
- __asm__ __volatile__ ( "movupd %%xmm0, %%xmm0\n" : : );
- }
-
- if( i_illegal == 0 )
- {
- i_capabilities |= CPU_CAPABILITY_SSE2;
- }
# endif
}
+# endif
+
+# if defined (__SSE2__)
+ i_capabilities |= CPU_CAPABILITY_SSE2;
+# elif defined (CAN_COMPILE_SSE2)
+ if ((i_edx & 0x04000000) && vlc_CPU_check ("SSE2", SSE2_test))
+ i_capabilities |= CPU_CAPABILITY_SSE2;
+# endif
+
+# if defined (__SSE3__)
+ i_capabilities |= CPU_CAPABILITY_SSE3;
+# elif defined (CAN_COMPILE_SSE3)
+ if ((i_ecx & 0x00000001) && vlc_CPU_check ("SSE3", SSE3_test))
+ i_capabilities |= CPU_CAPABILITY_SSE3;
+# endif
+
+# if defined (__SSSE3__)
+ i_capabilities |= CPU_CAPABILITY_SSSE3;
+# elif defined (CAN_COMPILE_SSSE3)
+ if ((i_ecx & 0x00000200) && vlc_CPU_check ("SSSE3", SSSE3_test))
+ i_capabilities |= CPU_CAPABILITY_SSSE3;
+# endif
+
+# if defined (__SSE4_1__)
+ i_capabilities |= CPU_CAPABILITY_SSE4_1;
+# elif defined (CAN_COMPILE_SSE4_1)
+ if ((i_ecx & 0x00080000) && vlc_CPU_check ("SSE4.1", SSE4_1_test))
+ i_capabilities |= CPU_CAPABILITY_SSE4_1;
+# endif
+
+# if defined (__SSE4_2__)
+ i_capabilities |= CPU_CAPABILITY_SSE4_2;
+# elif defined (CAN_COMPILE_SSE4_2)
+ if ((i_ecx & 0x00100000) && vlc_CPU_check ("SSE4.2", SSE4_2_test))
+ i_capabilities |= CPU_CAPABILITY_SSE4_2;
+# endif
/* test for additional capabilities */
cpuid( 0x80000000 );
if( i_eax < 0x80000001 )
- {
-# if defined( CAN_COMPILE_SSE ) || defined ( CAN_COMPILE_3DNOW ) \
- && defined( HAVE_SIGNAL_H )
- signal( SIGILL, pf_sigill );
-# endif
- return i_capabilities;
- }
+ goto out;
/* list these additional capabilities */
cpuid( 0x80000001 );
-# ifdef CAN_COMPILE_3DNOW
- if( i_edx & 0x80000000 )
- {
- psz_capability = "3D Now!";
- i_illegal = 0;
-
- if( setjmp( env ) == 0 )
- {
- /* Test a 3D Now! instruction */
- __asm__ __volatile__ ( "pfadd %%mm0,%%mm0\n" "femms\n" : : );
- }
-
- if( i_illegal == 0 )
- {
- i_capabilities |= CPU_CAPABILITY_3DNOW;
- }
- }
-# endif
+# if defined (__3dNOW__)
+ i_capabilities |= CPU_CAPABILITY_3DNOW;
+# elif defined (CAN_COMPILE_3DNOW)
+ if ((i_edx & 0x80000000) && vlc_CPU_check ("3D Now!", ThreeD_Now_test))
+ i_capabilities |= CPU_CAPABILITY_3DNOW;
+# endif
if( b_amd && ( i_edx & 0x00400000 ) )
{
i_capabilities |= CPU_CAPABILITY_MMXEXT;
}
+out:
-# if defined( CAN_COMPILE_SSE ) || defined ( CAN_COMPILE_3DNOW ) \
- && defined( HAVE_SIGNAL_H )
- signal( SIGILL, pf_sigill );
-# endif
- return i_capabilities;
-
-#elif defined( __powerpc__ )
-
-# ifdef CAN_COMPILE_ALTIVEC && defined( HAVE_SIGNAL_H )
- void (*pf_sigill) (int) = signal( SIGILL, SigHandler );
-
- i_capabilities |= CPU_CAPABILITY_FPU;
+#elif defined( __powerpc__ ) || defined( __ppc__ ) || defined( __powerpc64__ ) \
+ || defined( __ppc64__ )
- i_illegal = 0;
+# if defined(__APPLE__) || defined(__OpenBSD__)
+# if defined(__OpenBSD__)
+ int selectors[2] = { CTL_MACHDEP, CPU_ALTIVEC };
+# else
+ int selectors[2] = { CTL_HW, HW_VECTORUNIT };
+# endif
+ int i_has_altivec = 0;
+ size_t i_length = sizeof( i_has_altivec );
+ int i_error = sysctl( selectors, 2, &i_has_altivec, &i_length, NULL, 0);
- if( setjmp( env ) == 0 )
- {
- asm volatile ("mtspr 256, %0\n\t"
- "vand %%v0, %%v0, %%v0"
- :
- : "r" (-1));
- }
+ if( i_error == 0 && i_has_altivec != 0 )
+ i_capabilities |= CPU_CAPABILITY_ALTIVEC;
- if( i_illegal == 0 )
- {
+# elif defined( CAN_COMPILE_ALTIVEC )
+ if (vlc_CPU_check ("Altivec", Altivec_test))
i_capabilities |= CPU_CAPABILITY_ALTIVEC;
- }
- signal( SIGILL, pf_sigill );
# endif
- return i_capabilities;
-
-#elif defined( __sparc__ )
-
- i_capabilities |= CPU_CAPABILITY_FPU;
- return i_capabilities;
-
-#elif defined( _MSC_VER ) && !defined( UNDER_CE )
- i_capabilities |= CPU_CAPABILITY_FPU;
- return i_capabilities;
+#endif
-#else
- /* default behaviour */
- return i_capabilities;
+ cpu_flags = i_capabilities;
+}
+/**
+ * Retrieves pre-computed CPU capability flags
+ */
+unsigned vlc_CPU (void)
+{
+#if !defined(WIN32) && !defined(__OS2__)
+    /* Run the detection once, on first use. Windows and OS/2 are excluded
+     * here: on those platforms the flags are initialized from DllMain() and
+     * _DLL_InitTerm() respectively, instead. */
+    static pthread_once_t detect_once = PTHREAD_ONCE_INIT;
+
+    pthread_once (&detect_once, vlc_CPU_init);
#endif
+    return cpu_flags;
}
+#endif
-/*****************************************************************************
- * SigHandler: system signal handler
- *****************************************************************************
- * This function is called when an illegal instruction signal is received by
- * the program. We use this function to test OS and CPU capabilities
- *****************************************************************************/
-#if defined( HAVE_SIGNAL_H )
-static void SigHandler( int i_signal )
+/**
+ * Logs the CPU capabilities returned by vlc_CPU() as one debug message.
+ * Nothing is logged when no capability name was appended.
+ *
+ * @param obj VLC object passed to msg_Dbg() as the logging context
+ */
+void vlc_CPU_dump (vlc_object_t *obj)
{
- /* Acknowledge the signal received */
- i_illegal = 1;
+    const unsigned flags = vlc_CPU();
+    /* 200 bytes is ample: the longest list built below (x86 plus FPU) is
+     * well under 100 characters. */
+    char buf[200], *p = buf;
+
+/* Appends "<string> " to buf when the capability bit is set in flags.
+ * Wrapped in do/while(0) so that it expands to exactly one statement. */
+#define PRINT_CAPABILITY( capability, string ) \
+    do { \
+        if (flags & (capability)) \
+            p += sprintf (p, "%s ", (string) ); \
+    } while (0)
+
+#if defined (__i386__) || defined (__x86_64__)
+    PRINT_CAPABILITY(CPU_CAPABILITY_MMX, "MMX");
+    PRINT_CAPABILITY(CPU_CAPABILITY_3DNOW, "3DNow!");
+    PRINT_CAPABILITY(CPU_CAPABILITY_MMXEXT, "MMXEXT");
+    PRINT_CAPABILITY(CPU_CAPABILITY_SSE, "SSE");
+    PRINT_CAPABILITY(CPU_CAPABILITY_SSE2, "SSE2");
+    PRINT_CAPABILITY(CPU_CAPABILITY_SSE3, "SSE3");
+    PRINT_CAPABILITY(CPU_CAPABILITY_SSSE3, "SSSE3");
+    PRINT_CAPABILITY(CPU_CAPABILITY_SSE4_1, "SSE4.1");
+    PRINT_CAPABILITY(CPU_CAPABILITY_SSE4_2, "SSE4.2");
+    PRINT_CAPABILITY(CPU_CAPABILITY_SSE4A, "SSE4A");
+
+/* Same set of PowerPC macros as the detection code in vlc_CPU_init() */
+#elif defined (__powerpc__) || defined (__ppc__) || defined (__ppc64__) \
+    || defined (__powerpc64__)
+    PRINT_CAPABILITY(CPU_CAPABILITY_ALTIVEC, "AltiVec");
+
+#elif defined (__arm__)
+    PRINT_CAPABILITY(CPU_CAPABILITY_NEON, "NEONv1");
-#ifdef HAVE_SIGRELSE
- sigrelse( i_signal );
-#endif
+#else
+    (void) flags;
-#if defined( __i386__ )
- fprintf( stderr, "warning: your CPU has %s instructions, but not your "
- "operating system.\n", psz_capability );
- fprintf( stderr, " some optimizations will be disabled unless "
- "you upgrade your OS\n" );
-# if defined( SYS_LINUX )
- fprintf( stderr, " (for instance Linux kernel 2.4.x or later)\n" );
-# endif
#endif
- longjmp( env, 1 );
-}
+#undef PRINT_CAPABILITY
+
+#if HAVE_FPU
+    p += sprintf (p, "FPU ");
#endif
+    if (p > buf)
+        msg_Dbg (obj, "CPU has capabilities %s", buf);
+}