| /* |
| * x86 feature check |
| * |
| * Copyright (C) 2013 Intel Corporation. All rights reserved. |
| * Author: |
| * Jim Kukunas |
| * |
| * For conditions of distribution and use, see copyright notice in zlib.h |
| */ |
| |
| #include "x86.h" |
| |
| int x86_cpu_enable_simd = 0; |
| |
| #ifndef _MSC_VER |
| #include <pthread.h> |
| |
| pthread_once_t cpu_check_inited_once = PTHREAD_ONCE_INIT; |
| static void _x86_check_features(void); |
| |
| void x86_check_features(void) |
| { |
| pthread_once(&cpu_check_inited_once, _x86_check_features); |
| } |
| |
| static void _x86_check_features(void) |
| { |
| int x86_cpu_has_sse2; |
| int x86_cpu_has_sse42; |
| int x86_cpu_has_pclmulqdq; |
| unsigned eax, ebx, ecx, edx; |
| |
| eax = 1; |
| #ifdef __i386__ |
| __asm__ __volatile__ ( |
| "xchg %%ebx, %1\n\t" |
| "cpuid\n\t" |
| "xchg %1, %%ebx\n\t" |
| : "+a" (eax), "=S" (ebx), "=c" (ecx), "=d" (edx) |
| ); |
| #else |
| __asm__ __volatile__ ( |
| "cpuid\n\t" |
| : "+a" (eax), "=b" (ebx), "=c" (ecx), "=d" (edx) |
| ); |
| #endif /* (__i386__) */ |
| |
| x86_cpu_has_sse2 = edx & 0x4000000; |
| x86_cpu_has_sse42 = ecx & 0x100000; |
| x86_cpu_has_pclmulqdq = ecx & 0x2; |
| |
| x86_cpu_enable_simd = x86_cpu_has_sse2 && |
| x86_cpu_has_sse42 && |
| x86_cpu_has_pclmulqdq; |
| } |
| #else |
| #include <intrin.h> |
| #include <windows.h> |
| #include <stdint.h> |
| |
| static volatile int32_t once_control = 0; |
| static void _x86_check_features(void); |
| static int fake_pthread_once(volatile int32_t *once_control, |
| void (*init_routine)(void)); |
| |
| void x86_check_features(void) |
| { |
| fake_pthread_once(&once_control, _x86_check_features); |
| } |
| |
| /* Copied from "perftools_pthread_once" in tcmalloc */ |
| static int fake_pthread_once(volatile int32_t *once_control, |
| void (*init_routine)(void)) { |
| // Try for a fast path first. Note: this should be an acquire semantics read |
| // It is on x86 and x64, where Windows runs. |
| if (*once_control != 1) { |
| while (1) { |
| switch (InterlockedCompareExchange(once_control, 2, 0)) { |
| case 0: |
| init_routine(); |
| InterlockedExchange(once_control, 1); |
| return 0; |
| case 1: |
| // The initializer has already been executed |
| return 0; |
| default: |
| // The initializer is being processed by another thread |
| SwitchToThread(); |
| } |
| } |
| } |
| return 0; |
| } |
| |
| static void _x86_check_features(void) |
| { |
| int x86_cpu_has_sse2; |
| int x86_cpu_has_sse42; |
| int x86_cpu_has_pclmulqdq; |
| int regs[4]; |
| |
| __cpuid(regs, 1); |
| |
| x86_cpu_has_sse2 = regs[3] & 0x4000000; |
| x86_cpu_has_sse42= regs[2] & 0x100000; |
| x86_cpu_has_pclmulqdq = regs[2] & 0x2; |
| |
| x86_cpu_enable_simd = x86_cpu_has_sse2 && |
| x86_cpu_has_sse42 && |
| x86_cpu_has_pclmulqdq; |
| } |
| #endif /* _MSC_VER */ |