RetroArch/libretro-common/features/features_cpu.c

728 lines
20 KiB
C
Raw Normal View History

/* Copyright (C) 2010-2016 The RetroArch team
*
* ---------------------------------------------------------------------------------------
* The following license statement only applies to this file (features_cpu.c).
* ---------------------------------------------------------------------------------------
*
* Permission is hereby granted, free of charge,
* to any person obtaining a copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation the rights to
* use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software,
* and to permit persons to whom the Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,
* INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
* WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*/
2013-11-27 22:36:46 +00:00
#include <stdio.h>
#include <stdlib.h>
2016-05-10 07:17:04 +00:00
#if defined(_WIN32)
#include <direct.h>
#else
2013-02-05 08:41:10 +00:00
#include <unistd.h>
#endif
2012-11-01 21:31:24 +00:00
2016-05-10 16:43:23 +00:00
#include <compat/strl.h>
#include <streams/file_stream.h>
#include <libretro.h>
2016-05-13 23:32:05 +00:00
#include <features/features_cpu.h>
2016-05-10 16:43:23 +00:00
2013-12-13 02:58:58 +00:00
#if defined(_WIN32) && !defined(_XBOX)
#include <windows.h>
2013-12-29 10:48:00 +00:00
#include <intrin.h>
2013-12-13 02:58:58 +00:00
#endif
#if defined(__CELLOS_LV2__)
#ifndef _PPU_INTRINSICS_H
#include <ppu_intrinsics.h>
#endif
2012-10-01 20:25:13 +00:00
#elif defined(_XBOX360)
#include <PPCIntrinsics.h>
#elif defined(_POSIX_MONOTONIC_CLOCK) || defined(ANDROID) || defined(__QNX__)
2015-06-26 16:35:35 +00:00
/* POSIX_MONOTONIC_CLOCK is not being defined in Android headers despite support being present. */
2013-02-05 08:41:10 +00:00
#include <time.h>
#endif
#if defined(__QNX__) && !defined(CLOCK_MONOTONIC)
#define CLOCK_MONOTONIC 2
#endif
#if defined(PSP)
#include <sys/time.h>
#include <psprtc.h>
#endif
#if defined(VITA)
#include <psp2/kernel/processmgr.h>
#include <psp2/rtc.h>
#endif
2013-02-05 08:41:10 +00:00
#if defined(__PSL1GHT__)
2012-10-16 17:55:39 +00:00
#include <sys/time.h>
2013-02-05 08:41:10 +00:00
#elif defined(__CELLOS_LV2__)
#include <sys/sys_time.h>
#endif
#ifdef GEKKO
#include <ogc/lwp_watchdog.h>
#endif
2015-06-26 16:35:35 +00:00
/* iOS/OSX specific. Lacks clock_gettime(), so implement it. */
2013-02-05 08:41:10 +00:00
#ifdef __MACH__
#include <sys/time.h>
#ifndef CLOCK_MONOTONIC
#define CLOCK_MONOTONIC 0
#endif
#ifndef CLOCK_REALTIME
#define CLOCK_REALTIME 0
#endif
static int clock_gettime(int clk_ik, struct timespec *t)
{
struct timeval now;
int rv = gettimeofday(&now, NULL);
if (rv)
return rv;
t->tv_sec = now.tv_sec;
t->tv_nsec = now.tv_usec * 1000;
return 0;
}
2013-02-05 08:41:10 +00:00
#endif
#ifdef EMSCRIPTEN
#include <emscripten.h>
#endif
#if defined(BSD) || defined(__APPLE__)
#include <sys/sysctl.h>
#endif
#include <string.h>
/**
2016-05-10 07:17:04 +00:00
* cpu_features_get_perf_counter:
*
* Gets performance counter.
*
* Returns: performance counter.
**/
2016-05-10 07:17:04 +00:00
retro_perf_tick_t cpu_features_get_perf_counter(void)
{
retro_perf_tick_t time_ticks = 0;
#if defined(_WIN32)
long tv_sec, tv_usec;
2016-05-14 00:54:56 +00:00
static const unsigned __int64 epoch = 11644473600000000ULL;
FILETIME file_time;
SYSTEMTIME system_time;
ULARGE_INTEGER ularge;
GetSystemTime(&system_time);
SystemTimeToFileTime(&system_time, &file_time);
2016-05-14 00:54:56 +00:00
ularge.LowPart = file_time.dwLowDateTime;
ularge.HighPart = file_time.dwHighDateTime;
2016-05-14 00:54:56 +00:00
tv_sec = (long)((ularge.QuadPart - epoch) / 10000000L);
tv_usec = (long)(system_time.wMilliseconds * 1000);
time_ticks = (1000000 * tv_sec + tv_usec);
#elif defined(__linux__) || defined(__QNX__) || defined(__MACH__)
2012-10-16 17:55:39 +00:00
struct timespec tv;
if (clock_gettime(CLOCK_MONOTONIC, &tv) == 0)
time_ticks = (retro_perf_tick_t)tv.tv_sec * 1000000000 +
2014-09-15 05:03:54 +00:00
(retro_perf_tick_t)tv.tv_nsec;
2012-10-16 17:55:39 +00:00
2016-05-10 07:17:04 +00:00
#elif defined(__GNUC__) && defined(__i386__) || defined(__i486__) || defined(__i686__)
2015-06-26 15:03:05 +00:00
__asm__ volatile ("rdtsc" : "=A" (time_ticks));
2016-05-10 07:17:04 +00:00
#elif defined(__GNUC__) && defined(__x86_64__)
unsigned a, d;
2015-06-26 15:03:05 +00:00
__asm__ volatile ("rdtsc" : "=a" (a), "=d" (d));
time_ticks = (retro_perf_tick_t)a | ((retro_perf_tick_t)d << 32);
2013-02-05 08:41:10 +00:00
#elif defined(__ARM_ARCH_6__)
2015-06-26 15:03:05 +00:00
__asm__ volatile( "mrc p15, 0, %0, c9, c13, 0" : "=r"(time_ticks) );
#elif defined(__CELLOS_LV2__) || defined(_XBOX360) || defined(__powerpc__) || defined(__ppc__) || defined(__POWERPC__)
time_ticks = __mftb();
#elif defined(GEKKO)
time_ticks = gettime();
#elif defined(PSP) || defined(VITA)
sceRtcGetCurrentTick(&time_ticks);
2015-04-01 21:14:13 +00:00
#elif defined(_3DS)
time_ticks = svcGetSystemTick();
#elif defined(__mips__)
struct timeval tv;
gettimeofday(&tv,NULL);
time_ticks = (1000000 * tv.tv_sec + tv.tv_usec);
#endif
return time_ticks;
}
2012-11-01 21:31:24 +00:00
/**
2016-05-10 07:17:04 +00:00
* cpu_features_get_time_usec:
*
* Gets time in microseconds.
*
* Returns: time in microseconds.
**/
2016-05-10 07:17:04 +00:00
retro_time_t cpu_features_get_time_usec(void)
2013-02-05 08:41:10 +00:00
{
#if defined(_WIN32)
static LARGE_INTEGER freq;
2015-04-12 17:18:00 +00:00
LARGE_INTEGER count;
2014-09-15 05:03:54 +00:00
/* Frequency is guaranteed to not change. */
if (!freq.QuadPart && !QueryPerformanceFrequency(&freq))
return 0;
if (!QueryPerformanceCounter(&count))
return 0;
return count.QuadPart * 1000000 / freq.QuadPart;
2013-02-05 08:41:10 +00:00
#elif defined(__CELLOS_LV2__)
return sys_time_get_system_time();
#elif defined(GEKKO)
return ticks_to_microsecs(gettime());
#elif defined(_POSIX_MONOTONIC_CLOCK) || defined(__QNX__) || defined(ANDROID) || defined(__MACH__)
2015-06-02 14:51:10 +00:00
struct timespec tv = {0};
2013-02-05 08:41:10 +00:00
if (clock_gettime(CLOCK_MONOTONIC, &tv) < 0)
return 0;
2013-02-05 20:42:30 +00:00
return tv.tv_sec * INT64_C(1000000) + (tv.tv_nsec + 500) / 1000;
#elif defined(EMSCRIPTEN)
return emscripten_get_now() * 1000;
#elif defined(__mips__)
struct timeval tv;
gettimeofday(&tv,NULL);
return (1000000 * tv.tv_sec + tv.tv_usec);
2015-04-01 21:14:13 +00:00
#elif defined(_3DS)
2015-04-02 02:58:53 +00:00
return osGetTime() * 1000;
#elif defined(VITA)
return sceKernelGetProcessTimeWide();
2013-02-05 08:41:10 +00:00
#else
2016-05-10 07:17:04 +00:00
#error "Your platform does not have a timer function implemented in cpu_features_get_time_usec(). Cannot continue."
2013-02-05 08:41:10 +00:00
#endif
}
2012-11-01 21:31:24 +00:00
#if defined(__x86_64__) || defined(__i386__) || defined(__i486__) || defined(__i686__)
#define CPU_X86
#endif
2012-11-10 12:46:24 +00:00
#if defined(_MSC_VER) && !defined(_XBOX)
2012-11-01 21:31:24 +00:00
#include <intrin.h>
#endif
2016-01-20 23:56:47 +00:00
#if defined(CPU_X86) && !defined(__MACH__)
2015-12-25 05:10:29 +00:00
void x86_cpuid(int func, int flags[4])
2012-11-01 21:31:24 +00:00
{
/* On Android, we compile RetroArch with PIC, and we
2014-09-15 05:03:54 +00:00
* are not allowed to clobber the ebx register. */
2012-11-02 20:25:54 +00:00
#ifdef __x86_64__
#define REG_b "rbx"
#define REG_S "rsi"
#else
#define REG_b "ebx"
#define REG_S "esi"
#endif
#if defined(__GNUC__)
2015-06-26 15:03:05 +00:00
__asm__ volatile (
2012-11-03 21:22:49 +00:00
"mov %%" REG_b ", %%" REG_S "\n"
2012-11-02 20:25:54 +00:00
"cpuid\n"
2012-11-03 21:22:49 +00:00
"xchg %%" REG_b ", %%" REG_S "\n"
2012-11-02 20:25:54 +00:00
: "=a"(flags[0]), "=S"(flags[1]), "=c"(flags[2]), "=d"(flags[3])
: "a"(func));
2012-11-01 21:31:24 +00:00
#elif defined(_MSC_VER)
__cpuid(flags, func);
#else
2016-05-10 07:17:04 +00:00
printf("Unknown compiler. Cannot check CPUID with inline assembly.\n");
memset(flags, 0, 4 * sizeof(int));
2012-11-01 21:31:24 +00:00
#endif
}
2014-09-15 05:03:54 +00:00
/* Only runs on i686 and above. Needs to be conditionally run. */
2014-10-20 22:11:50 +00:00
static uint64_t xgetbv_x86(uint32_t idx)
{
2013-12-29 10:48:00 +00:00
#if defined(__GNUC__)
uint32_t eax, edx;
2015-06-26 15:03:05 +00:00
__asm__ volatile (
/* Older GCC versions (Apple's GCC for example) do
2014-09-15 05:03:54 +00:00
* not understand xgetbv instruction.
* Stamp out the machine code directly.
*/
2013-12-29 10:48:00 +00:00
".byte 0x0f, 0x01, 0xd0\n"
2014-10-20 22:11:50 +00:00
: "=a"(eax), "=d"(edx) : "c"(idx));
return ((uint64_t)edx << 32) | eax;
2014-09-15 05:03:54 +00:00
#elif _MSC_FULL_VER >= 160040219
/* Intrinsic only works on 2010 SP1 and above. */
2014-10-20 22:11:50 +00:00
return _xgetbv(idx);
2013-12-29 10:48:00 +00:00
#else
2016-05-10 07:17:04 +00:00
printf("Unknown compiler. Cannot check xgetbv bits.\n");
2013-12-29 10:48:00 +00:00
return 0;
#endif
}
2012-11-01 21:31:24 +00:00
#endif
2015-09-17 23:21:24 +00:00
#if defined(__ARM_NEON__)
static void arm_enable_runfast_mode(void)
{
/* RunFast mode. Enables flush-to-zero and some
2014-09-15 05:03:54 +00:00
* floating point optimizations. */
2013-12-30 09:19:32 +00:00
static const unsigned x = 0x04086060;
static const unsigned y = 0x03000000;
int r;
2015-06-26 15:03:05 +00:00
__asm__ volatile(
2014-09-15 05:03:54 +00:00
"fmrx %0, fpscr \n\t" /* r0 = FPSCR */
"and %0, %0, %1 \n\t" /* r0 = r0 & 0x04086060 */
"orr %0, %0, %2 \n\t" /* r0 = r0 | 0x03000000 */
"fmxr fpscr, %0 \n\t" /* FPSCR = r0 */
: "=r"(r)
: "r"(x), "r"(y)
);
}
#endif
2016-05-12 10:22:32 +00:00
#if defined(__linux__) && !defined(CPU_X86)
static unsigned char check_arm_cpu_feature(const char* feature)
{
2016-06-02 22:17:09 +00:00
char line[1024];
unsigned char status = 0;
2016-06-03 01:14:42 +00:00
RFILE *fp = filestream_open("/proc/cpuinfo", RFILE_MODE_READ_TEXT, -1);
2016-06-02 22:17:09 +00:00
if (!fp)
return 0;
while (filestream_gets(fp, line, sizeof(line)) != NULL)
{
2016-06-02 22:17:09 +00:00
if (strncmp(line, "Features\t: ", 11))
continue;
2016-06-02 22:17:09 +00:00
if (strstr(line + 11, feature) != NULL)
status = 1;
2016-06-02 22:17:09 +00:00
break;
}
2016-06-02 22:17:09 +00:00
filestream_close(fp);
return status;
}
#if !defined(_SC_NPROCESSORS_ONLN)
/* Parse an decimal integer starting from 'input', but not going further
* than 'limit'. Return the value into '*result'.
*
* NOTE: Does not skip over leading spaces, or deal with sign characters.
* NOTE: Ignores overflows.
*
* The function returns NULL in case of error (bad format), or the new
* position after the decimal number in case of success (which will always
* be <= 'limit').
*/
static const char *parse_decimal(const char* input,
const char* limit, int* result)
{
const char* p = input;
int val = 0;
while (p < limit)
{
int d = (*p - '0');
if ((unsigned)d >= 10U)
break;
val = val*10 + d;
p++;
}
if (p == input)
return NULL;
*result = val;
return p;
}
/* Parse a textual list of cpus and store the result inside a CpuList object.
* Input format is the following:
* - comma-separated list of items (no spaces)
* - each item is either a single decimal number (cpu index), or a range made
* of two numbers separated by a single dash (-). Ranges are inclusive.
*
* Examples: 0
* 2,4-127,128-143
* 0-1
*/
static void cpulist_parse(CpuList* list, char **buf, ssize_t length)
{
const char* p = (const char*)buf;
const char* end = p + length;
/* NOTE: the input line coming from sysfs typically contains a
* trailing newline, so take care of it in the code below
*/
while (p < end && *p != '\n')
{
int val, start_value, end_value;
/* Find the end of current item, and put it into 'q' */
const char *q = (const char*)memchr(p, ',', end-p);
if (!q)
q = end;
/* Get first value */
p = parse_decimal(p, q, &start_value);
if (p == NULL)
return;
end_value = start_value;
/* If we're not at the end of the item, expect a dash and
* and integer; extract end value.
*/
if (p < q && *p == '-')
{
p = parse_decimal(p+1, q, &end_value);
if (p == NULL)
return;
}
/* Set bits CPU list bits */
for (val = start_value; val <= end_value; val++)
{
if ((unsigned)val < 32)
list->mask |= (uint32_t)(1U << val);
}
/* Jump to next item */
p = q;
if (p < end)
p++;
}
}
/* Read a CPU list from one sysfs file */
static void cpulist_read_from(CpuList* list, const char* filename)
{
ssize_t length;
char *buf = NULL;
list->mask = 0;
if (filestream_read_file(filename, (void**)&buf, &length) != 1)
return;
cpulist_parse(list, &buf, length);
if (buf)
free(buf);
buf = NULL;
}
#endif
#endif
/**
2016-05-10 07:17:04 +00:00
* cpu_features_get_core_amount:
*
* Gets the amount of available CPU cores.
*
* Returns: amount of CPU cores available.
**/
2016-05-10 07:17:04 +00:00
unsigned cpu_features_get_core_amount(void)
{
2014-09-15 05:03:54 +00:00
#if defined(_WIN32) && !defined(_XBOX)
/* Win32 */
SYSTEM_INFO sysinfo;
GetSystemInfo(&sysinfo);
return sysinfo.dwNumberOfProcessors;
#elif defined(GEKKO)
return 1;
#elif defined(PSP)
return 1;
#elif defined(VITA)
return 4;
2015-04-01 21:14:13 +00:00
#elif defined(_3DS)
return 1;
2014-09-15 05:03:54 +00:00
#elif defined(_SC_NPROCESSORS_ONLN)
/* Linux, most UNIX-likes. */
long ret = sysconf(_SC_NPROCESSORS_ONLN);
if (ret <= 0)
2014-04-19 18:16:29 +00:00
return (unsigned)1;
return ret;
2014-09-15 05:03:54 +00:00
#elif defined(BSD) || defined(__APPLE__)
/* BSD */
/* Copypasta from stackoverflow, dunno if it works. */
int num_cpu = 0;
int mib[4];
size_t len = sizeof(num_cpu);
mib[0] = CTL_HW;
mib[1] = HW_AVAILCPU;
sysctl(mib, 2, &num_cpu, &len, NULL, 0);
if (num_cpu < 1)
{
mib[1] = HW_NCPU;
sysctl(mib, 2, &num_cpu, &len, NULL, 0);
if (num_cpu < 1)
num_cpu = 1;
}
return num_cpu;
#elif defined(__linux__)
CpuList cpus_present[1];
CpuList cpus_possible[1];
int amount = 0;
cpulist_read_from(cpus_present, "/sys/devices/system/cpu/present");
cpulist_read_from(cpus_possible, "/sys/devices/system/cpu/possible");
/* Compute the intersection of both sets to get the actual number of
* CPU cores that can be used on this device by the kernel.
*/
cpus_present->mask &= cpus_possible->mask;
amount = __builtin_popcount(cpus_present->mask);
if (amount == 0)
return 1;
return amount;
#elif defined(_XBOX360)
return 3;
#else
2014-09-15 05:03:54 +00:00
/* No idea, assume single core. */
return 1;
#endif
}
2015-12-25 05:17:17 +00:00
/* According to http://en.wikipedia.org/wiki/CPUID */
#define VENDOR_INTEL_b 0x756e6547
#define VENDOR_INTEL_c 0x6c65746e
#define VENDOR_INTEL_d 0x49656e69
/**
2016-05-10 07:17:04 +00:00
* cpu_features_get:
*
* Gets CPU features..
*
* Returns: bitmask of all CPU features available.
**/
2016-05-10 07:17:04 +00:00
uint64_t cpu_features_get(void)
2012-11-01 21:31:24 +00:00
{
2015-04-12 17:18:00 +00:00
int flags[4];
2015-06-26 17:22:21 +00:00
int vendor_shuffle[3];
2015-06-30 13:49:40 +00:00
char vendor[13] = {0};
size_t len = 0;
2015-06-30 13:49:40 +00:00
uint64_t cpu_flags = 0;
uint64_t cpu = 0;
unsigned max_flag = 0;
#if defined(CPU_X86) && !defined(__MACH__)
2015-12-25 05:17:17 +00:00
int vendor_is_intel = 0;
2015-06-26 17:22:21 +00:00
const int avx_flags = (1 << 27) | (1 << 28);
#endif
2014-10-09 23:05:39 +00:00
2015-06-26 16:35:35 +00:00
char buf[sizeof(" MMX MMXEXT SSE SSE2 SSE3 SSSE3 SS4 SSE4.2 AES AVX AVX2 NEON VMX VMX128 VFPU PS")];
memset(buf, 0, sizeof(buf));
2016-02-25 23:47:53 +00:00
(void)len;
2015-06-26 17:22:21 +00:00
(void)cpu_flags;
2015-04-12 17:18:00 +00:00
(void)flags;
2015-06-27 15:26:35 +00:00
(void)max_flag;
2015-06-26 17:22:21 +00:00
(void)vendor;
(void)vendor_shuffle;
2015-04-12 17:18:00 +00:00
#if defined(__MACH__)
2016-02-25 23:47:53 +00:00
len = sizeof(size_t);
if (sysctlbyname("hw.optional.mmx", NULL, &len, NULL, 0) == 0)
{
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_MMX;
cpu |= RETRO_SIMD_MMXEXT;
}
len = sizeof(size_t);
if (sysctlbyname("hw.optional.sse", NULL, &len, NULL, 0) == 0)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_SSE;
len = sizeof(size_t);
if (sysctlbyname("hw.optional.sse2", NULL, &len, NULL, 0) == 0)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_SSE2;
len = sizeof(size_t);
if (sysctlbyname("hw.optional.sse3", NULL, &len, NULL, 0) == 0)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_SSE3;
len = sizeof(size_t);
if (sysctlbyname("hw.optional.supplementalsse3", NULL, &len, NULL, 0) == 0)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_SSSE3;
len = sizeof(size_t);
if (sysctlbyname("hw.optional.sse4_1", NULL, &len, NULL, 0) == 0)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_SSE4;
len = sizeof(size_t);
if (sysctlbyname("hw.optional.sse4_2", NULL, &len, NULL, 0) == 0)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_SSE42;
len = sizeof(size_t);
if (sysctlbyname("hw.optional.aes", NULL, &len, NULL, 0) == 0)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_AES;
len = sizeof(size_t);
if (sysctlbyname("hw.optional.avx1_0", NULL, &len, NULL, 0) == 0)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_AVX;
len = sizeof(size_t);
if (sysctlbyname("hw.optional.avx2_0", NULL, &len, NULL, 0) == 0)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_AVX2;
len = sizeof(size_t);
if (sysctlbyname("hw.optional.altivec", NULL, &len, NULL, 0) == 0)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_VMX;
len = sizeof(size_t);
if (sysctlbyname("hw.optional.neon", NULL, &len, NULL, 0) == 0)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_NEON;
#elif defined(CPU_X86)
2015-06-26 17:22:21 +00:00
(void)avx_flags;
2012-11-01 21:31:24 +00:00
2015-06-26 17:22:21 +00:00
x86_cpuid(0, flags);
vendor_shuffle[0] = flags[1];
vendor_shuffle[1] = flags[3];
vendor_shuffle[2] = flags[2];
2012-11-01 21:31:24 +00:00
memcpy(vendor, vendor_shuffle, sizeof(vendor_shuffle));
2015-06-26 17:22:21 +00:00
2016-05-14 21:20:35 +00:00
/* printf("[CPUID]: Vendor: %s\n", vendor); */
2012-11-01 21:31:24 +00:00
2015-12-25 05:17:17 +00:00
vendor_is_intel = (
flags[1] == VENDOR_INTEL_b &&
flags[2] == VENDOR_INTEL_c &&
flags[3] == VENDOR_INTEL_d);
2015-06-26 17:22:21 +00:00
max_flag = flags[0];
2014-09-15 05:03:54 +00:00
if (max_flag < 1) /* Does CPUID not support func = 1? (unlikely ...) */
return 0;
2012-11-01 21:31:24 +00:00
x86_cpuid(1, flags);
2013-12-25 20:34:03 +00:00
if (flags[3] & (1 << 23))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_MMX;
2013-12-25 20:34:03 +00:00
2012-11-05 10:57:40 +00:00
if (flags[3] & (1 << 25))
{
2014-09-15 05:03:54 +00:00
/* SSE also implies MMXEXT (according to FFmpeg source). */
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_SSE;
cpu |= RETRO_SIMD_MMXEXT;
}
2012-11-05 10:57:40 +00:00
if (flags[3] & (1 << 26))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_SSE2;
2012-11-01 21:31:24 +00:00
if (flags[2] & (1 << 0))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_SSE3;
2013-12-12 09:56:21 +00:00
if (flags[2] & (1 << 9))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_SSSE3;
2013-12-12 09:56:21 +00:00
if (flags[2] & (1 << 19))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_SSE4;
if (flags[2] & (1 << 20))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_SSE42;
if ((flags[2] & (1 << 23)))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_POPCNT;
2015-12-25 05:17:17 +00:00
if (vendor_is_intel && (flags[2] & (1 << 22)))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_MOVBE;
2015-12-25 05:17:17 +00:00
2014-09-02 18:50:43 +00:00
if (flags[2] & (1 << 25))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_AES;
2014-09-02 18:50:43 +00:00
2014-09-15 05:03:54 +00:00
/* Must only perform xgetbv check if we have
2014-09-15 05:03:54 +00:00
* AVX CPU support (guaranteed to have at least i686). */
if (((flags[2] & avx_flags) == avx_flags)
2014-09-15 05:03:54 +00:00
&& ((xgetbv_x86(0) & 0x6) == 0x6))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_AVX;
if (max_flag >= 7)
{
x86_cpuid(7, flags);
if (flags[1] & (1 << 5))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_AVX2;
}
x86_cpuid(0x80000000, flags);
max_flag = flags[0];
if (max_flag >= 0x80000001u)
{
x86_cpuid(0x80000001, flags);
if (flags[3] & (1 << 23))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_MMX;
if (flags[3] & (1 << 22))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_MMXEXT;
}
#elif defined(__linux__)
if (check_arm_cpu_feature("neon"))
{
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_NEON;
#ifdef __ARM_NEON__
arm_enable_runfast_mode();
#endif
}
if (check_arm_cpu_feature("vfpv3"))
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_VFPV3;
if (check_arm_cpu_feature("vfpv4"))
cpu |= RETRO_SIMD_VFPV4;
#if 0
check_arm_cpu_feature("swp");
check_arm_cpu_feature("half");
check_arm_cpu_feature("thumb");
check_arm_cpu_feature("fastmult");
check_arm_cpu_feature("vfp");
check_arm_cpu_feature("edsp");
check_arm_cpu_feature("thumbee");
check_arm_cpu_feature("tls");
check_arm_cpu_feature("idiva");
check_arm_cpu_feature("idivt");
#endif
#elif defined(__ARM_NEON__)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_NEON;
arm_enable_runfast_mode();
#elif defined(__ALTIVEC__)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_VMX;
#elif defined(XBOX360)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_VMX128;
2014-02-16 16:32:54 +00:00
#elif defined(PSP)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_VFPU;
#elif defined(GEKKO)
2016-05-10 16:43:23 +00:00
cpu |= RETRO_SIMD_PS;
#endif
2016-05-10 16:43:23 +00:00
if (cpu & RETRO_SIMD_MMX) strlcat(buf, " MMX", sizeof(buf));
if (cpu & RETRO_SIMD_MMXEXT) strlcat(buf, " MMXEXT", sizeof(buf));
if (cpu & RETRO_SIMD_SSE) strlcat(buf, " SSE", sizeof(buf));
if (cpu & RETRO_SIMD_SSE2) strlcat(buf, " SSE2", sizeof(buf));
if (cpu & RETRO_SIMD_SSE3) strlcat(buf, " SSE3", sizeof(buf));
if (cpu & RETRO_SIMD_SSSE3) strlcat(buf, " SSSE3", sizeof(buf));
if (cpu & RETRO_SIMD_SSE4) strlcat(buf, " SSE4", sizeof(buf));
if (cpu & RETRO_SIMD_SSE42) strlcat(buf, " SSE4.2", sizeof(buf));
if (cpu & RETRO_SIMD_AES) strlcat(buf, " AES", sizeof(buf));
if (cpu & RETRO_SIMD_AVX) strlcat(buf, " AVX", sizeof(buf));
if (cpu & RETRO_SIMD_AVX2) strlcat(buf, " AVX2", sizeof(buf));
if (cpu & RETRO_SIMD_NEON) strlcat(buf, " NEON", sizeof(buf));
if (cpu & RETRO_SIMD_VFPV3) strlcat(buf, " VFPv3", sizeof(buf));
if (cpu & RETRO_SIMD_VFPV4) strlcat(buf, " VFPv4", sizeof(buf));
if (cpu & RETRO_SIMD_VMX) strlcat(buf, " VMX", sizeof(buf));
if (cpu & RETRO_SIMD_VMX128) strlcat(buf, " VMX128", sizeof(buf));
if (cpu & RETRO_SIMD_VFPU) strlcat(buf, " VFPU", sizeof(buf));
if (cpu & RETRO_SIMD_PS) strlcat(buf, " PS", sizeof(buf));
2014-10-09 23:05:39 +00:00
return cpu;
}