2012-10-01 21:45:09 +02:00
|
|
|
/* RetroArch - A frontend for libretro.
|
2014-01-01 01:50:59 +01:00
|
|
|
* Copyright (C) 2010-2014 - Hans-Kristian Arntzen
|
|
|
|
* Copyright (C) 2011-2014 - Daniel De Matteis
|
2012-10-01 21:45:09 +02:00
|
|
|
*
|
|
|
|
* RetroArch is free software: you can redistribute it and/or modify it under the terms
|
|
|
|
* of the GNU General Public License as published by the Free Software Found-
|
|
|
|
* ation, either version 3 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* RetroArch is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY;
|
|
|
|
* without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR
|
|
|
|
* PURPOSE. See the GNU General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License along with RetroArch.
|
|
|
|
* If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
*/
|
|
|
|
|
2013-11-27 23:36:46 +01:00
|
|
|
#include <stdio.h>
|
2013-12-17 19:10:21 +01:00
|
|
|
#include "libretro.h"
|
2012-11-01 06:21:18 +01:00
|
|
|
#include "performance.h"
|
2013-02-05 09:41:10 +01:00
|
|
|
#include "general.h"
|
2014-10-10 00:05:39 +01:00
|
|
|
#include "compat/strl.h"
|
2013-02-05 09:41:10 +01:00
|
|
|
|
2012-11-02 05:27:58 +01:00
|
|
|
#ifdef ANDROID
|
2013-11-27 22:57:49 +01:00
|
|
|
#include "performance/performance_android.h"
|
2012-11-02 05:27:58 +01:00
|
|
|
#endif
|
|
|
|
|
2013-02-05 09:41:10 +01:00
|
|
|
#if !defined(_WIN32) && !defined(RARCH_CONSOLE)
|
|
|
|
#include <unistd.h>
|
|
|
|
#endif
|
2012-11-01 22:31:24 +01:00
|
|
|
|
2013-12-13 03:58:58 +01:00
|
|
|
#if defined(_WIN32) && !defined(_XBOX)
|
|
|
|
#include <windows.h>
|
2013-12-29 11:48:00 +01:00
|
|
|
#include <intrin.h>
|
2013-12-13 03:58:58 +01:00
|
|
|
#endif
|
|
|
|
|
2012-10-01 22:02:20 +02:00
|
|
|
#if defined(__CELLOS_LV2__) || defined(GEKKO)
|
|
|
|
#ifndef _PPU_INTRINSICS_H
|
2012-10-01 21:45:09 +02:00
|
|
|
#include <ppu_intrinsics.h>
|
|
|
|
#endif
|
2012-10-01 22:25:13 +02:00
|
|
|
#elif defined(_XBOX360)
|
|
|
|
#include <PPCIntrinsics.h>
|
2013-02-27 09:33:16 +01:00
|
|
|
#elif defined(_POSIX_MONOTONIC_CLOCK) || defined(ANDROID) || defined(__QNX__)
|
2013-02-05 09:41:10 +01:00
|
|
|
// POSIX_MONOTONIC_CLOCK is not being defined in Android headers despite support being present.
|
|
|
|
#include <time.h>
|
|
|
|
#endif
|
|
|
|
|
2013-12-18 19:10:57 +01:00
|
|
|
#if defined(__QNX__) && !defined(CLOCK_MONOTONIC)
|
2013-02-25 02:36:42 +01:00
|
|
|
#define CLOCK_MONOTONIC 2
|
|
|
|
#endif
|
|
|
|
|
2014-02-17 15:58:46 +01:00
|
|
|
#if defined(__mips__)
|
|
|
|
#include <sys/time.h>
|
|
|
|
#endif
|
|
|
|
|
2013-02-05 09:41:10 +01:00
|
|
|
#if defined(__PSL1GHT__)
|
2012-10-16 19:55:39 +02:00
|
|
|
#include <sys/time.h>
|
2013-02-05 09:41:10 +01:00
|
|
|
#elif defined(__CELLOS_LV2__)
|
|
|
|
#include <sys/sys_time.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifdef GEKKO
|
|
|
|
#include <ogc/lwp_watchdog.h>
|
2012-10-01 22:02:20 +02:00
|
|
|
#endif
|
2012-10-01 21:45:09 +02:00
|
|
|
|
2013-02-05 09:41:10 +01:00
|
|
|
// OSX specific. OSX lacks clock_gettime().
|
|
|
|
#ifdef __MACH__
|
|
|
|
#include <mach/clock.h>
|
|
|
|
#include <mach/mach.h>
|
2014-07-26 04:35:00 +02:00
|
|
|
#include <mach/mach_time.h>
|
2013-02-05 09:41:10 +01:00
|
|
|
#endif
|
2012-11-02 05:27:58 +01:00
|
|
|
|
2013-07-17 20:26:01 -04:00
|
|
|
#ifdef EMSCRIPTEN
|
|
|
|
#include <emscripten.h>
|
|
|
|
#endif
|
|
|
|
|
2014-04-15 17:55:40 +02:00
|
|
|
#if defined(BSD) || defined(__APPLE__)
|
|
|
|
#include <sys/sysctl.h>
|
|
|
|
#endif
|
|
|
|
|
2013-12-13 04:05:21 +01:00
|
|
|
#include <string.h>
|
|
|
|
|
2014-06-01 18:44:30 +02:00
|
|
|
/* Registry of counters owned by the frontend itself, plus the number
 * of slots currently in use. */
const struct retro_perf_counter *perf_counters_rarch[MAX_COUNTERS];
unsigned perf_ptr_rarch;

/* Registry of counters registered through retro_perf_register(),
 * plus the number of slots currently in use. */
const struct retro_perf_counter *perf_counters_libretro[MAX_COUNTERS];
unsigned perf_ptr_libretro;
|
2012-10-30 23:28:54 +01:00
|
|
|
|
2013-12-17 19:10:21 +01:00
|
|
|
void rarch_perf_register(struct retro_perf_counter *perf)
|
2012-10-30 23:28:54 +01:00
|
|
|
{
|
2014-09-15 07:03:54 +02:00
|
|
|
if (!g_extern.perfcnt_enable || perf->registered
|
|
|
|
|| perf_ptr_rarch >= MAX_COUNTERS)
|
2012-10-30 23:28:54 +01:00
|
|
|
return;
|
|
|
|
|
2013-12-18 19:10:57 +01:00
|
|
|
perf_counters_rarch[perf_ptr_rarch++] = perf;
|
2012-10-30 23:28:54 +01:00
|
|
|
perf->registered = true;
|
|
|
|
}
|
|
|
|
|
2013-12-18 19:10:57 +01:00
|
|
|
void retro_perf_register(struct retro_perf_counter *perf)
|
|
|
|
{
|
|
|
|
if (perf->registered || perf_ptr_libretro >= MAX_COUNTERS)
|
|
|
|
return;
|
|
|
|
|
|
|
|
perf_counters_libretro[perf_ptr_libretro++] = perf;
|
|
|
|
perf->registered = true;
|
|
|
|
}
|
2013-12-18 19:03:08 +01:00
|
|
|
|
2013-12-18 19:10:57 +01:00
|
|
|
void retro_perf_clear(void)
|
|
|
|
{
|
|
|
|
perf_ptr_libretro = 0;
|
|
|
|
memset(perf_counters_libretro, 0, sizeof(perf_counters_libretro));
|
|
|
|
}
|
|
|
|
|
2014-09-15 07:03:54 +02:00
|
|
|
static void log_counters(
|
|
|
|
const struct retro_perf_counter **counters, unsigned num)
|
2012-10-30 23:28:54 +01:00
|
|
|
{
|
2013-10-19 19:39:38 +02:00
|
|
|
unsigned i;
|
2013-12-18 19:10:57 +01:00
|
|
|
for (i = 0; i < num; i++)
|
|
|
|
{
|
2014-06-01 20:24:55 +02:00
|
|
|
if (counters[i]->call_cnt)
|
|
|
|
{
|
|
|
|
RARCH_LOG(PERF_LOG_FMT,
|
|
|
|
counters[i]->ident,
|
2014-09-15 07:03:54 +02:00
|
|
|
(unsigned long long)counters[i]->total /
|
|
|
|
(unsigned long long)counters[i]->call_cnt,
|
2014-06-01 20:24:55 +02:00
|
|
|
(unsigned long long)counters[i]->call_cnt);
|
|
|
|
}
|
2013-12-18 19:10:57 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void rarch_perf_log(void)
|
|
|
|
{
|
2014-06-01 22:16:22 +02:00
|
|
|
if (!g_extern.perfcnt_enable)
|
|
|
|
return;
|
|
|
|
|
2013-12-18 19:10:57 +01:00
|
|
|
RARCH_LOG("[PERF]: Performance counters (RetroArch):\n");
|
|
|
|
log_counters(perf_counters_rarch, perf_ptr_rarch);
|
|
|
|
}
|
|
|
|
|
|
|
|
void retro_perf_log(void)
|
|
|
|
{
|
|
|
|
RARCH_LOG("[PERF]: Performance counters (libretro):\n");
|
|
|
|
log_counters(perf_counters_libretro, perf_ptr_libretro);
|
2012-10-30 23:28:54 +01:00
|
|
|
}
|
|
|
|
|
2013-12-17 19:10:21 +01:00
|
|
|
retro_perf_tick_t rarch_get_perf_counter(void)
|
2012-10-01 21:45:09 +02:00
|
|
|
{
|
2013-12-17 19:10:21 +01:00
|
|
|
retro_perf_tick_t time = 0;
|
2014-07-26 04:43:36 +02:00
|
|
|
#if defined(__MACH__) && defined(__APPLE__)
|
2014-07-26 04:35:00 +02:00
|
|
|
struct mach_timebase_info convfact;
|
|
|
|
mach_timebase_info(&convfact);
|
|
|
|
time = mach_absolute_time();
|
|
|
|
#elif defined(__linux__) || defined(__QNX__)
|
2012-10-16 19:55:39 +02:00
|
|
|
struct timespec tv;
|
2012-10-16 23:29:03 +02:00
|
|
|
if (clock_gettime(CLOCK_MONOTONIC, &tv) == 0)
|
2014-09-15 07:03:54 +02:00
|
|
|
time = (retro_perf_tick_t)tv.tv_sec * 1000000000 +
|
|
|
|
(retro_perf_tick_t)tv.tv_nsec;
|
2012-10-16 19:55:39 +02:00
|
|
|
else
|
|
|
|
time = 0;
|
|
|
|
|
2014-02-10 10:19:11 +11:00
|
|
|
#elif defined(__GNUC__) && !defined(RARCH_CONSOLE)
|
2012-10-01 23:43:16 +02:00
|
|
|
|
2012-11-01 22:31:24 +01:00
|
|
|
#if defined(__i386__) || defined(__i486__) || defined(__i686__)
|
2012-10-01 23:43:16 +02:00
|
|
|
asm volatile ("rdtsc" : "=A" (time));
|
|
|
|
#elif defined(__x86_64__)
|
|
|
|
unsigned a, d;
|
|
|
|
asm volatile ("rdtsc" : "=a" (a), "=d" (d));
|
2013-12-17 19:10:21 +01:00
|
|
|
time = (retro_perf_tick_t)a | ((retro_perf_tick_t)d << 32);
|
2012-10-01 23:43:16 +02:00
|
|
|
#endif
|
2012-10-16 19:55:39 +02:00
|
|
|
|
2013-02-05 09:41:10 +01:00
|
|
|
#elif defined(__ARM_ARCH_6__)
|
2013-12-18 19:10:57 +01:00
|
|
|
asm volatile( "mrc p15, 0, %0, c9, c13, 0" : "=r"(time) );
|
2014-02-09 23:10:40 +01:00
|
|
|
#elif defined(__CELLOS_LV2__) || defined(GEKKO) || defined(_XBOX360) || defined(__powerpc__) || defined(__ppc__) || defined(__POWERPC__)
|
2012-10-01 23:04:15 +02:00
|
|
|
time = __mftb();
|
2014-02-17 15:58:46 +01:00
|
|
|
#elif defined(__mips__)
|
|
|
|
struct timeval tv;
|
2014-02-17 16:49:31 +01:00
|
|
|
gettimeofday(&tv,NULL);
|
|
|
|
time = (1000000 * tv.tv_sec + tv.tv_usec);
|
2014-06-03 21:50:32 +02:00
|
|
|
#elif defined(_WIN32)
|
|
|
|
long tv_sec, tv_usec;
|
|
|
|
static const unsigned __int64 epoch = 11644473600000000Ui64;
|
|
|
|
FILETIME file_time;
|
|
|
|
SYSTEMTIME system_time;
|
|
|
|
ULARGE_INTEGER ularge;
|
|
|
|
|
|
|
|
GetSystemTime(&system_time);
|
|
|
|
SystemTimeToFileTime(&system_time, &file_time);
|
|
|
|
ularge.LowPart = file_time.dwLowDateTime;
|
|
|
|
ularge.HighPart = file_time.dwHighDateTime;
|
|
|
|
|
|
|
|
tv_sec = (long)((ularge.QuadPart - epoch) / 10000000L);
|
|
|
|
tv_usec = (long)(system_time.wMilliseconds * 1000);
|
|
|
|
|
|
|
|
time = (1000000 * tv_sec + tv_usec);
|
2012-10-01 21:45:09 +02:00
|
|
|
#endif
|
2012-10-01 23:43:16 +02:00
|
|
|
|
2012-10-01 21:45:09 +02:00
|
|
|
return time;
|
|
|
|
}
|
2012-11-01 22:31:24 +01:00
|
|
|
|
2013-12-17 19:10:21 +01:00
|
|
|
/* Returns a timestamp in microseconds.
 *
 * The clock source is platform-specific (QueryPerformanceCounter on
 * Win32, the system time on Cell, the Gekko time base, the Mach calendar
 * clock on OSX, CLOCK_MONOTONIC on POSIX systems, emscripten_get_now(),
 * gettimeofday() on MIPS), so the epoch is unspecified; use the value
 * for measuring intervals only.
 *
 * Returns 0 when the Win32, Mach or POSIX clock call reports failure. */
retro_time_t rarch_get_time_usec(void)
{
#if defined(_WIN32)
   static LARGE_INTEGER freq;
   LARGE_INTEGER count;

   /* Frequency is guaranteed to not change. */
   if (!freq.QuadPart && !QueryPerformanceFrequency(&freq))
      return 0;

   if (!QueryPerformanceCounter(&count))
      return 0;

   /* Split into whole seconds and the sub-second remainder before
    * scaling. count * 1000000 as a single product overflows a signed
    * 64-bit value after a few days of uptime at common counter
    * frequencies; this form yields the same quotient without the
    * large intermediate. */
   return (count.QuadPart / freq.QuadPart) * 1000000
      + (count.QuadPart % freq.QuadPart) * 1000000 / freq.QuadPart;
#elif defined(__CELLOS_LV2__)
   return sys_time_get_system_time();
#elif defined(GEKKO)
   return ticks_to_microsecs(gettime());
#elif defined(__MACH__)
   /* OSX doesn't have clock_gettime. */
   clock_serv_t cclock;
   mach_timespec_t mts;
   kern_return_t status;

   if (host_get_clock_service(mach_host_self(), CALENDAR_CLOCK, &cclock)
         != KERN_SUCCESS)
      return 0;

   status = clock_get_time(cclock, &mts);
   mach_port_deallocate(mach_task_self(), cclock);

   /* Without this check a failed call would leave mts uninitialized. */
   if (status != KERN_SUCCESS)
      return 0;

   return mts.tv_sec * INT64_C(1000000) + (mts.tv_nsec + 500) / 1000;
#elif defined(_POSIX_MONOTONIC_CLOCK) || defined(__QNX__) || defined(ANDROID)
   struct timespec tv;
   if (clock_gettime(CLOCK_MONOTONIC, &tv) < 0)
      return 0;
   return tv.tv_sec * INT64_C(1000000) + (tv.tv_nsec + 500) / 1000;
#elif defined(EMSCRIPTEN)
   return emscripten_get_now() * 1000;
#elif defined(__mips__)
   struct timeval tv;
   gettimeofday(&tv,NULL);
   /* INT64_C forces 64-bit arithmetic, matching the other branches;
    * tv_sec may be a 32-bit type. */
   return tv.tv_sec * INT64_C(1000000) + tv.tv_usec;
#else
#error "Your platform does not have a timer function implemented in rarch_get_time_usec(). Cannot continue."
#endif
}
|
|
|
|
|
2012-11-01 22:31:24 +01:00
|
|
|
#if defined(__x86_64__) || defined(__i386__) || defined(__i486__) || defined(__i686__)
|
|
|
|
#define CPU_X86
|
|
|
|
#endif
|
|
|
|
|
2012-11-10 13:46:24 +01:00
|
|
|
#if defined(_MSC_VER) && !defined(_XBOX)
|
2012-11-01 22:31:24 +01:00
|
|
|
#include <intrin.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifdef CPU_X86
|
|
|
|
/* Executes the CPUID instruction for leaf `func`, sub-leaf 0.
 *
 * func:  value loaded into EAX before CPUID.
 * flags: receives EAX, EBX, ECX, EDX (in that order) after CPUID.
 *
 * With an unknown compiler a warning is logged and flags is zeroed. */
static void x86_cpuid(int func, int flags[4])
{
   /* On Android, we compile RetroArch with PIC, and we
    * are not allowed to clobber the ebx register. */
#ifdef __x86_64__
#define REG_b "rbx"
#define REG_S "rsi"
#else
#define REG_b "ebx"
#define REG_S "esi"
#endif

#if defined(__GNUC__)
   /* EBX is parked in ESI around the instruction and swapped back
    * afterwards, so the CPUID result for EBX is read out of ESI.
    *
    * ECX is explicitly zeroed on input: leaves such as 7 use it as a
    * sub-leaf selector, and leaving it uninitialized would query an
    * arbitrary sub-leaf. MSVC's __cpuid clears ECX as well. */
   __asm__ volatile (
         "mov %%" REG_b ", %%" REG_S "\n"
         "cpuid\n"
         "xchg %%" REG_b ", %%" REG_S "\n"
         : "=a"(flags[0]), "=S"(flags[1]), "=c"(flags[2]), "=d"(flags[3])
         : "a"(func), "c"(0));
#elif defined(_MSC_VER)
   __cpuid(flags, func);
#else
   RARCH_WARN("Unknown compiler. Cannot check CPUID with inline assembly.\n");
   memset(flags, 0, 4 * sizeof(int));
#endif
}
|
2013-12-22 18:22:26 -05:00
|
|
|
|
2014-09-15 07:03:54 +02:00
|
|
|
/* Only runs on i686 and above. Needs to be conditionally run. */
|
2013-12-29 11:48:00 +01:00
|
|
|
static uint64_t xgetbv_x86(uint32_t index)
|
2013-12-22 18:22:26 -05:00
|
|
|
{
|
2013-12-29 11:48:00 +01:00
|
|
|
#if defined(__GNUC__)
|
2013-12-22 18:22:26 -05:00
|
|
|
uint32_t eax, edx;
|
2013-12-29 11:48:00 +01:00
|
|
|
asm volatile (
|
2014-09-15 07:03:54 +02:00
|
|
|
/* Older GCC versions (Apple's GCC for example) do
|
|
|
|
* not understand xgetbv instruction.
|
|
|
|
* Stamp out the machine code directly.
|
|
|
|
*/
|
2013-12-29 11:48:00 +01:00
|
|
|
".byte 0x0f, 0x01, 0xd0\n"
|
|
|
|
: "=a"(eax), "=d"(edx) : "c"(index));
|
2013-12-22 18:22:26 -05:00
|
|
|
return ((uint64_t)edx << 32) | eax;
|
2014-09-15 07:03:54 +02:00
|
|
|
#elif _MSC_FULL_VER >= 160040219
|
|
|
|
/* Intrinsic only works on 2010 SP1 and above. */
|
2013-12-29 11:48:00 +01:00
|
|
|
return _xgetbv(index);
|
|
|
|
#else
|
|
|
|
RARCH_WARN("Unknown compiler. Cannot check xgetbv bits.\n");
|
|
|
|
return 0;
|
|
|
|
#endif
|
2013-12-22 18:22:26 -05:00
|
|
|
}
|
2012-11-01 22:31:24 +01:00
|
|
|
#endif
|
|
|
|
|
2014-07-26 20:18:37 +02:00
|
|
|
#if defined(__ARM_NEON__)
/* Switches the VFP/NEON unit into RunFast mode, which enables
 * flush-to-zero and some floating point optimizations.
 *
 * FPSCR is read, ANDed with 0x04086060, ORed with 0x03000000 and
 * written back. */
static void arm_enable_runfast_mode(void)
{
   static const unsigned keep_mask = 0x04086060;
   static const unsigned set_bits  = 0x03000000;
   int fpscr;

   asm volatile(
         "fmrx	%0, fpscr   \n\t" /* fpscr  = FPSCR */
         "and	%0, %0, %1  \n\t" /* fpscr &= keep_mask */
         "orr	%0, %0, %2  \n\t" /* fpscr |= set_bits */
         "fmxr	fpscr, %0   \n\t" /* FPSCR  = fpscr */
         : "=r"(fpscr)
         : "r"(keep_mask), "r"(set_bits)
         );
}
#endif
|
|
|
|
|
2014-04-15 17:55:40 +02:00
|
|
|
/* Returns the number of CPU cores reported by the platform.
 *
 * The result is never 0 on the sysconf() and sysctl() paths: a failed
 * or nonsensical query falls back to 1. Platforms without a known
 * query mechanism are assumed to be single core. */
unsigned rarch_get_cpu_cores(void)
{
#if defined(_WIN32) && !defined(_XBOX)
   /* Win32 */
   SYSTEM_INFO info;
   GetSystemInfo(&info);
   return info.dwNumberOfProcessors;
#elif defined(ANDROID)
   return android_getCpuCount();
#elif defined(GEKKO)
   return 1;
#elif defined(_SC_NPROCESSORS_ONLN)
   /* Linux, most UNIX-likes. */
   const long online = sysconf(_SC_NPROCESSORS_ONLN);
   return (online > 0) ? (unsigned)online : (unsigned)1;
#elif defined(BSD) || defined(__APPLE__)
   /* BSD */
   /* Copypasta from stackoverflow, dunno if it works. */
   int mib[2]  = { CTL_HW, HW_AVAILCPU };
   int num_cpu = 0;
   size_t len  = sizeof(num_cpu);

   /* Prefer the count of currently available CPUs ... */
   sysctl(mib, 2, &num_cpu, &len, NULL, 0);
   if (num_cpu >= 1)
      return num_cpu;

   /* ... then the configured count, and finally assume one core. */
   mib[1] = HW_NCPU;
   sysctl(mib, 2, &num_cpu, &len, NULL, 0);
   if (num_cpu >= 1)
      return num_cpu;

   return 1;
#elif defined(_XBOX360)
   return 3;
#else
   /* No idea, assume single core. */
   return 1;
#endif
}
|
|
|
|
|
2013-12-18 19:10:57 +01:00
|
|
|
uint64_t rarch_get_cpu_features(void)
|
2012-11-01 22:31:24 +01:00
|
|
|
{
|
2013-12-18 19:10:57 +01:00
|
|
|
uint64_t cpu = 0;
|
2012-11-01 22:31:24 +01:00
|
|
|
|
2014-10-10 19:02:44 +02:00
|
|
|
const unsigned MAX_FEATURES = \
|
2014-10-10 00:05:39 +01:00
|
|
|
sizeof(" MMX MMXEXT SSE SSE2 SSE3 SSSE3 SS4 SSE4.2 AES AVX AVX2 NEON VMX VMX128 VFPU PS");
|
|
|
|
char buf[MAX_FEATURES];
|
|
|
|
memset(buf, 0, MAX_FEATURES);
|
|
|
|
|
2012-11-02 21:25:54 +01:00
|
|
|
#if defined(CPU_X86)
|
2012-11-01 22:31:24 +01:00
|
|
|
int flags[4];
|
|
|
|
x86_cpuid(0, flags);
|
|
|
|
|
|
|
|
char vendor[13] = {0};
|
|
|
|
const int vendor_shuffle[3] = { flags[1], flags[3], flags[2] };
|
|
|
|
memcpy(vendor, vendor_shuffle, sizeof(vendor_shuffle));
|
|
|
|
RARCH_LOG("[CPUID]: Vendor: %s\n", vendor);
|
|
|
|
|
2014-02-16 16:25:14 +01:00
|
|
|
unsigned max_flag = flags[0];
|
2014-09-15 07:03:54 +02:00
|
|
|
if (max_flag < 1) /* Does CPUID not support func = 1? (unlikely ...) */
|
2013-12-18 19:10:57 +01:00
|
|
|
return 0;
|
2012-11-01 22:31:24 +01:00
|
|
|
|
|
|
|
x86_cpuid(1, flags);
|
2012-11-05 09:06:00 +01:00
|
|
|
|
2013-12-25 21:34:03 +01:00
|
|
|
if (flags[3] & (1 << 23))
|
|
|
|
cpu |= RETRO_SIMD_MMX;
|
|
|
|
|
2012-11-05 11:57:40 +01:00
|
|
|
if (flags[3] & (1 << 25))
|
2014-02-16 16:25:14 +01:00
|
|
|
{
|
2014-09-15 07:03:54 +02:00
|
|
|
/* SSE also implies MMXEXT (according to FFmpeg source). */
|
2013-12-18 19:10:57 +01:00
|
|
|
cpu |= RETRO_SIMD_SSE;
|
2014-02-16 16:25:14 +01:00
|
|
|
cpu |= RETRO_SIMD_MMXEXT;
|
|
|
|
}
|
2012-11-05 09:06:00 +01:00
|
|
|
|
2012-11-05 11:57:40 +01:00
|
|
|
if (flags[3] & (1 << 26))
|
2013-12-18 19:10:57 +01:00
|
|
|
cpu |= RETRO_SIMD_SSE2;
|
2012-11-01 22:31:24 +01:00
|
|
|
|
2013-12-12 05:50:22 +01:00
|
|
|
if (flags[2] & (1 << 0))
|
2013-12-18 19:10:57 +01:00
|
|
|
cpu |= RETRO_SIMD_SSE3;
|
2013-12-12 05:50:22 +01:00
|
|
|
|
2013-12-12 10:56:21 +01:00
|
|
|
if (flags[2] & (1 << 9))
|
2013-12-18 19:10:57 +01:00
|
|
|
cpu |= RETRO_SIMD_SSSE3;
|
2013-12-12 10:56:21 +01:00
|
|
|
|
2014-02-16 16:25:14 +01:00
|
|
|
if (flags[2] & (1 << 19))
|
|
|
|
cpu |= RETRO_SIMD_SSE4;
|
|
|
|
|
|
|
|
if (flags[2] & (1 << 20))
|
|
|
|
cpu |= RETRO_SIMD_SSE42;
|
|
|
|
|
2014-09-02 20:50:43 +02:00
|
|
|
if (flags[2] & (1 << 25))
|
|
|
|
cpu |= RETRO_SIMD_AES;
|
|
|
|
|
2012-11-05 11:57:40 +01:00
|
|
|
const int avx_flags = (1 << 27) | (1 << 28);
|
2014-09-15 07:03:54 +02:00
|
|
|
|
|
|
|
/* Must only perform xgetbv check if we have
|
|
|
|
* AVX CPU support (guaranteed to have at least i686). */
|
|
|
|
if (((flags[2] & avx_flags) == avx_flags)
|
|
|
|
&& ((xgetbv_x86(0) & 0x6) == 0x6))
|
2013-12-18 19:10:57 +01:00
|
|
|
cpu |= RETRO_SIMD_AVX;
|
2012-11-05 09:06:00 +01:00
|
|
|
|
2014-02-16 16:25:14 +01:00
|
|
|
if (max_flag >= 7)
|
|
|
|
{
|
|
|
|
x86_cpuid(7, flags);
|
|
|
|
if (flags[1] & (1 << 5))
|
|
|
|
cpu |= RETRO_SIMD_AVX2;
|
|
|
|
}
|
|
|
|
|
|
|
|
x86_cpuid(0x80000000, flags);
|
|
|
|
max_flag = flags[0];
|
|
|
|
if (max_flag >= 0x80000001u)
|
|
|
|
{
|
|
|
|
x86_cpuid(0x80000001, flags);
|
|
|
|
if (flags[3] & (1 << 23))
|
|
|
|
cpu |= RETRO_SIMD_MMX;
|
|
|
|
if (flags[3] & (1 << 22))
|
|
|
|
cpu |= RETRO_SIMD_MMXEXT;
|
|
|
|
}
|
|
|
|
|
2012-11-02 21:25:54 +01:00
|
|
|
#elif defined(ANDROID) && defined(ANDROID_ARM)
|
|
|
|
uint64_t cpu_flags = android_getCpuFeatures();
|
2013-12-30 07:58:18 +01:00
|
|
|
(void)cpu_flags;
|
2012-11-05 09:06:00 +01:00
|
|
|
|
2014-07-26 20:18:37 +02:00
|
|
|
#ifdef __ARM_NEON__
|
2012-11-05 11:57:40 +01:00
|
|
|
if (cpu_flags & ANDROID_CPU_ARM_FEATURE_NEON)
|
2013-12-30 07:58:18 +01:00
|
|
|
{
|
2013-12-18 19:10:57 +01:00
|
|
|
cpu |= RETRO_SIMD_NEON;
|
2013-12-30 07:58:18 +01:00
|
|
|
arm_enable_runfast_mode();
|
|
|
|
}
|
|
|
|
#endif
|
2012-11-05 09:06:00 +01:00
|
|
|
|
2014-07-26 20:18:37 +02:00
|
|
|
#elif defined(__ARM_NEON__)
|
2013-12-26 18:07:09 +01:00
|
|
|
cpu |= RETRO_SIMD_NEON;
|
2013-12-30 07:58:18 +01:00
|
|
|
arm_enable_runfast_mode();
|
2014-02-11 12:02:17 +01:00
|
|
|
#elif defined(__ALTIVEC__)
|
2013-12-26 18:07:09 +01:00
|
|
|
cpu |= RETRO_SIMD_VMX;
|
2012-11-05 09:06:00 +01:00
|
|
|
#elif defined(XBOX360)
|
2013-12-26 18:07:09 +01:00
|
|
|
cpu |= RETRO_SIMD_VMX128;
|
2014-02-16 17:32:54 +01:00
|
|
|
#elif defined(PSP)
|
|
|
|
cpu |= RETRO_SIMD_VFPU;
|
2014-03-08 05:00:52 +01:00
|
|
|
#elif defined(GEKKO)
|
|
|
|
cpu |= RETRO_SIMD_PS;
|
2012-11-02 05:27:58 +01:00
|
|
|
#endif
|
2013-12-18 19:10:57 +01:00
|
|
|
|
2014-10-10 00:05:39 +01:00
|
|
|
if (cpu & RETRO_SIMD_MMX) strlcat(buf, " MMX", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_MMXEXT) strlcat(buf, " MMXEXT", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_SSE) strlcat(buf, " SSE", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_SSE2) strlcat(buf, " SSE2", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_SSE3) strlcat(buf, " SSE3", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_SSSE3) strlcat(buf, " SSSE3", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_SSE4) strlcat(buf, " SSE4", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_SSE42) strlcat(buf, " SSE4.2", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_AES) strlcat(buf, " AES", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_AVX) strlcat(buf, " AVX", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_AVX2) strlcat(buf, " AVX2", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_NEON) strlcat(buf, " NEON", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_VMX) strlcat(buf, " VMX", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_VMX128) strlcat(buf, " VMX128", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_VFPU) strlcat(buf, " VFPU", sizeof(buf));
|
|
|
|
if (cpu & RETRO_SIMD_PS) strlcat(buf, " PS", sizeof(buf));
|
|
|
|
|
|
|
|
RARCH_LOG("[CPUID]: Features:%s\n", buf);
|
|
|
|
|
|
|
|
|
2013-12-18 19:10:57 +01:00
|
|
|
return cpu;
|
2012-11-02 05:27:58 +01:00
|
|
|
}
|