/* RetroArch - A frontend for libretro.
 * Copyright (C) 2010-2013 - Hans-Kristian Arntzen
 * Copyright (C) 2011-2013 - Daniel De Matteis
 *
 * RetroArch is free software: you can redistribute it and/or modify it under the terms
 * of the GNU General Public License as published by the Free Software Found-
 * ation, either version 3 of the License, or (at your option) any later version.
 *
 * RetroArch is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY;
 * without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR
 * PURPOSE. See the GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along with RetroArch.
 * If not, see <http://www.gnu.org/licenses/>.
 */
|
|
|
|
|
2012-11-01 05:21:18 +00:00
|
|
|
#include "performance.h"

#include <string.h>

#ifdef ANDROID
#include "android/native/jni/cpufeatures.h"
#endif

#ifdef PERF_TEST

#if defined(__CELLOS_LV2__) || defined(GEKKO)
#ifndef _PPU_INTRINSICS_H
#include <ppu_intrinsics.h>
#endif
#elif defined(_XBOX360)
#include <PPCIntrinsics.h>
#elif defined(__linux__)
#include <sys/time.h>
#include <time.h>
#endif
|
2012-10-01 19:45:09 +00:00
|
|
|
|
2012-11-02 04:27:58 +00:00
|
|
|
|
2012-10-30 22:28:54 +00:00
|
|
|
#define MAX_COUNTERS 64
|
|
|
|
static struct rarch_perf_counter *perf_counters[MAX_COUNTERS];
|
|
|
|
static unsigned perf_ptr;
|
|
|
|
|
|
|
|
void rarch_perf_register(struct rarch_perf_counter *perf)
|
|
|
|
{
|
|
|
|
if (perf_ptr >= MAX_COUNTERS)
|
|
|
|
return;
|
|
|
|
|
|
|
|
perf_counters[perf_ptr++] = perf;
|
|
|
|
perf->registered = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
void rarch_perf_log(void)
|
|
|
|
{
|
|
|
|
RARCH_LOG("[PERF]: Performance counters:\n");
|
|
|
|
for (unsigned i = 0; i < perf_ptr; i++)
|
|
|
|
RARCH_PERFORMANCE_LOG(perf_counters[i]->ident, *perf_counters[i]);
|
|
|
|
}
|
|
|
|
|
2012-10-01 21:43:16 +00:00
|
|
|
rarch_perf_tick_t rarch_get_perf_counter(void)
|
2012-10-01 19:45:09 +00:00
|
|
|
{
|
2012-10-01 21:43:16 +00:00
|
|
|
rarch_perf_tick_t time = 0;
|
2012-10-01 21:04:15 +00:00
|
|
|
#ifdef _XBOX1
|
2012-10-01 21:43:16 +00:00
|
|
|
|
2012-10-01 21:04:15 +00:00
|
|
|
#define rdtsc __asm __emit 0fh __asm __emit 031h
|
|
|
|
LARGE_INTEGER time_tmp;
|
|
|
|
rdtsc;
|
|
|
|
__asm mov time_tmp.LowPart, eax;
|
|
|
|
__asm mov time_tmp.HighPart, edx;
|
|
|
|
time = time_tmp.QuadPart;
|
2012-10-01 21:43:16 +00:00
|
|
|
|
2012-10-16 17:55:39 +00:00
|
|
|
#elif defined(__linux__)
|
|
|
|
struct timespec tv;
|
2012-10-16 21:29:03 +00:00
|
|
|
if (clock_gettime(CLOCK_MONOTONIC, &tv) == 0)
|
2012-10-16 17:55:39 +00:00
|
|
|
time = (rarch_perf_tick_t)tv.tv_sec * 1000000000 + (rarch_perf_tick_t)tv.tv_nsec;
|
|
|
|
else
|
|
|
|
time = 0;
|
|
|
|
|
2012-10-01 22:47:20 +00:00
|
|
|
#elif defined(__GNUC__) && !defined(RARCH_CONSOLE)
|
2012-10-01 21:43:16 +00:00
|
|
|
|
2012-11-01 21:31:24 +00:00
|
|
|
#if defined(__i386__) || defined(__i486__) || defined(__i686__)
|
2012-10-01 21:43:16 +00:00
|
|
|
asm volatile ("rdtsc" : "=A" (time));
|
|
|
|
#elif defined(__x86_64__)
|
|
|
|
unsigned a, d;
|
|
|
|
asm volatile ("rdtsc" : "=a" (a), "=d" (d));
|
|
|
|
time = (rarch_perf_tick_t)a | ((rarch_perf_tick_t)d << 32);
|
|
|
|
#endif
|
2012-10-16 17:55:39 +00:00
|
|
|
|
2012-10-02 22:02:46 +00:00
|
|
|
#elif defined(__ARM_ARCH_6__) || defined(ANDROID)
|
2012-10-02 21:59:19 +00:00
|
|
|
asm volatile( "mrc p15, 0, %0, c9, c13, 0" : "=r"(time) );
|
2012-10-01 21:04:15 +00:00
|
|
|
#elif defined(__CELLOS_LV2__) || defined(GEKKO) || defined(_XBOX360)
|
|
|
|
time = __mftb();
|
2012-10-01 19:45:09 +00:00
|
|
|
#endif
|
2012-10-01 21:43:16 +00:00
|
|
|
|
2012-10-01 19:45:09 +00:00
|
|
|
return time;
|
|
|
|
}
|
2012-11-01 21:31:24 +00:00
|
|
|
#endif
|
|
|
|
|
|
|
|
#if defined(__x86_64__) || defined(__i386__) || defined(__i486__) || defined(__i686__)
|
|
|
|
#define CPU_X86
|
|
|
|
#endif
|
|
|
|
|
2012-11-10 12:46:24 +00:00
|
|
|
#if defined(_MSC_VER) && !defined(_XBOX)
|
2012-11-01 21:31:24 +00:00
|
|
|
#include <intrin.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifdef CPU_X86
|
|
|
|
/* Executes CPUID for leaf func and stores the resulting registers.
 *
 * func:  CPUID leaf, loaded into EAX.
 * flags: receives EAX, EBX, ECX, EDX in flags[0..3], in that order.
 *
 * With GCC-compatible compilers ECX is loaded with 0 before the instruction,
 * so leaves that take a sub-leaf index always query sub-leaf 0 rather than
 * whatever happened to be in the register. With an unknown compiler a warning
 * is logged and flags is zero-filled.
 */
static void x86_cpuid(int func, int flags[4])
{
   // On Android, we compile RetroArch with PIC, and we are not allowed to clobber the ebx
   // register. It is parked in esi/rsi across CPUID and swapped back afterwards, which
   // leaves CPUID's EBX result in esi/rsi for the "=S" output.
#ifdef __x86_64__
#define REG_b "rbx"
#define REG_S "rsi"
#else
#define REG_b "ebx"
#define REG_S "esi"
#endif

#if defined(__GNUC__)
   // __asm__/__volatile__ instead of "asm volatile": the plain keyword is not
   // available under strict -std=c99 / -std=c11.
   __asm__ __volatile__ (
         "mov %%" REG_b ", %%" REG_S "\n"
         "cpuid\n"
         "xchg %%" REG_b ", %%" REG_S "\n"
         : "=a"(flags[0]), "=S"(flags[1]), "=c"(flags[2]), "=d"(flags[3])
         : "a"(func), "c"(0));
#elif defined(_MSC_VER)
   __cpuid(flags, func);
#else
   RARCH_WARN("Unknown compiler. Cannot check CPUID with inline assembly.\n");
   memset(flags, 0, 4 * sizeof(int));
#endif

   // Keep the helper macros local to this function.
#undef REG_b
#undef REG_S
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
void rarch_get_cpu_features(struct rarch_cpu_features *cpu)
|
|
|
|
{
|
|
|
|
memset(cpu, 0, sizeof(*cpu));
|
|
|
|
|
2012-11-02 20:25:54 +00:00
|
|
|
#if defined(CPU_X86)
|
2012-11-01 21:31:24 +00:00
|
|
|
int flags[4];
|
|
|
|
x86_cpuid(0, flags);
|
|
|
|
|
|
|
|
char vendor[13] = {0};
|
|
|
|
const int vendor_shuffle[3] = { flags[1], flags[3], flags[2] };
|
|
|
|
memcpy(vendor, vendor_shuffle, sizeof(vendor_shuffle));
|
|
|
|
RARCH_LOG("[CPUID]: Vendor: %s\n", vendor);
|
|
|
|
|
|
|
|
if (flags[0] < 1) // Does CPUID not support func = 1? (unlikely ...)
|
|
|
|
return;
|
|
|
|
|
|
|
|
x86_cpuid(1, flags);
|
2012-11-05 08:06:00 +00:00
|
|
|
|
2012-11-05 10:57:40 +00:00
|
|
|
if (flags[3] & (1 << 25))
|
2012-11-05 08:06:00 +00:00
|
|
|
cpu->simd |= RARCH_SIMD_SSE;
|
|
|
|
|
2012-11-05 10:57:40 +00:00
|
|
|
if (flags[3] & (1 << 26))
|
2012-11-05 08:06:00 +00:00
|
|
|
cpu->simd |= RARCH_SIMD_SSE2;
|
2012-11-01 21:31:24 +00:00
|
|
|
|
2012-11-05 10:57:40 +00:00
|
|
|
const int avx_flags = (1 << 27) | (1 << 28);
|
|
|
|
if ((flags[2] & avx_flags) == avx_flags)
|
2012-11-05 08:06:00 +00:00
|
|
|
cpu->simd |= RARCH_SIMD_AVX;
|
|
|
|
|
2012-11-06 00:50:10 +00:00
|
|
|
RARCH_LOG("[CPUID]: SSE: %u\n", !!(cpu->simd & RARCH_SIMD_SSE));
|
|
|
|
RARCH_LOG("[CPUID]: SSE2: %u\n", !!(cpu->simd & RARCH_SIMD_SSE2));
|
|
|
|
RARCH_LOG("[CPUID]: AVX: %u\n", !!(cpu->simd & RARCH_SIMD_AVX));
|
2012-11-02 20:25:54 +00:00
|
|
|
#elif defined(ANDROID) && defined(ANDROID_ARM)
|
|
|
|
uint64_t cpu_flags = android_getCpuFeatures();
|
2012-11-05 08:06:00 +00:00
|
|
|
|
2012-11-05 10:57:40 +00:00
|
|
|
if (cpu_flags & ANDROID_CPU_ARM_FEATURE_NEON)
|
2012-11-05 08:06:00 +00:00
|
|
|
cpu->simd |= RARCH_SIMD_NEON;
|
|
|
|
|
2012-11-06 00:50:10 +00:00
|
|
|
RARCH_LOG("[CPUID]: NEON: %u\n", !!(cpu->simd & RARCH_SIMD_NEON));
|
2012-11-05 08:06:00 +00:00
|
|
|
#elif defined(__CELLOS_LV2__)
|
|
|
|
cpu->simd |= RARCH_SIMD_VMX;
|
2012-11-06 00:50:10 +00:00
|
|
|
RARCH_LOG("[CPUID]: VMX: %u\n", !!(cpu->simd & RARCH_SIMD_VMX));
|
2012-11-05 08:06:00 +00:00
|
|
|
#elif defined(XBOX360)
|
|
|
|
cpu->simd |= RARCH_SIMD_VMX128;
|
2012-11-06 00:50:10 +00:00
|
|
|
RARCH_LOG("[CPUID]: VMX128: %u\n", !!(cpu->simd & RARCH_SIMD_VMX128));
|
2012-11-02 04:27:58 +00:00
|
|
|
#endif
|
|
|
|
}
|