2017-11-16 20:11:51 +00:00
|
|
|
// ppc-simd.cpp - written and placed in the public domain by
|
2017-09-11 07:05:04 +00:00
|
|
|
// Jeffrey Walton, Uri Blumenthal and Marcel Raad.
|
|
|
|
//
|
|
|
|
// This source file uses intrinsics to gain access to AltiVec,
|
|
|
|
// Power8 and in-core crypto instructions. A separate source file
|
|
|
|
// is needed because additional CXXFLAGS are required to enable the
|
|
|
|
// appropriate instructions sets in some build configurations.
|
|
|
|
|
2018-01-11 18:16:13 +00:00
|
|
|
// TODO: we still need to implement Power8 SHA. Once we have Power8 SHA,
|
2018-01-11 22:59:24 +00:00
|
|
|
// we should be able to use CRYPTOPP_POWER8_AES_AVAILABLE and
|
2018-01-11 18:16:13 +00:00
|
|
|
// CRYPTOPP_POWER8_SHA_AVAILABLE instead of the broader
|
|
|
|
// CRYPTOPP_POWER8_AVAILABLE. The change will need to be coordinated
|
|
|
|
// with the defines in config.h.
|
|
|
|
|
|
|
|
// TODO: Bob Wilkinson reported we are misdetecting CRYPTOPP_POWER8_AVAILABLE.
|
|
|
|
// The problem is, the updated compiler supports them but the down-level
|
2018-01-11 18:20:29 +00:00
|
|
|
// assembler and linker do not. We will probably need to fix it through
|
|
|
|
// the makefile, similar to the way x86 AES and SHA are handled. For the time
|
|
|
|
// being CRYPTOPP_DISABLE_POWER8 will have to be applied manually. Another
|
2018-01-11 18:16:13 +00:00
|
|
|
// twist is, we don't have access to a test machine and it must be fixed
|
|
|
|
// for two compilers (IBM XL C/C++ and GCC). Ugh...
|
|
|
|
|
2017-09-11 07:05:04 +00:00
|
|
|
#include "pch.h"
|
|
|
|
#include "config.h"
|
|
|
|
#include "stdcpp.h"
|
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
#if defined(CRYPTOPP_ALTIVEC_AVAILABLE)
|
2017-12-12 12:15:59 +00:00
|
|
|
# include "ppc-simd.h"
|
2017-09-11 07:05:04 +00:00
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifdef CRYPTOPP_GNU_STYLE_INLINE_ASSEMBLY
|
|
|
|
# include <signal.h>
|
|
|
|
# include <setjmp.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifndef EXCEPTION_EXECUTE_HANDLER
|
|
|
|
# define EXCEPTION_EXECUTE_HANDLER 1
|
|
|
|
#endif
|
|
|
|
|
2018-07-06 05:22:38 +00:00
|
|
|
// Squash MS LNK4221 and libtool warnings
|
|
|
|
extern const char PPC_SIMD_FNAME[] = __FILE__;
|
|
|
|
|
2017-09-11 07:05:04 +00:00
|
|
|
NAMESPACE_BEGIN(CryptoPP)
|
|
|
|
|
|
|
|
#ifdef CRYPTOPP_GNU_STYLE_INLINE_ASSEMBLY
|
|
|
|
extern "C" {
|
|
|
|
typedef void (*SigHandler)(int);
|
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
static jmp_buf s_jmpSIGILL;
|
|
|
|
static void SigIllHandler(int)
|
|
|
|
{
|
|
|
|
longjmp(s_jmpSIGILL, 1);
|
|
|
|
}
|
2018-03-31 17:06:44 +00:00
|
|
|
}
|
2017-09-11 07:05:04 +00:00
|
|
|
#endif // Not CRYPTOPP_MS_STYLE_INLINE_ASSEMBLY
|
|
|
|
|
2017-09-12 09:49:38 +00:00
|
|
|
#if (CRYPTOPP_BOOL_PPC32 || CRYPTOPP_BOOL_PPC64)
|
2017-09-12 02:39:59 +00:00
|
|
|
bool CPU_ProbeAltivec()
|
2017-09-11 07:05:04 +00:00
|
|
|
{
|
2017-09-20 01:08:37 +00:00
|
|
|
#if defined(CRYPTOPP_NO_CPU_FEATURE_PROBES)
|
2017-12-17 01:26:59 +00:00
|
|
|
return false;
|
2017-09-20 01:08:37 +00:00
|
|
|
#elif (CRYPTOPP_ALTIVEC_AVAILABLE)
|
2017-09-11 07:05:04 +00:00
|
|
|
# if defined(CRYPTOPP_GNU_STYLE_INLINE_ASSEMBLY)
|
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
// longjmp and clobber warnings. Volatile is required.
|
|
|
|
// http://github.com/weidai11/cryptopp/issues/24 and http://stackoverflow.com/q/7721854
|
|
|
|
volatile int result = true;
|
|
|
|
|
|
|
|
volatile SigHandler oldHandler = signal(SIGILL, SigIllHandler);
|
|
|
|
if (oldHandler == SIG_ERR)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
volatile sigset_t oldMask;
|
|
|
|
if (sigprocmask(0, NULLPTR, (sigset_t*)&oldMask))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (setjmp(s_jmpSIGILL))
|
|
|
|
result = false;
|
|
|
|
else
|
|
|
|
{
|
|
|
|
const byte b1[16] = {0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0};
|
|
|
|
const byte b2[16] = {1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};
|
|
|
|
byte b3[16];
|
|
|
|
|
|
|
|
const uint8x16_p v1 = (uint8x16_p)VectorLoad(0, b1);
|
|
|
|
const uint8x16_p v2 = (uint8x16_p)VectorLoad(0, b2);
|
|
|
|
const uint8x16_p v3 = (uint8x16_p)VectorXor(v1, v2);
|
|
|
|
VectorStore(v3, b3);
|
|
|
|
|
|
|
|
result = (0 == std::memcmp(b2, b3, 16));
|
|
|
|
}
|
|
|
|
|
|
|
|
sigprocmask(SIG_SETMASK, (sigset_t*)&oldMask, NULLPTR);
|
|
|
|
signal(SIGILL, oldHandler);
|
|
|
|
return result;
|
2017-09-11 07:05:04 +00:00
|
|
|
# endif
|
|
|
|
#else
|
2017-12-17 01:26:59 +00:00
|
|
|
return false;
|
2017-09-11 07:05:04 +00:00
|
|
|
#endif // CRYPTOPP_ALTIVEC_AVAILABLE
|
|
|
|
}
|
|
|
|
|
2017-09-12 02:39:59 +00:00
|
|
|
bool CPU_ProbePower7()
|
2017-09-11 07:05:04 +00:00
|
|
|
{
|
2017-09-20 01:08:37 +00:00
|
|
|
#if defined(CRYPTOPP_NO_CPU_FEATURE_PROBES)
|
2017-12-17 01:26:59 +00:00
|
|
|
return false;
|
2017-10-18 02:50:45 +00:00
|
|
|
#elif (CRYPTOPP_POWER7_AVAILABLE)
|
2017-09-11 07:05:04 +00:00
|
|
|
# if defined(CRYPTOPP_GNU_STYLE_INLINE_ASSEMBLY)
|
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
// longjmp and clobber warnings. Volatile is required.
|
|
|
|
// http://github.com/weidai11/cryptopp/issues/24 and http://stackoverflow.com/q/7721854
|
|
|
|
volatile int result = false;
|
2017-09-11 07:05:04 +00:00
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
volatile SigHandler oldHandler = signal(SIGILL, SigIllHandler);
|
|
|
|
if (oldHandler == SIG_ERR)
|
|
|
|
return false;
|
2017-09-11 07:05:04 +00:00
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
volatile sigset_t oldMask;
|
|
|
|
if (sigprocmask(0, NULLPTR, (sigset_t*)&oldMask))
|
|
|
|
return false;
|
2017-09-11 07:05:04 +00:00
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
if (setjmp(s_jmpSIGILL))
|
|
|
|
result = false;
|
|
|
|
else
|
|
|
|
{
|
|
|
|
byte b1[19] = {255, 255, 255, 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, b2[17];
|
|
|
|
const uint8x16_p v1 = (uint8x16_p)VectorLoad(0, b1+3);
|
|
|
|
VectorStore(v1, b2+1);
|
2017-10-18 02:50:45 +00:00
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
result = (0 == std::memcmp(b1+3, b2+1, 16));
|
|
|
|
}
|
2017-09-11 07:05:04 +00:00
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
sigprocmask(SIG_SETMASK, (sigset_t*)&oldMask, NULLPTR);
|
|
|
|
signal(SIGILL, oldHandler);
|
|
|
|
return result;
|
2017-09-11 07:05:04 +00:00
|
|
|
# endif
|
|
|
|
#else
|
2017-12-17 01:26:59 +00:00
|
|
|
return false;
|
2017-09-11 07:05:04 +00:00
|
|
|
#endif // CRYPTOPP_POWER7_AVAILABLE
|
|
|
|
}
|
|
|
|
|
2017-09-12 02:39:59 +00:00
|
|
|
bool CPU_ProbePower8()
|
2017-09-11 07:05:04 +00:00
|
|
|
{
|
2017-09-20 01:08:37 +00:00
|
|
|
#if defined(CRYPTOPP_NO_CPU_FEATURE_PROBES)
|
2017-12-17 01:26:59 +00:00
|
|
|
return false;
|
2018-01-11 18:16:13 +00:00
|
|
|
#elif (CRYPTOPP_POWER8_AVAILABLE)
|
2017-09-11 07:05:04 +00:00
|
|
|
# if defined(CRYPTOPP_GNU_STYLE_INLINE_ASSEMBLY)
|
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
// longjmp and clobber warnings. Volatile is required.
|
|
|
|
// http://github.com/weidai11/cryptopp/issues/24 and http://stackoverflow.com/q/7721854
|
|
|
|
volatile int result = true;
|
2017-09-11 07:05:04 +00:00
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
volatile SigHandler oldHandler = signal(SIGILL, SigIllHandler);
|
|
|
|
if (oldHandler == SIG_ERR)
|
|
|
|
return false;
|
2017-09-11 07:05:04 +00:00
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
volatile sigset_t oldMask;
|
|
|
|
if (sigprocmask(0, NULLPTR, (sigset_t*)&oldMask))
|
|
|
|
return false;
|
2017-09-11 07:05:04 +00:00
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
if (setjmp(s_jmpSIGILL))
|
|
|
|
result = false;
|
|
|
|
else
|
|
|
|
{
|
2018-08-03 05:27:39 +00:00
|
|
|
// POWER8 added 64-bit SIMD operations
|
|
|
|
const word64 m = W64LIT(0xffffffffffffffff);
|
|
|
|
word64 w1[2] = {m, m}, w2[2] = {3, 4}, w3[2];
|
|
|
|
const uint64x2_p v1 = (uint64x2_p)VectorLoad(0, w1);
|
|
|
|
const uint64x2_p v2 = (uint64x2_p)VectorLoad(0, w2);
|
|
|
|
VectorStore(VectorAdd(v1, v2), w3);
|
|
|
|
|
|
|
|
// The 64-bit add will overflow.
|
|
|
|
result = (w3[0] == 2 && w3[1] == 3);
|
2017-12-17 01:26:59 +00:00
|
|
|
}
|
2017-09-11 07:05:04 +00:00
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
sigprocmask(SIG_SETMASK, (sigset_t*)&oldMask, NULLPTR);
|
|
|
|
signal(SIGILL, oldHandler);
|
|
|
|
return result;
|
2017-09-11 07:05:04 +00:00
|
|
|
# endif
|
|
|
|
#else
|
2017-12-17 01:26:59 +00:00
|
|
|
return false;
|
2018-01-11 18:04:59 +00:00
|
|
|
#endif // CRYPTOPP_POWER8_AVAILABLE
|
2017-09-11 07:05:04 +00:00
|
|
|
}
|
|
|
|
|
2017-09-12 02:39:59 +00:00
|
|
|
bool CPU_ProbeAES()
|
2017-09-11 07:05:04 +00:00
|
|
|
{
|
2017-09-20 01:08:37 +00:00
|
|
|
#if defined(CRYPTOPP_NO_CPU_FEATURE_PROBES)
|
2017-12-17 01:26:59 +00:00
|
|
|
return false;
|
2018-01-11 18:04:59 +00:00
|
|
|
#elif (CRYPTOPP_POWER8_AVAILABLE)
|
2017-09-11 07:05:04 +00:00
|
|
|
# if defined(CRYPTOPP_GNU_STYLE_INLINE_ASSEMBLY)
|
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
// longjmp and clobber warnings. Volatile is required.
|
|
|
|
// http://github.com/weidai11/cryptopp/issues/24 and http://stackoverflow.com/q/7721854
|
|
|
|
volatile int result = true;
|
|
|
|
|
|
|
|
volatile SigHandler oldHandler = signal(SIGILL, SigIllHandler);
|
|
|
|
if (oldHandler == SIG_ERR)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
volatile sigset_t oldMask;
|
|
|
|
if (sigprocmask(0, NULLPTR, (sigset_t*)&oldMask))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (setjmp(s_jmpSIGILL))
|
|
|
|
result = false;
|
|
|
|
else
|
|
|
|
{
|
|
|
|
byte key[16] = {0xA0, 0xFA, 0xFE, 0x17, 0x88, 0x54, 0x2c, 0xb1,
|
|
|
|
0x23, 0xa3, 0x39, 0x39, 0x2a, 0x6c, 0x76, 0x05};
|
|
|
|
byte state[16] = {0x19, 0x3d, 0xe3, 0xb3, 0xa0, 0xf4, 0xe2, 0x2b,
|
|
|
|
0x9a, 0xc6, 0x8d, 0x2a, 0xe9, 0xf8, 0x48, 0x08};
|
|
|
|
byte r[16] = {255}, z[16] = {};
|
|
|
|
|
|
|
|
uint8x16_p k = (uint8x16_p)VectorLoad(0, key);
|
|
|
|
uint8x16_p s = (uint8x16_p)VectorLoad(0, state);
|
|
|
|
s = VectorEncrypt(s, k);
|
|
|
|
s = VectorEncryptLast(s, k);
|
|
|
|
s = VectorDecrypt(s, k);
|
|
|
|
s = VectorDecryptLast(s, k);
|
|
|
|
VectorStore(s, r);
|
|
|
|
|
|
|
|
result = (0 != std::memcmp(r, z, 16));
|
|
|
|
}
|
|
|
|
|
|
|
|
sigprocmask(SIG_SETMASK, (sigset_t*)&oldMask, NULLPTR);
|
|
|
|
signal(SIGILL, oldHandler);
|
|
|
|
return result;
|
2017-09-11 07:05:04 +00:00
|
|
|
# endif
|
|
|
|
#else
|
2017-12-17 01:26:59 +00:00
|
|
|
return false;
|
2017-09-11 07:05:04 +00:00
|
|
|
#endif // CRYPTOPP_ALTIVEC_AVAILABLE
|
|
|
|
}
|
|
|
|
|
2017-09-22 12:58:50 +00:00
|
|
|
bool CPU_ProbeSHA256()
|
2017-09-11 07:05:04 +00:00
|
|
|
{
|
2017-09-20 01:08:37 +00:00
|
|
|
#if defined(CRYPTOPP_NO_CPU_FEATURE_PROBES)
|
2017-12-17 01:26:59 +00:00
|
|
|
return false;
|
2018-01-11 18:04:59 +00:00
|
|
|
#elif (CRYPTOPP_POWER8_AVAILABLE)
|
2017-09-11 07:05:04 +00:00
|
|
|
# if defined(CRYPTOPP_GNU_STYLE_INLINE_ASSEMBLY)
|
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
// longjmp and clobber warnings. Volatile is required.
|
|
|
|
// http://github.com/weidai11/cryptopp/issues/24 and http://stackoverflow.com/q/7721854
|
|
|
|
volatile int result = false;
|
|
|
|
|
|
|
|
volatile SigHandler oldHandler = signal(SIGILL, SigIllHandler);
|
|
|
|
if (oldHandler == SIG_ERR)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
volatile sigset_t oldMask;
|
|
|
|
if (sigprocmask(0, NULLPTR, (sigset_t*)&oldMask))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (setjmp(s_jmpSIGILL))
|
|
|
|
result = false;
|
|
|
|
else
|
|
|
|
{
|
|
|
|
byte r[16], z[16] = {0};
|
|
|
|
uint8x16_p x = ((uint8x16_p){0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0});
|
|
|
|
|
|
|
|
x = VectorSHA256<0,0>(x);
|
|
|
|
x = VectorSHA256<0,1>(x);
|
|
|
|
x = VectorSHA256<1,0>(x);
|
|
|
|
x = VectorSHA256<1,1>(x);
|
|
|
|
VectorStore(x, r);
|
|
|
|
|
2018-03-05 12:05:12 +00:00
|
|
|
result = (0 == std::memcmp(r, z, 16));
|
2017-12-17 01:26:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
sigprocmask(SIG_SETMASK, (sigset_t*)&oldMask, NULLPTR);
|
|
|
|
signal(SIGILL, oldHandler);
|
|
|
|
return result;
|
2017-09-11 07:05:04 +00:00
|
|
|
# endif
|
|
|
|
#else
|
2017-12-17 01:26:59 +00:00
|
|
|
return false;
|
2017-09-11 07:05:04 +00:00
|
|
|
#endif // CRYPTOPP_ALTIVEC_AVAILABLE
|
|
|
|
}
|
|
|
|
|
2017-09-22 12:58:50 +00:00
|
|
|
bool CPU_ProbeSHA512()
|
2017-09-11 07:05:04 +00:00
|
|
|
{
|
2017-09-20 01:08:37 +00:00
|
|
|
#if defined(CRYPTOPP_NO_CPU_FEATURE_PROBES)
|
2017-12-17 01:26:59 +00:00
|
|
|
return false;
|
2018-01-11 18:04:59 +00:00
|
|
|
#elif (CRYPTOPP_POWER8_AVAILABLE)
|
2017-09-11 07:05:04 +00:00
|
|
|
# if defined(CRYPTOPP_GNU_STYLE_INLINE_ASSEMBLY)
|
|
|
|
|
2017-12-17 01:26:59 +00:00
|
|
|
// longjmp and clobber warnings. Volatile is required.
|
|
|
|
// http://github.com/weidai11/cryptopp/issues/24 and http://stackoverflow.com/q/7721854
|
|
|
|
volatile int result = false;
|
|
|
|
|
|
|
|
volatile SigHandler oldHandler = signal(SIGILL, SigIllHandler);
|
|
|
|
if (oldHandler == SIG_ERR)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
volatile sigset_t oldMask;
|
|
|
|
if (sigprocmask(0, NULLPTR, (sigset_t*)&oldMask))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
if (setjmp(s_jmpSIGILL))
|
|
|
|
result = false;
|
|
|
|
else
|
|
|
|
{
|
|
|
|
byte r[16], z[16] = {0};
|
|
|
|
uint8x16_p x = ((uint8x16_p){0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0});
|
|
|
|
|
|
|
|
x = VectorSHA512<0,0>(x);
|
|
|
|
x = VectorSHA512<0,1>(x);
|
|
|
|
x = VectorSHA512<1,0>(x);
|
|
|
|
x = VectorSHA512<1,1>(x);
|
|
|
|
VectorStore(x, r);
|
|
|
|
|
2018-03-05 12:05:12 +00:00
|
|
|
result = (0 == std::memcmp(r, z, 16));
|
2017-12-17 01:26:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
sigprocmask(SIG_SETMASK, (sigset_t*)&oldMask, NULLPTR);
|
|
|
|
signal(SIGILL, oldHandler);
|
|
|
|
return result;
|
2017-09-11 07:05:04 +00:00
|
|
|
# endif
|
|
|
|
#else
|
2017-12-17 01:26:59 +00:00
|
|
|
return false;
|
2018-01-11 18:04:59 +00:00
|
|
|
#endif // CRYPTOPP_POWER8_AVAILABLE
|
2017-09-11 07:05:04 +00:00
|
|
|
}
|
2017-09-12 09:49:38 +00:00
|
|
|
# endif // CRYPTOPP_BOOL_PPC32 || CRYPTOPP_BOOL_PPC64
|
2017-09-11 07:05:04 +00:00
|
|
|
NAMESPACE_END
|