mirror of
https://github.com/paboyle/Grid.git
synced 2025-06-12 20:27:06 +01:00
Typo fixes and rotate for CLANG
This commit is contained in:
@ -41,6 +41,16 @@ Author: paboyle <paboyle@ph.ed.ac.uk>
|
|||||||
|
|
||||||
namespace Grid{
|
namespace Grid{
|
||||||
namespace Optimization {
|
namespace Optimization {
|
||||||
|
|
||||||
|
union u512f { // Two views of the same storage: one __m512 vector or 16 individual floats.
|
||||||
|
__m512 v; // Whole-vector view, as used with the AVX-512 intrinsics.
|
||||||
|
float f[16]; // Element view; writing v then reading f[] relies on compiler-supported union punning. NOTE(review): presumably used for per-lane access in the CLANG fallback paths - confirm against callers.
|
||||||
|
};
|
||||||
|
|
||||||
|
union u512d { // Two views of the same storage: one __m512d vector or 8 individual doubles.
|
||||||
|
__m512d v; // Whole-vector view, as used with the AVX-512 intrinsics.
|
||||||
|
double f[8]; // Element view; writing v then reading f[] relies on compiler-supported union punning. NOTE(review): presumably used for per-lane access in the CLANG fallback paths - confirm against callers.
|
||||||
|
};
|
||||||
|
|
||||||
struct Vsplat{
|
struct Vsplat{
|
||||||
//Complex float
|
//Complex float
|
||||||
@ -361,7 +371,7 @@ namespace Optimization {
|
|||||||
// Some Template specialization
|
// Some Template specialization
|
||||||
|
|
||||||
// Hack for CLANG until _mm512_reduce_add_ps etc. are implemented in GCC and Clang releases
|
// Hack for CLANG until _mm512_reduce_add_ps etc. are implemented in GCC and Clang releases
|
||||||
#undef GNU_CLANG_COMPILER
|
#define GNU_CLANG_COMPILER
|
||||||
#ifdef GNU_CLANG_COMPILER
|
#ifdef GNU_CLANG_COMPILER
|
||||||
//Complex float Reduce
|
//Complex float Reduce
|
||||||
template<>
|
template<>
|
||||||
|
@ -53,7 +53,7 @@ Author: paboyle <paboyle@ph.ed.ac.uk>
|
|||||||
|
|
||||||
#define ZMULMEM2SPd(O,P,tmp,B,C,Briir,Biirr,Criir,Ciirr)\
|
#define ZMULMEM2SPd(O,P,tmp,B,C,Briir,Biirr,Criir,Ciirr)\
|
||||||
VSHUFMEMd(O,P,tmp) \
|
VSHUFMEMd(O,P,tmp) \
|
||||||
VMULMEMd(O,P,B,Biirr) \
|
VMULMEMd(O,P,B,Biirr) \
|
||||||
VMULMEMd(O,P,C,Ciirr) \
|
VMULMEMd(O,P,C,Ciirr) \
|
||||||
VMULd(tmp,B,Briir) \
|
VMULd(tmp,B,Briir) \
|
||||||
VMULd(tmp,C,Criir)
|
VMULd(tmp,C,Criir)
|
||||||
|
@ -37,7 +37,7 @@ Author: paboyle <paboyle@ph.ed.ac.uk>
|
|||||||
// Opcodes common
|
// Opcodes common
|
||||||
////////////////////////////////////////////////////////////////////////////////////////////////////
|
////////////////////////////////////////////////////////////////////////////////////////////////////
|
||||||
#define MASK_REGS \
|
#define MASK_REGS \
|
||||||
__asm__ ("mov $0xAAAA, %%eax \n"\
|
__asm__ ("mov $0xAAAA, %%eax \n"\
|
||||||
"kmovw %%eax, %%k6 \n"\
|
"kmovw %%eax, %%k6 \n"\
|
||||||
"mov $0x5555, %%eax \n"\
|
"mov $0x5555, %%eax \n"\
|
||||||
"kmovw %%eax, %%k7 \n" : : : "%eax");
|
"kmovw %%eax, %%k7 \n" : : : "%eax");
|
||||||
|
Reference in New Issue
Block a user