1
0
mirror of https://github.com/paboyle/Grid.git synced 2025-10-26 09:39:34 +00:00

revised sU addressing scheme

This commit is contained in:
nmeyer-ur
2020-04-09 14:44:25 +02:00
parent 9f224a1647
commit 326de36467
4 changed files with 4 additions and 4 deletions

View File

@@ -283,7 +283,7 @@ asm ( \
// MULT_2SPIN
#define MULT_2SPIN_A64FXd(A) \
{ \
-const auto & ref(U[sU][A]); \
+const auto & ref(U[sU](A)); \
asm ( \
"ld1d { z24.d }, p5/z, [%[fetchptr], -6, mul vl] \n\t" \
"ld1d { z25.d }, p5/z, [%[fetchptr], -3, mul vl] \n\t" \

View File

@@ -295,7 +295,7 @@ asm ( \
// MULT_2SPIN
#define MULT_2SPIN_A64FXf(A) \
{ \
-const auto & ref(U[sU][A]); \
+const auto & ref(U[sU](A)); \
asm ( \
"ld1d { z24.f }, p5/z, [%[fetchptr], -6, mul vl] \n\t" \
"ld1d { z25.f }, p5/z, [%[fetchptr], -3, mul vl] \n\t" \

View File

@@ -261,7 +261,7 @@ Author: Nils Meyer <nils.meyer@ur.de>
// MULT_2SPIN
#define MULT_2SPIN_A64FXd(A) \
{ \
-const auto & ref(U[sU][A]); \
+const auto & ref(U[sU](A)); \
U_00 = svld1(pg1, (float64_t*)((uint64_t)&ref[2][0] + -6 * 64)); \
U_10 = svld1(pg1, (float64_t*)((uint64_t)&ref[2][0] + -3 * 64)); \
U_20 = svld1(pg1, (float64_t*)((uint64_t)&ref[2][0] + 0 * 64)); \

View File

@@ -268,7 +268,7 @@ Author: Nils Meyer <nils.meyer@ur.de>
// MULT_2SPIN
#define MULT_2SPIN_A64FXf(A) \
{ \
-const auto & ref(U[sU][A]); \
+const auto & ref(U[sU](A)); \
U_00 = svld1(pg1, (float32_t*)((uint64_t)&ref[2][0] + -6 * 64)); \
U_10 = svld1(pg1, (float32_t*)((uint64_t)&ref[2][0] + -3 * 64)); \
U_20 = svld1(pg1, (float32_t*)((uint64_t)&ref[2][0] + 0 * 64)); \