From 87acd06990090acae4f19ae147ca794d243764f5 Mon Sep 17 00:00:00 2001 From: paboyle Date: Mon, 26 Sep 2016 10:11:34 +0100 Subject: [PATCH] Use streaming stores --- lib/simd/Intel512common.h | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/lib/simd/Intel512common.h b/lib/simd/Intel512common.h index dabbf6d8..74793638 100644 --- a/lib/simd/Intel512common.h +++ b/lib/simd/Intel512common.h @@ -139,8 +139,8 @@ Author: paboyle #define ZLOADd(OFF,PTR,ri,ir) VLOADd(OFF,PTR,ir) VSHUFd(ir,ri) -#define VSTOREf(OFF,PTR,SRC) "vmovaps " #SRC "," #OFF "*64(" #PTR ")" ";\n" -#define VSTOREd(OFF,PTR,SRC) "vmovapd " #SRC "," #OFF "*64(" #PTR ")" ";\n" +#define VSTOREf(OFF,PTR,SRC) "vmovntps " #SRC "," #OFF "*64(" #PTR ")" ";\n" +#define VSTOREd(OFF,PTR,SRC) "vmovntpd " #SRC "," #OFF "*64(" #PTR ")" ";\n" // Swaps Re/Im ; could unify this with IMCI #define VSHUFd(A,DEST) "vpshufd $0x4e," #A "," #DEST ";\n"