nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						5abec5b8a9
					 | 
					
						
						
							
							SVE_readme update, update Grid_vector_types.h
						
						
						
						
						
						
					 | 
					
						2020-04-25 13:48:26 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						499edc0636
					 | 
					
						
						
							
							updated SVE_README.txt; defined ARMCLANGCOMPAT macro
						
						
						
						
						
						
					 | 
					
						2020-04-25 13:41:24 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						d990e61be3
					 | 
					
						
						
							
							armclang 20.1 settings in SVE readme
						
						
						
						
						
						
					 | 
					
						2020-04-25 12:11:43 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						3edb2dc2da
					 | 
					
						
						
							
							removed -static from gcc CXXFLAGS
						
						
						
						
						
						
					 | 
					
						2020-04-24 13:04:34 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christoph Lehner
							
						 
					 | 
					
						
						
							
						
						f1fe444d4f
					 | 
					
						
						
							
							blocked precision promotion infrastructure upgrade
						
						
						
						
						
						
					 | 
					
						2020-04-24 06:27:20 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						345721220e
					 | 
					
						
						
							
							resolved merge conflict
						
						
						
						
						
						
					 | 
					
						2020-04-24 10:14:21 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						6db68d6ecb
					 | 
					
						
						
							
							added SVE configure for armclang and gcc
						
						
						
						
						
						
					 | 
					
						2020-04-24 10:10:47 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						dae820aa96
					 | 
					
						
						
							
							Merge pull request #277 from mmphys/bugfix/grid-config
						
						
						
						
						
						
						
						Bugfix/grid config 
						
						
					 | 
					
						2020-04-23 10:26:54 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Michael Marshall
							
						 
					 | 
					
						
						
							
						
						5daf176f4a
					 | 
					
						
						
							
							Updated to expose GRID_CXXLD in addition to CXXLD.
						
						
						
						
						
						
						
						NB: CXXLD required as this is what drives linking behaviour. 
						
						
					 | 
					
						2020-04-23 15:25:53 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Michael Marshall
							
						 
					 | 
					
						
						
							
						
						e96c86ec14
					 | 
					
						
						
							
							Make grid-config message more specific for --cxx and --cxxld
						
						
						
						
						
						
					 | 
					
						2020-04-23 13:10:45 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						09f0963d1f
					 | 
					
						
						
							
							changes in configure.ac ; to be verified
						
						
						
						
						
						
					 | 
					
						2020-04-23 11:27:03 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						6f44e3c192
					 | 
					
						
						
							
							reverted changes in configure.ac ; included SVE configure readme
						
						
						
						
						
						
					 | 
					
						2020-04-23 11:18:50 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						c2c3cad20d
					 | 
					
						
						
							
							Merge branch 'develop' of https://github.com/paboyle/Grid into develop
						
						
						
						
						
						
					 | 
					
						2020-04-23 04:35:42 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						edec9ee2e2
					 | 
					
						
						
							
							Conserved current rewrite done. Zmobius working
						
						
						
						
						
						
					 | 
					
						2020-04-23 04:34:01 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						ed70cce542
					 | 
					
						
						
							
							Test for 5D DWF obserevables
						
						
						
						
						
						
					 | 
					
						2020-04-23 04:29:45 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Michael Marshall
							
						 
					 | 
					
						
						
							
						
						4701201b5f
					 | 
					
						
						
							
							grid-config: Expose CXXLD (for GPU build) and update help
						
						
						
						
						
						
					 | 
					
						2020-04-22 18:42:30 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						5893888f87
					 | 
					
						
						
							
							removed default no-strict-aliasing for gcc-10.0.1 exclusively
						
						
						
						
						
						
					 | 
					
						2020-04-22 19:29:55 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						39b448affb
					 | 
					
						
						
							
							Merge remote-tracking branch 'origin/develop' into feature/a64fx-2
						
						
						
						
						
						
					 | 
					
						2020-04-22 17:34:12 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						e54a8f05a9
					 | 
					
						
						
							
							Exchange1 with generic version for now, should use svtbl2 in final version
						
						
						
						
						
						
					 | 
					
						2020-04-20 22:45:27 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						0782b76ed4
					 | 
					
						
						
							
							Merge pull request #274 from paboyle/feature/zmobius_paramcompute
						
						
						
						
						
						
						
						ZMobius parameter computation 
						
						
					 | 
					
						2020-04-20 14:39:29 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christopher Kelly
							
						 
					 | 
					
						
						
							
						
						0896f2cead
					 | 
					
						
						
							
							Added missing include guards in bigfloat_double.h
						
						
						
						
						
						
					 | 
					
						2020-04-20 10:30:38 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christopher Kelly
							
						 
					 | 
					
						
						
							
						
						181709bba4
					 | 
					
						
						
							
							Merge branch 'develop' into feature/zmobius_paramcompute
						
						
						
						
						
						
					 | 
					
						2020-04-20 09:12:34 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						64b72fc17f
					 | 
					
						
						
							
							testing gcc 10.0.1: build errors in Exchange1 using -DA64FX and in Lattice_base.h building Dslash only
						
						
						
						
						
						
					 | 
					
						2020-04-19 01:25:40 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christoph Lehner
							
						 
					 | 
					
						
						
							
						
						091d5c605e
					 | 
					
						
						
							
							towards more precise blocking
						
						
						
						
						
						
					 | 
					
						2020-04-17 04:25:28 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						6fdce60492
					 | 
					
						
						
							
							revised BodyA64FX; 990 GiB/s Wilson, 687 GiB/s DW using intrinsics (armclang 20.0)
						
						
						
						
						
						
					 | 
					
						2020-04-16 22:43:32 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						90229cfb0f
					 | 
					
						
						
							
							Merge pull request #270 from milc-qcd/feature/CGinfo
						
						
						
						
						
						
						
						feature/CGinfo 
						
						
					 | 
					
						2020-04-16 11:46:08 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						0475c46ecb
					 | 
					
						
						
							
							Merge pull request #256 from djm2131/feature/BiCGSTAB
						
						
						
						
						
						
						
						Import BiCGSTAB solvers and tests 
						
						
					 | 
					
						2020-04-16 11:45:15 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						3cca10e617
					 | 
					
						
						
							
							Merge pull request #276 from nils-asmussen/fix/regression_nt
						
						
						
						
						
						
						
						fix regression in tests/core/Test_qed.cc 
						
						
					 | 
					
						2020-04-16 11:42:39 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christoph Lehner
							
						 
					 | 
					
						
						
							
						
						327da332bb
					 | 
					
						
						
							
							Merge branch 'develop' of https://github.com/paboyle/Grid into feature/gpt
						
						
						
						
						
						
					 | 
					
						2020-04-16 11:30:17 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						852db4626a
					 | 
					
						
						
							
							re-introduced HOTFIX cause Grid binaries give wrong results otherwise; checked in good gridverter.py
						
						
						
						
						
						
					 | 
					
						2020-04-15 18:22:19 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						43dc2814dd
					 | 
					
						
						
							
							fix regression in core/Test_qed.cc
						
						
						
						
						
						
					 | 
					
						2020-04-15 16:10:15 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						6504a098cc
					 | 
					
						
						
							
							999 GiB/s Wilson; 694 GiB/s DW (DP)
						
						
						
						
						
						
					 | 
					
						2020-04-15 15:06:52 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						79a385faca
					 | 
					
						
						
							
							disabled armclang hotfix cause armclang 20.0 performance gets a little
						
						
						
						
						
						
					 | 
					
						2020-04-15 11:46:55 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						c12a67030a
					 | 
					
						
						
							
							980 GiB/s Wilson; 680 GiB/s DW (DP)
						
						
						
						
						
						
					 | 
					
						2020-04-15 10:55:06 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						581392f2f2
					 | 
					
						
						
							
							now with pf, best results so far using intrinsics+pf
						
						
						
						
						
						
					 | 
					
						2020-04-12 22:06:14 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						113f277b6a
					 | 
					
						
						
							
							enable dslash asm using -DA64FXASM, additionaly -DDSLASHINTRIN for intrinsics impl
						
						
						
						
						
						
					 | 
					
						2020-04-11 04:55:01 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						f3a8d039a2
					 | 
					
						
						
							
							Merge branch 'feature/hdcr' into develop
						
						
						
						
						
						
					 | 
					
						2020-04-10 22:01:52 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nils meyer
							
						 
					 | 
					
						
						
							
						
						974586bedc
					 | 
					
						
						
							
							Dslash finally works; cleaned up; uses MOVPRFX in assembly
						
						
						
						
						
						
					 | 
					
						2020-04-10 22:26:40 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						4e864e56c9
					 | 
					
						
						
							
							develop pull
						
						
						
						
						
						
					 | 
					
						2020-04-10 17:19:18 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						014dbfa464
					 | 
					
						
						
							
							Compile fix with OpDirAll
						
						
						
						
						
						
					 | 
					
						2020-04-10 11:57:09 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						3b0e07882f
					 | 
					
						
						
							
							Adding another form of polynomial
						
						
						
						
						
						
					 | 
					
						2020-04-10 11:28:33 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						8e81a811d0
					 | 
					
						
						
							
							Merge branch 'feature/hdcr' into develop
						
						
						
						
						
						
					 | 
					
						2020-04-10 11:14:49 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						aa13118127
					 | 
					
						
						
							
							Missing conjugate already fixed in develop
						
						
						
						
						
						
					 | 
					
						2020-04-10 11:11:24 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						6cdb09c884
					 | 
					
						
						
							
							Faster copy region
						
						
						
						
						
						
					 | 
					
						2020-04-10 11:10:52 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						a65bc64f10
					 | 
					
						
						
							
							Accelerator peek poke
						
						
						
						
						
						
					 | 
					
						2020-04-10 11:09:59 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						11dec4883c
					 | 
					
						
						
							
							Don't throw assert
						
						
						
						
						
						
					 | 
					
						2020-04-10 11:09:11 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						afa458c812
					 | 
					
						
						
							
							Extra solvers
						
						
						
						
						
						
					 | 
					
						2020-04-10 11:08:19 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						dc50190b8f
					 | 
					
						
						
							
							Faster GPU basis rotation
						
						
						
						
						
						
						
						May need to later include Regensburg optimised CPU variant 
						
						
					 | 
					
						2020-04-10 11:06:04 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						160f78c1e4
					 | 
					
						
						
							
							changed debug output to variable direct 3
						
						
						
						
						
						
					 | 
					
						2020-04-10 12:23:07 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						7e4e1bbbc2
					 | 
					
						
						
							
							changed debug output to variable direct 2
						
						
						
						
						
						
					 | 
					
						2020-04-10 12:22:04 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 |