Peter Boyle
							
						 
					 | 
					
						
						
							
						
						a4afc3ea2a
					 | 
					
						
						
							
							Red black coarse space
						
						
						
						
						
						
							
						
					 | 
					
						2021-01-14 20:44:16 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						3fe75bc7cb
					 | 
					
						
						
							
							Merge pull request #329 from nmeyer-ur/feature/a64fx-3
						
						
						
						
						
						
						
						Revised dslash/dwf kernels for A64FX 
						
						
							
						
					 | 
					
						2020-12-20 08:17:15 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Nils Meyer
							
						 
					 | 
					
						
						
							
						
						45d49d8648
					 | 
					
						
						
							
							clean up
						
						
						
						
						
						
							
						
					 | 
					
						2020-12-19 03:35:18 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Nils Meyer
							
						 
					 | 
					
						
						
							
						
						6013183361
					 | 
					
						
						
							
							removed Asm impls
						
						
						
						
						
						
							
						
					 | 
					
						2020-12-19 03:25:01 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Nils Meyer
							
						 
					 | 
					
						
						
							
						
						4b882e8056
					 | 
					
						
						
							
							fixed lost bracket
						
						
						
						
						
						
							
						
					 | 
					
						2020-12-19 03:09:20 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Nils Meyer
							
						 
					 | 
					
						
						
							
						
						3f9ae6e7e7
					 | 
					
						
						
							
							Merge branch 'develop' into feature/a64fx-3
						
						
						
						
						
						
							
						
					 | 
					
						2020-12-19 02:37:11 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Nils Meyer
							
						 
					 | 
					
						
						
							
						
						909acd55cd
					 | 
					
						
						
							
							vnum variant for prefetches
						
						
						
						
						
						
							
						
					 | 
					
						2020-12-19 02:00:22 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Nils Meyer
							
						 
					 | 
					
						
						
							
						
						4dd9e39e0d
					 | 
					
						
						
							
							up to +36% performance gain for dslash/dwf on QPACE 4 using GCC 10.1.1
						
						
						
						
						
						
							
						
					 | 
					
						2020-12-19 00:54:31 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						7adb253e25
					 | 
					
						
						
							
							Merge pull request #328 from mmphys/feature/mrespatch
						
						
						
						
						
						
						
						Enable existing conserved current code for CUDA 
						
						
							
						
					 | 
					
						2020-12-17 11:10:29 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Michael Marshall
							
						 
					 | 
					
						
						
							
						
						873519e960
					 | 
					
						
						
							
							Enable existing conserved current code for CUDA (compiles OK for CUDA 10.1). Add option to Test_cayley_mres to load a configuration
						
						
						
						
						
						
							
						
					 | 
					
						2020-12-14 16:06:10 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						9aec4a3c26
					 | 
					
						
						
							
							SYCL
						
						
						
						
						
						
							
						
					 | 
					
						2020-12-10 02:11:17 -08:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						70510d151b
					 | 
					
						
						
							
							Merge pull request #327 from paboyle/feature/gparity_twist_GPU
						
						
						
						
						
						
						
						Feature/gparity twist gpu 
						
						
							
						
					 | 
					
						2020-12-07 12:02:20 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christopher Kelly
							
						 
					 | 
					
						
						
							
						
						9e7bacb5a4
					 | 
					
						
						
							
							Merge branch 'develop' into feature/gparity_twist_GPU
						
						
						
						
						
						
							
						
					 | 
					
						2020-12-07 11:55:39 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christopher Kelly
							
						 
					 | 
					
						
						
							
						
						2ef1fa66a8
					 | 
					
						
						
							
							Improved performance of G-parity kernel for GPUs by simplifying multLink implementation
						
						
						
						
						
						
							
						
					 | 
					
						2020-12-07 11:53:35 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						cf76741ec6
					 | 
					
						
						
							
							Intel DPCPP Gold happy now (compiles all, runs Benchmark_dwf_fp32 )
						
						
						
						
						
						
							
						
					 | 
					
						2020-12-03 03:47:11 -08:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						497e7c1c40
					 | 
					
						
						
							
							Duplicate code
						
						
						
						
						
						
							
						
					 | 
					
						2020-12-02 17:55:30 -08:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						888eacd3b8
					 | 
					
						
						
							
							Merge branch 'develop' of https://github.com/paboyle/Grid into develop
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-24 21:46:33 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						321f0f51b5
					 | 
					
						
						
							
							Project to SU(N)
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-24 21:46:10 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						30ad9578a2
					 | 
					
						
						
							
							Merge branch 'lehner-feature/gpt' into develop
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-24 06:10:24 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						9dce101586
					 | 
					
						
						
							
							Merge branch 'feature/gpt' of https://github.com/lehner/Grid into lehner-feature/gpt
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-24 06:10:16 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						97e264d0ff
					 | 
					
						
						
							
							Christoph's changes
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-23 15:46:11 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						683a5e5bf5
					 | 
					
						
						
							
							Stencil use host vector for integer table on enable-shared=no and mirror it on device
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-23 15:39:51 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						d4861a362c
					 | 
					
						
						
							
							Stencil use non-UVM memory for look up table on enable-shared=no
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-23 15:38:49 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						5ff3eae027
					 | 
					
						
						
							
							Merge branch 'develop' of https://github.com/paboyle/Grid into develop
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-20 13:14:44 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						147dc15d26
					 | 
					
						
						
							
							Update
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-20 13:13:59 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christoph Lehner
							
						 
					 | 
					
						
						
							
						
						c61ea72949
					 | 
					
						
						
							
							Merge pull request #19 from paboyle/develop
						
						
						
						
						
						
						
						Sync 
						
						
							
						
					 | 
					
						2020-11-20 17:31:13 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						86e8b9fe38
					 | 
					
						
						
							
							ALLOC_ALIGN removed
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-20 17:07:16 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						612e468889
					 | 
					
						
						
							
							Configurable ALLOC_ALIGN and ALLOC_CACHE
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-20 16:48:28 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christoph Lehner
							
						 
					 | 
					
						
						
							
						
						4ea8d128c2
					 | 
					
						
						
							
							Merge pull request #18 from paboyle/develop
						
						
						
						
						
						
						
						Sync 
						
						
							
						
					 | 
					
						2020-11-20 15:36:50 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						e49b7f2f88
					 | 
					
						
						
							
							Merge branch 'develop' of https://github.com/paboyle/Grid into develop
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-19 19:24:41 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						aace3d47b9
					 | 
					
						
						
							
							partial work in progress
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-19 19:24:14 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						d5049949a4
					 | 
					
						
						
							
							Starting to fix reunitarise
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-19 19:23:41 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						f1c7480e3c
					 | 
					
						
						
							
							Warning remove
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-19 19:23:03 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						5adae5d6ff
					 | 
					
						
						
							
							Unused variable remove
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-19 19:22:12 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						a8412ace05
					 | 
					
						
						
							
							Merge pull request #317 from i-kanamori/develop
						
						
						
						
						
						
						
						adding an error check for input: Parameters.StartingType 
						
						
							
						
					 | 
					
						2020-11-18 23:09:40 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						9fd1c2ad4b
					 | 
					
						
						
							
							Merge pull request #325 from DanielRichtmann/feature/threaded-clover-inversion
						
						
						
						
						
						
						
						Threaded clover term inversion 
						
						
							
						
					 | 
					
						2020-11-18 23:08:37 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						4cf3575353
					 | 
					
						
						
							
							Merge branch 'develop' of https://github.com/paboyle/Grid into develop
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-18 03:07:36 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						804a810d68
					 | 
					
						
						
							
							Wildcard mismatch
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-18 03:06:53 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						8fcb392e24
					 | 
					
						
						
							
							Merge branch 'develop' of https://github.com/paboyle/Grid into develop
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-17 04:51:31 -08:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						dd8d70eeff
					 | 
					
						
						
							
							Build without LIME
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-17 04:41:15 -08:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						aa8aba6543
					 | 
					
						
						
							
							--shm-force-mpi
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-16 20:15:50 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						13df14f96e
					 | 
					
						
						
							
							Switch off SHM paths with --disable-shm
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-16 18:07:15 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						3aab983760
					 | 
					
						
						
							
							Flop count set as in DiRAC-ITT-2020 (mistakenly 20% low, but must maintain consistency)
						
						
						
						
						
						
							
 DiRAC-ITT-2020-UCX-WORKAROUND
						
					 | 
					
						2020-11-16 17:13:58 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						9c4dcc5ea3
					 | 
					
						
						
							
							Merge branch 'master' into develop
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-16 16:34:57 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						a1063ddbb9
					 | 
					
						
						
							
							Update options and simplify
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-13 04:11:03 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						18ef8056ec
					 | 
					
						
						
							
							Hide Shared Memory
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-13 04:10:40 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						1c673977fa
					 | 
					
						
						
							
							Must ask for COMMS_THREADS
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-13 03:59:36 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						e9bc748828
					 | 
					
						
						
							
							Useful GPU machine benchmark for GDR used to shakeout Booster at Juelich - see slack earlyaccess channel
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-13 03:58:34 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						f48156529b
					 | 
					
						
						
							
							Work on 2,2,2,8 ranks
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-13 03:57:58 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						d05ce01809
					 | 
					
						
						
							
							TOFU behaviour now optional THREAD_MULTIPLE or THREAD_SERIALIZED
						
						
						
						
						
						
							
						
					 | 
					
						2020-11-13 03:52:19 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 |