| 
						
					 | 
					
						
						
							
						
						e61fed87db
					 | 
					
						
						
							
							SteepestDescentGaugeFix now exits when the algorithm does not converge.
						
						
						
						
						
						
						
						This behaviour can be altered by setting err_on_no_converge to false. 
						
						
					 | 
					
						2022-04-20 15:41:55 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						605cf401e1
					 | 
					
						
						
							
							Merge branch 'feature/sumd-npr' into develop
						
						
						
						
						
						
					 | 
					
						2022-03-16 22:43:12 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						f99c3660d2
					 | 
					
						
						
							
							Merge branch 'feature/cpu-threaded-smp' into develop
						
						
						
						
						
						
					 | 
					
						2022-03-16 22:07:54 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						92a83a9eb3
					 | 
					
						
						
							
							Performance improve for Tesseract
						
						
						
						
						
						
					 | 
					
						2022-03-16 17:14:36 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						b615fa0f35
					 | 
					
						
						
							
							Merge pull request #388 from fjosw/feature/sumd-npr
						
						
						
						
						
						
						
						Feature/sumd npr 
						
						
					 | 
					
						2022-03-15 09:05:57 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						d1decee4cc
					 | 
					
						
						
							
							Cleaned up unused variables in Lattice_reduction_gpu.h
						
						
						
						
						
						
					 | 
					
						2022-03-02 16:54:23 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						d4ae71b880
					 | 
					
						
						
							
							sum_gpu_large and sum_gpu templates added.
						
						
						
						
						
						
					 | 
					
						2022-03-02 15:40:18 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						e16fc5b2e4
					 | 
					
						
						
							
							Threaded intranode comms transfer - ideally between NUMA domains
						
						
						
						
						
						
					 | 
					
						2022-03-01 11:17:24 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						694306f202
					 | 
					
						
						
							
							Configure for mac arm
						
						
						
						
						
						
					 | 
					
						2022-03-01 10:53:44 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						9aac1e6d64
					 | 
					
						
						
							
							Merge branch 'develop' into feature/sumd-npr
						
						
						
						
						
						
					 | 
					
						2022-03-01 10:51:38 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						3e882f555d
					 | 
					
						
						
							
							Large / small sumD options
						
						
						
						
						
						
					 | 
					
						2022-03-01 08:54:45 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						63dbaeefaa
					 | 
					
						
						
							
							Extra barrier prior to finalize just in case it fixes an issue on Tursa
						
						
						
						
						
						
					 | 
					
						2022-02-16 14:01:43 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						e8c187b323
					 | 
					
						
						
							
							SyCL happier?
						
						
						
						
						
						
					 | 
					
						2022-02-15 11:24:38 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						0c1618197f
					 | 
					
						
						
							
							Faster intranode MPI works now
						
						
						
						
						
						
					 | 
					
						2022-02-15 08:52:07 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						f49d5c2d22
					 | 
					
						
						
							
							Updated scripts for crusher
						
						
						
						
						
						
					 | 
					
						2022-02-14 17:55:16 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						a3b022d469
					 | 
					
						
						
							
							Crusher compile
						
						
						
						
						
						
					 | 
					
						2022-02-14 15:09:08 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						48772f0976
					 | 
					
						
						
							
							Merge pull request #384 from jdmaia/hip_launchbounds
						
						
						
						
						
						
						
						Changing thread block order and adding launch_bounds 
						
						
					 | 
					
						2022-02-14 11:08:28 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						c322420580
					 | 
					
						
						
							
							Dont instantiate an Nc=3 and non-GP hardwired code for other implementations
						
						
						
						
						
						
					 | 
					
						2022-02-14 16:04:08 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Julio Maia
							
						 
					 | 
					
						
						
							
						
						86f4e17928
					 | 
					
						
						
							
							Changing thread block order and adding launch_bounds
						
						
						
						
						
						
					 | 
					
						2022-02-07 11:29:37 -06:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						215df671be
					 | 
					
						
						
							
							Merge pull request #382 from DanielRichtmann/feature/compact-clover
						
						
						
						
						
						
						
						Compact Clover Fermions 
						
						
					 | 
					
						2022-02-01 21:45:38 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Daniel Richtmann
							
						 
					 | 
					
						
						
							
						
						1b6b12589f
					 | 
					
						
						
							
							Get splitting up into implementation and instantiation files correct
						
						
						
						
						
						
					 | 
					
						2022-02-02 00:51:11 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Daniel Richtmann
							
						 
					 | 
					
						
						
							
						
						3082ab8252
					 | 
					
						
						
							
							Check in compact version of wilson clover fermions
						
						
						
						
						
						
					 | 
					
						2022-02-02 00:50:05 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Daniel Richtmann
							
						 
					 | 
					
						
						
							
						
						add86cd7f4
					 | 
					
						
						
							
							Abandon ET for clover application, use construct similar to multLink
						
						
						
						
						
						
					 | 
					
						2022-02-01 23:09:06 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Daniel Richtmann
							
						 
					 | 
					
						
						
							
						
						0b6fd20c54
					 | 
					
						
						
							
							Enable memory coalescing in clover term generation
						
						
						
						
						
						
					 | 
					
						2022-02-01 23:09:06 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Daniel Richtmann
							
						 
					 | 
					
						
						
							
						
						e83423fee6
					 | 
					
						
						
							
							Refactor clover to align with other files and prepare for upcoming changes
						
						
						
						
						
						
					 | 
					
						2022-02-01 23:09:06 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Daniel Richtmann
							
						 
					 | 
					
						
						
							
						
						b4f8e87982
					 | 
					
						
						
							
							Have Grid's cli interface understand floats
						
						
						
						
						
						
					 | 
					
						2022-02-01 23:09:06 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						135808dcfa
					 | 
					
						
						
							
							Less verbose
						
						
						
						
						
						
					 | 
					
						2021-12-07 16:24:24 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						7f7d06d963
					 | 
					
						
						
							
							Merge branch 'develop' of https://github.com/paboyle/Grid into develop
						
						
						
						
						
						
					 | 
					
						2021-12-07 09:06:42 -08:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						2bf3b4d576
					 | 
					
						
						
							
							Update to reduce memory footpring in benchmark test
						
						
						
						
						
						
					 | 
					
						2021-12-07 09:02:02 -08:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						f34d34bd17
					 | 
					
						
						
							
							2 nodes
						
						
						
						
						
						
					 | 
					
						2021-11-22 22:27:16 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						e32d5141b4
					 | 
					
						
						
							
							Updated to make MPI reliable still gives good perf, but MPI will be slow
						
						
						
						
						
						
						
						intranode 
						
						
					 | 
					
						2021-11-22 21:46:31 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						6d5277f2d7
					 | 
					
						
						
							
							Update to Spock
						
						
						
						
						
						
					 | 
					
						2021-11-22 20:58:02 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						14d82777e0
					 | 
					
						
						
							
							Best modules for spock
						
						
						
						
						
						
					 | 
					
						2021-11-22 20:47:16 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						2a4e739513
					 | 
					
						
						
							
							Enable XGMI copy (need to rename nvlink to cover NVLINK/XGMI/XeLink)
						
						
						
						
						
						
					 | 
					
						2021-11-22 20:46:09 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						8079dc2a14
					 | 
					
						
						
							
							Cray MPI not working right yet
						
						
						
						
						
						
					 | 
					
						2021-11-22 20:45:44 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						6ceb556684
					 | 
					
						
						
							
							Intranode asynch hipMemCopy
						
						
						
						
						
						
					 | 
					
						2021-11-22 20:45:12 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						76cde73705
					 | 
					
						
						
							
							HIP improvements on messaging and intranode hipMemCopyAsynch
						
						
						
						
						
						
					 | 
					
						2021-11-22 20:44:39 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						cc094366a9
					 | 
					
						
						
							
							Merge pull request #375 from JPRichings/develop
						
						
						
						
						
						
						
						Lattice object ACCcache probe 
						
						
					 | 
					
						2021-11-09 18:19:32 -05:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						41a575ff9b
					 | 
					
						
						
							
							Format edit
						
						
						
						
						
						
					 | 
					
						2021-11-09 21:56:23 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						12ef413065
					 | 
					
						
						
							
							fix to deflation.h
						
						
						
						
						
						
					 | 
					
						2021-11-09 21:20:36 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						829a328451
					 | 
					
						
						
							
							remove deflation timing
						
						
						
						
						
						
					 | 
					
						2021-11-09 20:46:57 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						402523c62e
					 | 
					
						
						
							
							Merge branch 'develop' of https://github.com/paboyle/Grid into develop
						
						
						
						
						
						
					 | 
					
						2021-11-09 12:57:40 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						d7bef70b5c
					 | 
					
						
						
							
							Helper functions to allow probe of cache state of lattice objects.
						
						
						
						
						
						
					 | 
					
						2021-11-09 12:57:09 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						2ad1811642
					 | 
					
						
						
							
							Added timing to deflation code.
						
						
						
						
						
						
					 | 
					
						2021-11-09 12:33:25 +00:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						a65a497bae
					 | 
					
						
						
							
							Merge branch 'develop' of github.com:paboyle/Grid into develop
						
						
						
						
						
						
					 | 
					
						2021-10-29 13:01:34 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						b27b12828e
					 | 
					
						
						
							
							reverse previous "fix", missing statement was probably intentional, added a comment to that effect
						
						
						
						
						
						
					 | 
					
						2021-10-29 13:01:31 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						42d56ea6b6
					 | 
					
						
						
							
							Verbosity
						
						
						
						
						
						
					 | 
					
						2021-10-29 02:23:08 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						0b905a72dd
					 | 
					
						
						
							
							Better reduction for GPUs
						
						
						
						
						
						
					 | 
					
						2021-10-29 02:22:22 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						fe9edf8526
					 | 
					
						
						
							
							Merge branch 'develop' of https://www.github.com/paboyle/Grid into develop
						
						
						
						
						
						
					 | 
					
						2021-10-29 02:03:27 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						44204c7e06
					 | 
					
						
						
							
							Extra code
						
						
						
						
						
						
					 | 
					
						2021-10-29 02:02:56 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 |