Peter Boyle 
							
						 
					 
					
						
						
							
						
						90130e25e9 
					 
					
						
						
							
							TODO list  
						
						
						
						
					 
					
						2023-03-23 10:27:02 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						23298acb81 
					 
					
						
						
							
							Merge pull request  #424  from giltirn/feature/dirichlet-precchange  
						
						... 
						
						
						
						Precision change implementation 
						
						
					 
					
						2023-03-22 23:04:52 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						52384e34cf 
					 
					
						
						
							
							Discard on construct  
						
						
						
						
					 
					
						2023-03-22 19:40:32 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						d0bb033ea2 
					 
					
						
						
							
							Device resident GPU block buffer instead of UVM as hit likely UVM  
						
						... 
						
						
						
						bug. Code worked on CUDA 11.4 but fails on later drivers (certainly 530.30.02, but need to
find the perlmutter driver version). 
						
						
					 
					
						2023-03-22 19:07:32 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						c6621806ca 
					 
					
						
						
							
							Compiling on laptop and running  
						
						
						
						
					 
					
						2023-03-21 17:27:09 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						0b6f0f6d2f 
					 
					
						
						
							
							Merge branch 'feature/dirichlet' of  https://www.github.com/paboyle/Grid  into feature/dirichlet  
						
						
						
						
					 
					
						2023-03-21 16:06:55 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						b5b759df73 
					 
					
						
						
							
							Merge branch 'develop' into feature/dirichlet  
						
						
						
						
					 
					
						2023-03-21 16:05:46 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						7db8dd7a95 
					 
					
						
						
							
							Merge branch 'feature/dirichlet' of  https://github.com/paboyle/Grid  into feature/dirichlet  
						
						
						
						
					 
					
						2023-03-21 16:04:27 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						8b43be39c0 
					 
					
						
						
							
							Config command  
						
						
						
						
					 
					
						2023-03-21 16:00:52 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						f17f879206 
					 
					
						
						
							
							Test update  
						
						
						
						
					 
					
						2023-03-21 15:59:29 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						68428fceab 
					 
					
						
						
							
							Integrator update  
						
						
						
						
					 
					
						2023-03-21 15:58:49 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						4135f2dcd1 
					 
					
						
						
							
							Compressor  
						
						
						
						
					 
					
						2023-03-21 15:41:41 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						c5bdf61215 
					 
					
						
						
							
							Audit fix  
						
						
						
						
					 
					
						2023-03-21 15:38:39 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						88e218e8ee 
					 
					
						
						
							
							Stencil updates  
						
						
						
						
					 
					
						2023-03-21 15:37:58 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						0f2b786436 
					 
					
						
						
							
							Vector -> vector  
						
						
						
						
					 
					
						2023-03-21 15:36:11 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						e1c326558a 
					 
					
						
						
							
							Comms improvements  
						
						
						
						
					 
					
						2023-03-21 08:53:56 -07:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						bae0f8ea99 
					 
					
						
						
							
							Merge pull request  #425  from rrhodgson/feature/CacheLogging  
						
						... 
						
						
						
						Huge Cache 
						
						
					 
					
						2023-03-21 08:59:08 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						bbbcd36ae5 
					 
					
						
						
							
							Merge pull request  #426  from rrhodgson/feature/LCDeflation  
						
						... 
						
						
						
						Batched Local Coherence Tools 
						
						
					 
					
						2023-03-21 08:58:40 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						39c0815d9e 
					 
					
						
						
							
							WriteDiscard  
						
						
						
						
					 
					
						2023-03-21 08:57:29 -04:00 
						 
				 
			
				
					
						
							
							
								Alessandro Lupo 
							
						 
					 
					
						
						
							
						
						1b8176e2c0 
					 
					
						
						
							
							fix code duplication  
						
						
						
						
					 
					
						2023-03-17 14:58:00 +00:00 
						 
				 
			
				
					
						
							
							
								Alessandro Lupo 
							
						 
					 
					
						
						
							
						
						cbc053c3db 
					 
					
						
						
							
							Revert "projection on Sp2n algebra, to be used instead of Ta"  
						
						... 
						
						
						
						This reverts commit ba7f9d7b70 
						
						
					 
					
						2023-03-17 11:36:58 +00:00 
						 
				 
			
				
					
						
							
							
								Alessandro Lupo 
							
						 
					 
					
						
						
							
						
						cdf3f6ef6e 
					 
					
						
						
							
							Merge branch 'refactoring_sp2n' of  https://github.com/LupoA/Grid  into refactoring_sp2n  
						
						
						
						
					 
					
						2023-03-15 15:59:50 +00:00 
						 
				 
			
				
					
						
							
							
								Alessandro Lupo 
							
						 
					 
					
						
						
							
						
						ba7f9d7b70 
					 
					
						
						
							
							projection on Sp2n algebra, to be used instead of Ta  
						
						
						
						
					 
					
						2023-03-15 15:55:12 +00:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						a997d24743 
					 
					
						
						
							
							Remove nofma  
						
						
						
						
					 
					
						2023-03-14 12:10:31 -07:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						861e5d7f4c 
					 
					
						
						
							
							SYCL version update. Why do they keep making incompatible changes?  
						
						
						
						
					 
					
						2023-03-14 12:10:02 -07:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						14cc142a14 
					 
					
						
						
							
							Warning remove  
						
						
						
						
					 
					
						2023-03-14 12:09:26 -07:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						f36b87deb5 
					 
					
						
						
							
							syscall fix  
						
						
						
						
					 
					
						2023-03-14 12:09:00 -07:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						eeb6e0a6e3 
					 
					
						
						
							
							Re-enable cache blocking and efficient UPI type SHM comms  
						
						
						
						
					 
					
						2023-03-14 09:10:27 -07:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						cad5b187dd 
					 
					
						
						
							
							Cleanup  
						
						
						
						
					 
					
						2023-03-14 09:08:16 -07:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						87697eb07e 
					 
					
						
						
							
							Shared compile  
						
						
						
						
					 
					
						2023-03-14 09:07:36 -07:00 
						 
				 
			
				
					
						
							
							
								Alessandro Lupo 
							
						 
					 
					
						
						
							
						
						371fd123fb 
					 
					
						
						
							
							consequence of iSUnMatrix being no longer a member of the SU class  
						
						
						
						
					 
					
						2023-03-14 10:47:07 +00:00 
						 
				 
			
				
					
						
							
							
								Alessandro Lupo 
							
						 
					 
					
						
						
							
						
						d6ff644aab 
					 
					
						
						
							
							Towards the day all tests compile  
						
						
						
						
					 
					
						2023-03-14 10:43:25 +00:00 
						 
				 
			
				
					
						
							
							
								Julian Lenz 
							
						 
					 
					
						
						
							
						
						29586f6b5e 
					 
					
						
						
							
							Deactivate some tests for Nc!=3  
						
						
						
						
					 
					
						2023-03-13 08:17:14 +00:00 
						 
				 
			
				
					
						
							
							
								Alessandro Lupo 
							
						 
					 
					
						
						
							
						
						fd057c838f 
					 
					
						
						
							
							add ProjectOnGaugeGroup and ProjectGn to allow future templating in GaugeImplTypes  
						
						
						
						
					 
					
						2023-03-10 12:10:46 +00:00 
						 
				 
			
				
					
						
							
							
								Alessandro Lupo 
							
						 
					 
					
						
						
							
						
						f51222086c 
					 
					
						
						
							
							Move functions from GaugeGroup to group specific implementations  
						
						
						
						
					 
					
						2023-03-09 16:22:20 +00:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						a3e935c902 
					 
					
						
						
							
							Batched block project/promote size checks  
						
						
						
						
					 
					
						2023-02-27 11:38:16 +00:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						7731c7db8e 
					 
					
						
						
							
							Add huge cache type and allow Ncache==0  
						
						
						
						
					 
					
						2023-02-26 14:15:28 +00:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						ff97340324 
					 
					
						
						
							
							Expose cached bytes  
						
						
						
						
					 
					
						2023-02-26 12:22:45 +00:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						83d86943db 
					 
					
						
						
							
							Fixed compile bug in MemoryManagerShared caused by Audit function not being passed a string  
						
						
						
						
					 
					
						2023-02-23 13:09:45 -05:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						e82cf1d311 
					 
					
						
						
							
							Further prec-change improvements  
						
						... 
						
						
						
						Mixed prec CG algorithm has been modified to precompute precision change workspaces.
As the original Test_dwf_mixedcg_prec has been co-opted to do a performance stability and reproducibility test, requiring the single-prec CG to be run 200 times, I have created a new version of Test_dwf_mixedcg_prec in the solver subdirectory that just does the mixed vs double CG test. 
						
						
					 
					
						2023-02-23 09:45:29 -05:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						1db58a8acc 
					 
					
						
						
							
							Precision change improvements  
						
						... 
						
						
						
						Added a new, much faster implementation of precision change that uses (optionally) a precomputed workspace containing pointer offsets that is device resident, such that all lattice copying occurs only on the device and no host<->device transfer is required, other than the pointer table. It also avoids the need to unpack and repack the fields using explicit lane copying. When this new precisionChange is called without a workspace, one will be computed on-the-fly; however it is still considerably faster than the original implementation.
In the special case of using double2 and when the Grids are the same, calls to the new precisionChange will automatically use precisionChangeFast, such that there is a single API call for all precision changes.
Reliable update and mixed-prec multishift have been modified to precompute precision change workspaces
Renamed the original precisionChange as precisionChangeOrig
Fixed incorrect pointer offset bug in copyLane
Added a test and a benchmark for precisionChange
Added a test for reliable update CG 
						
						
					 
					
						2023-02-21 10:52:42 -05:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						920a51438d 
					 
					
						
						
							
							Added batched Mixed precision CG  
						
						
						
						
					 
					
						2023-02-14 17:04:13 +00:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						be528b6d27 
					 
					
						
						
							
							Add batched block project/promote functions  
						
						
						
						
					 
					
						2023-02-14 14:37:10 +00:00 
						 
				 
			
				
					
						
							
							
								Alessandro Lupo 
							
						 
					 
					
						
						
							
						
						f73691ec47 
					 
					
						
						
							
							Merge pull request  #18  from nickforce989/sp2n/newbranch  
						
						... 
						
						
						
						Sp2n/newbranch 
						
						
					 
					
						2023-02-13 10:22:27 +01:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						ccd21f96ff 
					 
					
						
						
							
							Plaquette agreeing and moving to final form (slowly) need to optimise  
						
						
						
						
					 
					
						2023-02-01 22:57:44 -05:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						4b90cb8888 
					 
					
						
						
							
							First cut passes combining padded cell with general stencil towards fast plaquette and staggered force  
						
						
						
						
					 
					
						2023-02-01 22:14:10 -05:00 
						 
				 
			
				
					
						
							
							
								Niccolo Forzano 
							
						 
					 
					
						
						
							
						
						7ebda3e9ec 
					 
					
						
						
							
							Merge commit 'b10e1b7bc8bec809f874e9e48a3ccc7b2619c9d1' into sp2n/newbranch  
						
						
						
						
					 
					
						2023-01-19 12:10:18 +00:00 
						 
				 
			
				
					
						
							
							
								Niccolo Forzano 
							
						 
					 
					
						
						
							
						
						b10e1b7bc8 
					 
					
						
						
							
							Fixed files giving zero force computation on GPU, issue  #8  
						
						
						
						
					 
					
						2023-01-18 18:04:47 +00:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						796abfad80 
					 
					
						
						
							
							Merge pull request  #422  from fjosw/fix/NVCC_DIAG_PRAGMA_SUPPORT  
						
						... 
						
						
						
						Disable diagnostic pragma warnings for CUDA 12+ 
						
						
					 
					
						2023-01-17 09:34:49 -05:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						ad0270ac8c 
					 
					
						
						
							
							fix: diagnostic pragma warnings fixed for CUDA 12+  
						
						
						
						
					 
					
						2023-01-12 12:36:30 +00:00