paboyle 
							
						 
					 
					
						
						
							
						
						5918769f97 
					 
					
						
						
							
							Subtle Naik term bug updated in Stencil; less on logical && with a function call on right  
						
						
						
						
					 
					
						2017-09-16 12:51:26 +01:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						b542d349b8 
					 
					
						
						
							
							Minor cosmetic changes  
						
						
						
						
					 
					
						2017-09-15 11:48:36 +01:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						91eaace19d 
					 
					
						
						
							
							Added support for FFT accelerated updates  
						
						
						
						
					 
					
						2017-09-15 11:33:45 +01:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						1950ac9294 
					 
					
						
						
							
							Fixed the Intel compiler problem with the JSON classes  
						
						
						
						
					 
					
						2017-09-08 15:18:59 +01:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						13fa70ac1a 
					 
					
						
						
							
							Merge branch 'develop' into feature/json-fix  
						
						
						
						
					 
					
						2017-09-08 13:42:20 +01:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						7cb2b11f26 
					 
					
						
						
							
							Fixing Intel compiler error for the JSON parser  
						
						
						
						
					 
					
						2017-09-08 13:41:53 +01:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						1184ed29ae 
					 
					
						
						
							
							Merge pull request  #124  from nmeyer-ur/feature/arm-neon  
						
						... 
						
						
						
						Added integer reduce functionality 
						
						
					 
					
						2017-09-08 10:54:35 +02:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						203c7bf6fa 
					 
					
						
						
							
							Merge branch 'hotfix/dirac-ITT-fix' into develop  
						
						
						
						
					 
					
						2017-09-05 15:08:51 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						aed5de4d50 
					 
					
						
						
							
							Patching macos compile  
						
						
						
						
					 
					
						2017-09-05 15:07:07 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						ba27cc6571 
					 
					
						
						
							
							Mac os happiness  
						
						
						
						
					 
					
						2017-09-05 15:00:16 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						d856327250 
					 
					
						
						
							
							Merge branch 'release/dirac-ITT' into develop  
						
						
						
						
					 
					
						2017-09-05 14:56:12 +01:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						bf973d0d56 
					 
					
						
						
							
							SHM complete  
						
						
						
						
					 
					
						2017-09-05 14:30:29 +01:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						837bf8a5be 
					 
					
						
						
							
							Updating to control the SHM allocation scheme under configure time options  
						
						
						
						
					 
					
						2017-09-05 12:51:02 +01:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						c05b2199f6 
					 
					
						
						
							
							Improvements to huge memory  
						
						
						
						
					 
					
						2017-09-04 10:41:21 -04:00 
						 
				 
			
				
					
						
							
							
								Azusa Yamaguchi 
							
						 
					 
					
						
						
							
						
						a5fe07c077 
					 
					
						
						
							
							Merge branch 'develop' of  https://github.com/paboyle/Grid  into develop  
						
						
						
						
					 
					
						2017-09-04 14:10:15 +01:00 
						 
				 
			
				
					
						
							
							
								Azusa Yamaguchi 
							
						 
					 
					
						
						
							
						
						b83b2b1415 
					 
					
						
						
							
							Stability improvement to BCG. Force m_rr hermitian beyond rounding.  
						
						
						
						
					 
					
						2017-09-04 14:09:47 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						7359df3501 
					 
					
						
						
							
							Full reporting for benchmark; save robustness factor  
						
						
						
						
					 
					
						2017-08-31 10:42:35 +01:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						59bd1fe21b 
					 
					
						
						
							
							Fix for 'perm' and 'local' not being set for hand-unrolled external-site Dslash, which caused incorrect behavior of G-parity kernel  
						
						
						
						
					 
					
						2017-08-29 13:07:37 -07:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						a56e3b40c4 
					 
					
						
						
							
							Merge branch 'develop' into feature/hadrons  
						
						
						
						
					 
					
						2017-08-29 11:03:53 -06:00 
						 
				 
			
				
					
						
							
							
								Nils Meyer 
							
						 
					 
					
						
						
							
						
						4e907fef2c 
					 
					
						
						
							
							Merge remote-tracking branch 'grid/develop' into feature/arm-neon  
						
						
						
						
					 
					
						2017-08-29 17:47:36 +02:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						74af885d4e 
					 
					
						
						
							
							Removed some no-longer-needed associated with G-parity hand unrolled kernel  
						
						
						
						
					 
					
						2017-08-29 09:50:37 -04:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						4b4c2a715b 
					 
					
						
						
							
							fcntl.h needed  
						
						
						
						
					 
					
						2017-08-26 11:38:04 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						54a5e6c1d0 
					 
					
						
						
							
							Check if we get huge pages on linux. Larry Meadows piece of magic.  
						
						
						
						
					 
					
						2017-08-25 22:36:08 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						80c5bce5bb 
					 
					
						
						
							
							Merge branch 'develop' into feature/multi-communicator  
						
						
						
						
					 
					
						2017-08-25 20:21:26 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						f68b5de9c8 
					 
					
						
						
							
							No compile fix on Clang  
						
						
						
						
					 
					
						2017-08-25 19:35:21 +01:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						f365a83fae 
					 
					
						
						
							
							In G-parity unrolled kernel, replaced calls to permute and exchange with run-time-evaluated permute type with explicit calls to appropriate underlying functions  
						
						
						
						
					 
					
						2017-08-25 14:24:11 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						c289699d9a 
					 
					
						
						
							
							updated from cambridge mpi3 shakeout  
						
						
						
						
					 
					
						2017-08-25 11:41:01 +01:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						c3b1263e75 
					 
					
						
						
							
							Benchmark prep  
						
						
						
						
					 
					
						2017-08-25 09:25:54 +01:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						34a9aeb331 
					 
					
						
						
							
							Reduced number of if-statement evaluations in G-parity unrolled kernel  
						
						
						
						
					 
					
						2017-08-24 13:53:50 -07:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						21b02760c3 
					 
					
						
						
							
							Merge branch 'develop' into feature/hadrons  
						
						
						
						
					 
					
						2017-08-24 17:05:45 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						5fa386ddc9 
					 
					
						
						
							
							FFT test compile fixed  
						
						
						
						
					 
					
						2017-08-24 10:17:52 +01:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						ce5df177ee 
					 
					
						
						
							
							Removed superfluous implementation of G-parity twist for hand-unrolled kernel from GparityWilsonImpl  
						
						
						
						
					 
					
						2017-08-23 15:05:22 -04:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						a0bb8e5b46 
					 
					
						
						
							
							Added hand-unrolled kernel implementations of all the other dslash precision / comms precision combinations with G-parity  
						
						
						
						
					 
					
						2017-08-23 14:44:40 -04:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						46f88e6d72 
					 
					
						
						
							
							G-parity hand-unrolled intrinsics twist now uses one less permute and one less temporary  
						
						
						
						
					 
					
						2017-08-23 13:21:10 -04:00 
						 
				 
			
				
					
						
							
							
								David Murphy 
							
						 
					 
					
						
						
							
						
						dd8f1ea189 
					 
					
						
						
							
							Vectorized Mobius EOFA Dperp + shift operation  
						
						
						
						
					 
					
						2017-08-23 13:17:26 -04:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						b61835c1a5 
					 
					
						
						
							
							Added inplace version of intrinsic G-parity twist to hand-unrolled kernel  
						
						
						
						
					 
					
						2017-08-23 12:33:48 -04:00 
						 
				 
			
				
					
						
							
							
								Azusa Yamaguchi 
							
						 
					 
					
						
						
							
						
						d9cd4f0273 
					 
					
						
						
							
							Staggered multinode block cg debugged. Missing global sum.  
						
						... 
						
						
						
						Code stalls and resumes on KNL at cambridge. Curious.
CG iterations 23ms each, then 3200 ms pauses. Mean bandwidth reports
as 200MB/s. Comms dominant in the report. However, the time behaviour suggests it
is *bursty*.... Could be swap to disk? 
						
						
					 
					
						2017-08-23 15:07:18 +01:00 
						 
				 
			
				
					
						
							
							
								David Murphy 
							
						 
					 
					
						
						
							
						
						459f70e8d4 
					 
					
						
						
							
							Check-in of working Mobius EOFA class and tests  
						
						
						
						
					 
					
						2017-08-22 22:38:30 -04:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						061e48fd73 
					 
					
						
						
							
							Replaced slow unpack-repack in G-parity BC twist with intrinsics version  
						
						
						
						
					 
					
						2017-08-22 18:12:12 -04:00 
						 
				 
			
				
					
						
							
							
								Christopher Kelly 
							
						 
					 
					
						
						
							
						
						ab50145001 
					 
					
						
						
							
							Implemented first, unoptimized version of hand-unrolled G-parity kernels  
						
						... 
						
						
						
						Improved Test_gparity 
						
						
					 
					
						2017-08-22 17:12:25 -04:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						b49bec0cec 
					 
					
						
						
							
							MAP_HUGETLB portability fix  
						
						
						
						
					 
					
						2017-08-20 03:08:54 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						1cdf999668 
					 
					
						
						
							
							Moving multicommunicator into mpi3 also for threading  
						
						
						
						
					 
					
						2017-08-20 02:39:10 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						11062fb686 
					 
					
						
						
							
							Comms none fail fix  
						
						
						
						
					 
					
						2017-08-20 01:37:07 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						a446d95c33 
					 
					
						
						
							
							Trying to pass TeamCity and Travis  
						
						
						
						
					 
					
						2017-08-20 01:10:50 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						be66e7dd95 
					 
					
						
						
							
							Merge branch 'develop' into feature/multi-communicator  
						
						
						
						
					 
					
						2017-08-19 23:12:38 +01:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						0b0cf62193 
					 
					
						
						
							
							Fix mpi 3 interface change  
						
						
						
						
					 
					
						2017-08-19 13:18:50 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						7d88198387 
					 
					
						
						
							
							Merge branch 'develop' into feature/multi-communicator  
						
						
						
						
					 
					
						2017-08-19 13:03:35 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						2f619482b8 
					 
					
						
						
							
							Enable blocking stencil send  
						
						
						
						
					 
					
						2017-08-19 12:53:59 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						d6472eda8d 
					 
					
						
						
							
							Use mmap  
						
						
						
						
					 
					
						2017-08-19 12:53:18 -04:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						bcefdd7c4e 
					 
					
						
						
							
							Align both allocator calls to 2MB  
						
						
						
						
					 
					
						2017-08-19 12:49:02 -04:00