nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						465856331a
					 | 
					
						
						
							
							switch back to serialized; wrong results on single too
						
						
						
						
						
						
					 | 
					
						2020-06-15 15:39:39 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						cc958aa9ed
					 | 
					
						
						
							
							switch back to standard MPI_init due to wrong results in Benchmark_wilson using comms-overlap
						
						
						
						
						
						
					 | 
					
						2020-06-15 14:21:38 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						f46f029dbb
					 | 
					
						
						
							
							Merge pull request #292 from lehner/feature/gpt-sycl
						
						
						
						
						
						
						
						Catch edge case in SharedMemoryMPI::GetShmDims; Change default units … 
						
						
					 | 
					
						2020-06-14 13:43:27 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christoph Lehner
							
						 
					 | 
					
						
						
							
						
						3dccd7aa2c
					 | 
					
						
						
							
							Catch edge case in SharedMemoryMPI::GetShmDims; Change default units to consistent MB in init args; Want last element not past last element in MemoryManagerCache.cc
						
						
						
						
						
						
					 | 
					
						2020-06-14 13:26:01 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						a25e4b3d0c
					 | 
					
						
						
							
							pred 32/64 for float/double instead of 8 in VLA patch
						
						
						
						
						
						
					 | 
					
						2020-06-13 14:44:37 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						d1210ca12a
					 | 
					
						
						
							
							switch to double/float instead of float64_t/float32_t in VLA patch
						
						
						
						
						
						
					 | 
					
						2020-06-13 13:59:32 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						36ea0e222a
					 | 
					
						
						
							
							type traits for ComplexF/D in VLA patch; cosmetics in VLS intrinsics
						
						
						
						
						
						
					 | 
					
						2020-06-13 13:42:35 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						65e6e7da6f
					 | 
					
						
						
							
							Merge pull request #291 from lehner/feature/gpt-sycl
						
						
						
						
						
						
						
						Feature/gpt sycl 
						
						
					 | 
					
						2020-06-12 20:42:32 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christoph Lehner
							
						 
					 | 
					
						
						
							
						
						b5e87e8d97
					 | 
					
						
						
							
							summit compile fixes
						
						
						
						
						
						
					 | 
					
						2020-06-12 18:16:12 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christoph Lehner
							
						 
					 | 
					
						
						
							
						
						5f5807d60a
					 | 
					
						
						
							
							cleanup
						
						
						
						
						
						
					 | 
					
						2020-06-12 14:48:23 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						92281ec22d
					 | 
					
						
						
							
							add 3 op Mult for VLA
						
						
						
						
						
						
					 | 
					
						2020-06-12 18:49:05 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						87266ce099
					 | 
					
						
						
							
							comment out fcmla in vector types: need also MultAddReal
						
						
						
						
						
						
					 | 
					
						2020-06-12 18:37:19 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						2a23f133e8
					 | 
					
						
						
							
							reenable fcmla for VLA
						
						
						
						
						
						
					 | 
					
						2020-06-12 17:30:38 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						8dbf790f62
					 | 
					
						
						
							
							correct tbl2 for sp
						
						
						
						
						
						
					 | 
					
						2020-06-12 17:12:34 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						2402b4940e
					 | 
					
						
						
							
							vec_imm in float
						
						
						
						
						
						
					 | 
					
						2020-06-12 15:17:38 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						2111052fbe
					 | 
					
						
						
							
							apply VLA patch for memcpy reduction suggested by Arm, CAS-162542-D6W7Z7
						
						
						
						
						
						
					 | 
					
						2020-06-12 14:49:19 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Christoph Lehner
							
						 
					 | 
					
						
						
							
						
						7974acff54
					 | 
					
						
						
							
							merged sycl to feature-gpt
						
						
						
						
						
						
					 | 
					
						2020-06-12 06:49:38 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						f0d17d2b49
					 | 
					
						
						
							
							Added Baryon3pt code
						
						
						
						
						
						
					 | 
					
						2020-06-12 11:35:52 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						244c003a1b
					 | 
					
						
						
							
							Updated Baryon code
						
						
						
						
						
						
					 | 
					
						2020-06-12 11:00:25 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					| 
						
					 | 
					
						
						
							
						
						0174f5f742
					 | 
					
						
						
							
							look for librt when using shm=shmopen
						
						
						
						
						
						
					 | 
					
						2020-06-11 16:50:43 +01:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						32b2b59be4
					 | 
					
						
						
							
							Offload
						
						
						
						
						
						
					 | 
					
						2020-06-10 20:36:26 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						86bb0cc24b
					 | 
					
						
						
							
							Keep on GPU
						
						
						
						
						
						
					 | 
					
						2020-06-10 20:00:00 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						84c19587e7
					 | 
					
						
						
							
							Offload
						
						
						
						
						
						
					 | 
					
						2020-06-10 19:59:31 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						237ce92540
					 | 
					
						
						
							
							Offload loops
						
						
						
						
						
						
					 | 
					
						2020-06-10 19:59:11 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						a7ffc61e82
					 | 
					
						
						
							
							acceleratorSIMTlane()
						
						
						
						
						
						
					 | 
					
						2020-06-10 19:58:33 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						fd97f64612
					 | 
					
						
						
							
							Merge branch 'sycl' of https://github.com/paboyle/Grid into sycl
						
						
						
						
						
						
					 | 
					
						2020-06-10 12:58:13 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						8720aecb80
					 | 
					
						
						
							
							Offload more loops
						
						
						
						
						
						
					 | 
					
						2020-06-10 12:57:55 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						cdf0a04fc5
					 | 
					
						
						
							
							Merge branch 'develop' into sycl
						
						
						
						
						
						
					 | 
					
						2020-06-09 04:00:12 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						616d3dd737
					 | 
					
						
						
							
							Compile updates
						
						
						
						
						
						
					 | 
					
						2020-06-08 18:57:41 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						8b066baca8
					 | 
					
						
						
							
							Implement transient mechanism
						
						
						
						
						
						
					 | 
					
						2020-06-08 18:28:53 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						e97f3688db
					 | 
					
						
						
							
							Fix the HMC issue - kernel was launching asynchronously
						
						
						
						
						
						
					 | 
					
						2020-06-08 17:01:15 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						433766ac62
					 | 
					
						
						
							
							revert Add/SubTimesI and prefetching in stencil
						
						
						
						
						
						
						
						This reverts commit 9b2699226c. 
						
						
					 | 
					
						2020-06-08 12:02:53 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						93a37c8f68
					 | 
					
						
						
							
							test prefetch to L2 in stencil
						
						
						
						
						
						
					 | 
					
						2020-06-08 09:39:50 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						89a1e78390
					 | 
					
						
						
							
							Merge branch 'sycl' of https://github.com/paboyle/Grid into sycl
						
						
						
						
						
						
					 | 
					
						2020-06-05 23:20:37 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						ffbb3fc02c
					 | 
					
						
						
							
							Merge pull request #287 from felixerben/baryon-cleaner
						
						
						
						
						
						
						
						slightly cleaner baryon 2pt code 
						
						
					 | 
					
						2020-06-05 22:54:52 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						5a73ef3647
					 | 
					
						
						
							
							Minor tweak to compile
						
						
						
						
						
						
					 | 
					
						2020-06-05 21:50:15 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						87e5d2f4b7
					 | 
					
						
						
							
							Merge branch 'sycl' of https://www.github.com/paboyle/Grid into sycl
						
						
						
						
						
						
					 | 
					
						2020-06-05 17:32:21 -07:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						d720f10758
					 | 
					
						
						
							
							Link error fix
						
						
						
						
						
						
					 | 
					
						2020-06-05 17:29:20 -07:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						14fcd0912a
					 | 
					
						
						
							
							Merge branch 'sycl' of https://github.com/paboyle/Grid into sycl
						
						
						
						
						
						
					 | 
					
						2020-06-05 19:14:17 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						3111c0bd4f
					 | 
					
						
						
							
							Single precision hardwire
						
						
						
						
						
						
					 | 
					
						2020-06-05 19:13:27 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						e03064490e
					 | 
					
						
						
							
							Merge branch 'sycl' of https://github.com/paboyle/Grid into sycl
						
						
						
						
						
						
					 | 
					
						2020-06-05 18:53:39 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						1a4c8c3387
					 | 
					
						
						
							
							Global edit with change to View usage. autoView() creates a wrapper object that closes the view when scope closes.
						
						
						
						
						
						
					 | 
					
						2020-06-05 18:52:35 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						2b1e259441
					 | 
					
						
						
							
							Decode of SYCL devices fix
						
						
						
						
						
						
					 | 
					
						2020-06-04 17:16:55 -07:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						f39c2a240b
					 | 
					
						
						
							
							Printing and device memory size detection
						
						
						
						
						
						
					 | 
					
						2020-06-04 14:58:03 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						0d95805cde
					 | 
					
						
						
							
							Print improvement
						
						
						
						
						
						
					 | 
					
						2020-06-03 22:50:32 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						f67830587f
					 | 
					
						
						
							
							Accelerator loop use
						
						
						
						
						
						
					 | 
					
						2020-06-03 22:50:09 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						6bf7f839ff
					 | 
					
						
						
							
							Better printing and logging
						
						
						
						
						
						
					 | 
					
						2020-06-03 09:28:57 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						e3147881a9
					 | 
					
						
						
							
							Cache scheme
						
						
						
						
						
						
					 | 
					
						2020-06-03 09:23:48 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								nmeyer-ur
							
						 
					 | 
					
						
						
							
						
						9872c76825
					 | 
					
						
						
							
							introduce AddTimesI and SubTimesI; slight benefit in operators, but < 1%; breaks all other impls
						
						
						
						
						
						
					 | 
					
						2020-06-03 15:20:13 +02:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Peter Boyle
							
						 
					 | 
					
						
						
							
						
						fb559614ad
					 | 
					
						
						
							
							Initialise memory manager
						
						
						
						
						
						
					 | 
					
						2020-06-03 09:12:47 -04:00 | 
					
					
						
						
						
							
							
							
							
							
							
						
					 |