360cface33 
					 
					
						
						
							
							Grid tensor serialisation fully implemented and tested  
						
						
						
						
					 
					
						2018-03-08 19:12:03 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						9579c9c327 
					 
					
						
						
							
							Threading improvement  
						
						
						
						
					 
					
						2017-12-05 14:12:22 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						c24d4c8d0e 
					 
					
						
						
							
							Improved parallel RNG init  
						
						
						
						
					 
					
						2017-12-05 13:01:10 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						3e560b9462 
					 
					
						
						
							
							Faster RNG init  
						
						
						
						
					 
					
						2017-12-05 11:42:05 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						d93c6760ec 
					 
					
						
						
							
							Faster code for split unsplit  
						
						
						
						
					 
					
						2017-12-05 11:39:26 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						28ceacec45 
					 
					
						
						
							
							Split/Unsplit working  
						
						
						
						
					 
					
						2017-11-27 15:13:29 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						4987edbd44 
					 
					
						
						
							
							Merge branch 'develop' of  https://github.com/paboyle/Grid  into develop  
						
						
						
						
					 
					
						2017-11-27 12:34:56 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						1f04e56038 
					 
					
						
						
							
							Believe split/unsplit works, but need to make pretty  
						
						
						
						
					 
					
						2017-11-27 12:33:08 +00:00 
						 
				 
			
				
					
						
							
							
								azusayamaguchi 
							
						 
					 
					
						
						
							
						
						e55397bc13 
					 
					
						
						
							
							Staggered CG  
						
						
						
						
					 
					
						2017-11-24 14:18:30 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						94b8fb5686 
					 
					
						
						
							
							Debug in progress  
						
						
						
						
					 
					
						2017-11-19 01:39:04 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						a7f72eb994 
					 
					
						
						
							
							Shaking out  
						
						
						
						
					 
					
						2017-10-30 00:22:06 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						84b441800f 
					 
					
						
						
							
							Merge branch 'develop' into feature/lanczos-reorg  
						
						
						
						
					 
					
						2017-10-27 14:21:38 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						1ef424b139 
					 
					
						
						
							
							Split grid Y2K bug fix attempt  
						
						
						
						
					 
					
						2017-10-27 14:20:35 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						08583afaff 
					 
					
						
						
							
							Red black friendly coarsening  
						
						
						
						
					 
					
						2017-10-25 23:51:18 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						08ca338875 
					 
					
						
						
							
							Split grid communication  
						
						
						
						
					 
					
						2017-10-09 23:19:45 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						4f8b6f26b4 
					 
					
						
						
							
							Merge branch 'develop' into feature/dwf-multirhs  
						
						
						
						
					 
					
						2017-10-02 11:41:49 +01:00 
						 
				 
			
				
					
						
							
							
								Azusa Yamaguchi 
							
						 
					 
					
						
						
							
						
						d9cd4f0273 
					 
					
						
						
							
							Staggered multinode block cg debugged. Missing global sum.  
						
						... 
						
						
						
						Code stalls and resumes on KNL at Cambridge. Curious.
CG iterations 23ms each, then 3200 ms pauses. Mean bandwidth reports
as 200MB/s. Comms dominant in the report. However, the time behaviour suggests it
is *bursty*.... Could be swap to disk? 
						
						
					 
					
						2017-08-23 15:07:18 +01:00 
						 
				 
			
				
					
						
							
							
								azusayamaguchi 
							
						 
					 
					
						
						
							
						
						659d7d1a40 
					 
					
						
						
							
							For test/solver  
						
						... 
						
						
						
						Fixed 
						
						
					 
					
						2017-07-12 15:01:48 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						349d75e483 
					 
					
						
						
							
							Precision fix  
						
						
						
						
					 
					
						2017-06-23 02:57:59 -07:00 
						 
				 
			
				
					
						
							
							
								Azusa Yamaguchi 
							
						 
					 
					
						
						
							
						
						e9cc21900f 
					 
					
						
						
							
							Block solver complete for staggered. Now stable on mass 0.003 and  
						
						... 
						
						
						
						gives 8x (!) speed up on Haswell laptop vs. standard CG for 8 RHS solves.
166 iterations vs. 537 iterations so algorithmic gain + 2x in flop rate gain.
Better than a slap in the face with a wet kipper. 
						
						
					 
					
						2017-06-20 12:37:41 +01:00 
						 
				 
			
				
					
						
							
							
								Azusa Yamaguchi 
							
						 
					 
					
						
						
							
						
						cfe3cd76d1 
					 
					
						
						
							
							Block solver improvements  
						
						
						
						
					 
					
						2017-06-19 14:04:21 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						c85024683e 
					 
					
						
						
							
							Merge branch 'feature/parallelio' into develop  
						
						
						
						
					 
					
						2017-06-19 01:39:48 +01:00 
						 
				 
			
				
					
						
							
							
								Peter Boyle 
							
						 
					 
					
						
						
							
						
						6f687a67cd 
					 
					
						
						
							
							As local vols increase, use 64 bits for safety  
						
						
						
						
					 
					
						2017-06-01 17:36:18 -04:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						58e8d0a10d 
					 
					
						
						
							
							reverse direction lexico mapping  
						
						
						
						
					 
					
						2017-05-30 23:38:30 +01:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						ab3596d4d3 
					 
					
						
						
							
							Using Cayley-Hamilton form for the exponential of SU(3) matrices  
						
						
						
						
					 
					
						2017-05-25 12:07:47 +01:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						a8fb2835ca 
					 
					
						
						
							
							Merge branch 'develop' of  https://github.com/paboyle/Grid  into develop  
						
						
						
						
					 
					
						2017-05-18 14:45:00 +01:00 
						 
				 
			
				
					
						
							
							
								Azusa Yamaguchi 
							
						 
					 
					
						
						
							
						
						f46a67ffb3 
					 
					
						
						
							
							Non-compile issue with clang on Mac fixed.  
						
						... 
						
						
						
						Compiler version was clang++-3.9 under mpicxx 
						
						
					 
					
						2017-05-17 10:51:01 +01:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						10f2872aae 
					 
					
						
						
							
							Faster exponentiation for lattice fields  
						
						
						
						
					 
					
						2017-05-15 15:51:16 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						2439999ec8 
					 
					
						
						
							
							Warning elimination; drop to -O2 on G++ bad versions  
						
						
						
						
					 
					
						2017-05-06 14:44:49 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						697c0603ce 
					 
					
						
						
							
							SITMO I/O for NERSC working now bit repro  
						
						
						
						
					 
					
						2017-05-05 16:54:44 +01:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						3344788fa1 
					 
					
						
						
							
							Merge branch 'develop' into feature/hmc_generalise  
						
						
						
						
					 
					
						2017-05-01 12:13:56 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						8e161152e4 
					 
					
						
						
							
							MultiRHS solver improvements with slice operations moved into lattice and sped up.  
						
						... 
						
						
						
						Block solver requires a lot of performance work. 
						
						
					 
					
						2017-04-18 10:51:55 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						3141ebac10 
					 
					
						
						
							
							MultiRHS working, starting to optimise. Block doesn't and I thought it already was; puzzled.  
						
						
						
						
					 
					
						2017-04-17 10:50:19 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						7ede696126 
					 
					
						
						
							
							Non compile of tests fixed  
						
						
						
						
					 
					
						2017-04-16 23:40:00 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						bf516c3b81 
					 
					
						
						
							
							higher precision reduction variables in norm and inner product  
						
						
						
						
					 
					
						2017-04-15 12:27:28 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						441a52ee5d 
					 
					
						
						
							
							First cut at higher precision reduction  
						
						
						
						
					 
					
						2017-04-15 10:57:21 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						683550f116 
					 
					
						
						
							
							Const args improvement  
						
						
						
						
					 
					
						2017-04-09 23:41:04 +09:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						8c540333d5 
					 
					
						
						
							
							Merge branch 'develop' into feature/hmc_generalise  
						
						
						
						
					 
					
						2017-04-05 14:41:04 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						83f6fab8fa 
					 
					
						
						
							
							Big/Small crush test, and fast SITMO rng init, faster but not ideal  
						
						... 
						
						
						
						MT and Ranlux init. 
						
						
					 
					
						2017-04-02 12:10:51 +09:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						9dc7ca4c3b 
					 
					
						
						
							
							Sitmo fast init  
						
						
						
						
					 
					
						2017-04-02 00:28:22 +09:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						b3dede4dd3 
					 
					
						
						
							
							Merge branch 'develop' into feature/hmc_generalise  
						
						
						
						
					 
					
						2017-03-10 23:57:37 +09:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						586a7c90b7 
					 
					
						
						
							
							Merge branch 'develop' into feature/bgq-asm  
						
						
						
						
					 
					
						2017-02-23 00:26:59 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						e099dcdae7 
					 
					
						
						
							
							Merge branch 'develop' into feature/bgq-asm  
						
						
						
						
					 
					
						2017-02-23 00:25:29 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						4e7ab3166f 
					 
					
						
						
							
							Refactoring header layout  
						
						
						
						
					 
					
						2017-02-22 18:09:33 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						aac80cbb44 
					 
					
						
						
							
							Bug fix from Chris K  
						
						
						
						
					 
					
						2017-02-22 12:19:09 -05:00 
						 
				 
			
				
					
						
							
							
								Francesco Sanfilippo 
							
						 
					 
					
						
						
							
						
						15e668eef1 
					 
					
						
						
							
							now it is possible to pass {coords list} to a peek or poke  
						
						
						
						
					 
					
						2017-02-21 22:48:38 +01:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						3ae92fa2e6 
					 
					
						
						
							
							Global changes to parallel_for structure.  
						
						... 
						
						
						
						Move the comms flags to more sensible names 
						
						
					 
					
						2017-02-21 05:24:27 -05:00 
						 
				 
			
				
					
						
							
							
								Guido Cossu 
							
						 
					 
					
						
						
							
						
						e0571c872b 
					 
					
						
						
							
							Merge branch 'develop' into feature/hmc_generalise  
						
						
						
						
					 
					
						2017-02-09 16:12:00 +00:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						71ac2e7940 
					 
					
						
						
							
							Faster RNG init  
						
						
						
						
					 
					
						2017-02-07 01:33:23 -05:00 
						 
				 
			
				
					
						
							
							
								paboyle 
							
						 
					 
					
						
						
							
						
						fdc170b8a3 
					 
					
						
						
							
							Parallel fors in lattice transfer  
						
						
						
						
					 
					
						2017-02-07 01:16:39 -05:00