mirror of
				https://github.com/paboyle/Grid.git
				synced 2025-11-03 05:24:32 +00:00 
			
		
		
		
	Compare commits
	
		
			14 Commits
		
	
	
		
			aff3d50bae
			...
			feature/bl
		
	
	| Author | SHA1 | Date | |
|---|---|---|---|
| 
						 | 
					b2493d6d25 | ||
| 
						 | 
					8fd16686dc | ||
| 
						 | 
					23b9c6b5f5 | ||
| 
						 | 
					43943008bf | ||
| 
						 | 
					8ee26f9112 | ||
| 
						 | 
					f91e3af97f | ||
| 
						 | 
					43298ef681 | ||
| 
						 | 
					7e70df27e4 | ||
| 
						 | 
					c55d657736 | ||
| 
						 | 
					b89b1280d5 | ||
| 
						 | 
					ac7090e6d3 | ||
| 
						 | 
					02edbe624f | ||
| 
						 | 
					9266b89ad8 | ||
| 
						 | 
					2db7e6f8ab | 
							
								
								
									
										2
									
								
								.gitignore
									
									
									
									
										vendored
									
									
								
							
							
						
						
									
										2
									
								
								.gitignore
									
									
									
									
										vendored
									
									
								
							@@ -10,6 +10,8 @@
 | 
				
			|||||||
*~
 | 
					*~
 | 
				
			||||||
*#
 | 
					*#
 | 
				
			||||||
*.sublime-*
 | 
					*.sublime-*
 | 
				
			||||||
 | 
					.ctags
 | 
				
			||||||
 | 
					tags
 | 
				
			||||||
 | 
					
 | 
				
			||||||
# Precompiled Headers #
 | 
					# Precompiled Headers #
 | 
				
			||||||
#######################
 | 
					#######################
 | 
				
			||||||
 
 | 
				
			|||||||
@@ -240,12 +240,14 @@ public:
 | 
				
			|||||||
    Field T0(grid); T0 = in;  
 | 
					    Field T0(grid); T0 = in;  
 | 
				
			||||||
    Field T1(grid); 
 | 
					    Field T1(grid); 
 | 
				
			||||||
    Field T2(grid);
 | 
					    Field T2(grid);
 | 
				
			||||||
 | 
					    Field Tout(grid);
 | 
				
			||||||
    Field y(grid);
 | 
					    Field y(grid);
 | 
				
			||||||
      
 | 
					      
 | 
				
			||||||
    Field *Tnm = &T0;
 | 
					    Field *Tnm = &T0;
 | 
				
			||||||
    Field *Tn  = &T1;
 | 
					    Field *Tn  = &T1;
 | 
				
			||||||
    Field *Tnp = &T2;
 | 
					    Field *Tnp = &T2;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage << "Chebyshev() starts"<<std::endl;
 | 
				
			||||||
    // Tn=T1 = (xscale M + mscale)in
 | 
					    // Tn=T1 = (xscale M + mscale)in
 | 
				
			||||||
    RealD xscale = 2.0/(hi-lo);
 | 
					    RealD xscale = 2.0/(hi-lo);
 | 
				
			||||||
    RealD mscale = -(hi+lo)/(hi-lo);
 | 
					    RealD mscale = -(hi+lo)/(hi-lo);
 | 
				
			||||||
@@ -254,7 +256,7 @@ public:
 | 
				
			|||||||
 | 
					
 | 
				
			||||||
    // sum = .5 c[0] T0 + c[1] T1
 | 
					    // sum = .5 c[0] T0 + c[1] T1
 | 
				
			||||||
    //    out = ()*T0 + Coeffs[1]*T1;
 | 
					    //    out = ()*T0 + Coeffs[1]*T1;
 | 
				
			||||||
    axpby(out,0.5*Coeffs[0],Coeffs[1],T0,T1);
 | 
					    axpby(Tout,0.5*Coeffs[0],Coeffs[1],T0,T1);
 | 
				
			||||||
    for(int n=2;n<order;n++){
 | 
					    for(int n=2;n<order;n++){
 | 
				
			||||||
 | 
					
 | 
				
			||||||
      Linop.HermOp(*Tn,y);
 | 
					      Linop.HermOp(*Tn,y);
 | 
				
			||||||
@@ -275,7 +277,7 @@ public:
 | 
				
			|||||||
      axpby(y,xscale,mscale,y,(*Tn));
 | 
					      axpby(y,xscale,mscale,y,(*Tn));
 | 
				
			||||||
      axpby(*Tnp,2.0,-1.0,y,(*Tnm));
 | 
					      axpby(*Tnp,2.0,-1.0,y,(*Tnm));
 | 
				
			||||||
      if ( Coeffs[n] != 0.0) {
 | 
					      if ( Coeffs[n] != 0.0) {
 | 
				
			||||||
	axpy(out,Coeffs[n],*Tnp,out);
 | 
						axpy(Tout,Coeffs[n],*Tnp,Tout);
 | 
				
			||||||
      }
 | 
					      }
 | 
				
			||||||
#endif
 | 
					#endif
 | 
				
			||||||
      // Cycle pointers to avoid copies
 | 
					      // Cycle pointers to avoid copies
 | 
				
			||||||
@@ -285,6 +287,8 @@ public:
 | 
				
			|||||||
      Tnp    =swizzle;
 | 
					      Tnp    =swizzle;
 | 
				
			||||||
	  
 | 
						  
 | 
				
			||||||
    }
 | 
					    }
 | 
				
			||||||
 | 
					    out = Tout;
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage << "Chebyshev() ends"<<std::endl;
 | 
				
			||||||
  }
 | 
					  }
 | 
				
			||||||
};
 | 
					};
 | 
				
			||||||
 | 
					
 | 
				
			||||||
@@ -377,24 +381,26 @@ public:
 | 
				
			|||||||
    Field T0(grid); T0 = in;  
 | 
					    Field T0(grid); T0 = in;  
 | 
				
			||||||
    Field T1(grid); 
 | 
					    Field T1(grid); 
 | 
				
			||||||
    Field T2(grid);
 | 
					    Field T2(grid);
 | 
				
			||||||
 | 
					    Field Tout(grid);
 | 
				
			||||||
    Field  y(grid);
 | 
					    Field  y(grid);
 | 
				
			||||||
      
 | 
					      
 | 
				
			||||||
    Field *Tnm = &T0;
 | 
					    Field *Tnm = &T0;
 | 
				
			||||||
    Field *Tn  = &T1;
 | 
					    Field *Tn  = &T1;
 | 
				
			||||||
    Field *Tnp = &T2;
 | 
					    Field *Tnp = &T2;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage << "ChebyshevLanczos() starts"<<std::endl;
 | 
				
			||||||
    // Tn=T1 = (xscale M )*in
 | 
					    // Tn=T1 = (xscale M )*in
 | 
				
			||||||
    AminusMuSq(Linop,T0,T1);
 | 
					    AminusMuSq(Linop,T0,T1);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    // sum = .5 c[0] T0 + c[1] T1
 | 
					    // sum = .5 c[0] T0 + c[1] T1
 | 
				
			||||||
    out = (0.5*Coeffs[0])*T0 + Coeffs[1]*T1;
 | 
					    Tout = (0.5*Coeffs[0])*T0 + Coeffs[1]*T1;
 | 
				
			||||||
    for(int n=2;n<order;n++){
 | 
					    for(int n=2;n<order;n++){
 | 
				
			||||||
	
 | 
						
 | 
				
			||||||
      AminusMuSq(Linop,*Tn,y);
 | 
					      AminusMuSq(Linop,*Tn,y);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
      *Tnp=2.0*y-(*Tnm);
 | 
					      *Tnp=2.0*y-(*Tnm);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
      out=out+Coeffs[n]* (*Tnp);
 | 
					      Tout=Tout+Coeffs[n]* (*Tnp);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
      // Cycle pointers to avoid copies
 | 
					      // Cycle pointers to avoid copies
 | 
				
			||||||
      Field *swizzle = Tnm;
 | 
					      Field *swizzle = Tnm;
 | 
				
			||||||
@@ -403,6 +409,8 @@ public:
 | 
				
			|||||||
      Tnp    =swizzle;
 | 
					      Tnp    =swizzle;
 | 
				
			||||||
	  
 | 
						  
 | 
				
			||||||
    }
 | 
					    }
 | 
				
			||||||
 | 
					    out=Tout;
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage << "ChebyshevLanczos() ends"<<std::endl;
 | 
				
			||||||
  }
 | 
					  }
 | 
				
			||||||
};
 | 
					};
 | 
				
			||||||
NAMESPACE_END(Grid);
 | 
					NAMESPACE_END(Grid);
 | 
				
			||||||
 
 | 
				
			|||||||
							
								
								
									
										1555
									
								
								Grid/algorithms/iterative/ImplicitlyRestartedBlockLanczos.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										1555
									
								
								Grid/algorithms/iterative/ImplicitlyRestartedBlockLanczos.h
									
									
									
									
									
										Normal file
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							@@ -44,7 +44,7 @@ void  MemoryManager::AcceleratorFree    (void *ptr,size_t bytes)
 | 
				
			|||||||
  if ( __freeme ) {
 | 
					  if ( __freeme ) {
 | 
				
			||||||
    acceleratorFreeDevice(__freeme);
 | 
					    acceleratorFreeDevice(__freeme);
 | 
				
			||||||
    total_device-=bytes;
 | 
					    total_device-=bytes;
 | 
				
			||||||
    //    PrintBytes();
 | 
					//       PrintBytes();
 | 
				
			||||||
  }
 | 
					  }
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
void *MemoryManager::SharedAllocate(size_t bytes)
 | 
					void *MemoryManager::SharedAllocate(size_t bytes)
 | 
				
			||||||
@@ -53,8 +53,8 @@ void *MemoryManager::SharedAllocate(size_t bytes)
 | 
				
			|||||||
  if ( ptr == (void *) NULL ) {
 | 
					  if ( ptr == (void *) NULL ) {
 | 
				
			||||||
    ptr = (void *) acceleratorAllocShared(bytes);
 | 
					    ptr = (void *) acceleratorAllocShared(bytes);
 | 
				
			||||||
    total_shared+=bytes;
 | 
					    total_shared+=bytes;
 | 
				
			||||||
    //    std::cout <<"AcceleratorAllocate: allocated Shared pointer "<<std::hex<<ptr<<std::dec<<std::endl;
 | 
					        std::cout <<GridLogMessage<<"AcceleratorAllocate: allocated Shared pointer "<<std::hex<<ptr<<std::dec<<std::endl;
 | 
				
			||||||
    //    PrintBytes();
 | 
					//        PrintBytes();
 | 
				
			||||||
  }
 | 
					  }
 | 
				
			||||||
  return ptr;
 | 
					  return ptr;
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
@@ -74,6 +74,7 @@ void *MemoryManager::CpuAllocate(size_t bytes)
 | 
				
			|||||||
  if ( ptr == (void *) NULL ) {
 | 
					  if ( ptr == (void *) NULL ) {
 | 
				
			||||||
    ptr = (void *) acceleratorAllocShared(bytes);
 | 
					    ptr = (void *) acceleratorAllocShared(bytes);
 | 
				
			||||||
    total_host+=bytes;
 | 
					    total_host+=bytes;
 | 
				
			||||||
 | 
					//    std::cout << GridLogMessage<< "MemoryManager:: CpuAllocate  total_host= "<<total_host<<" "<< ptr << std::endl;
 | 
				
			||||||
  }
 | 
					  }
 | 
				
			||||||
  return ptr;
 | 
					  return ptr;
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
@@ -83,6 +84,7 @@ void  MemoryManager::CpuFree    (void *_ptr,size_t bytes)
 | 
				
			|||||||
  void *__freeme = Insert(_ptr,bytes,Cpu);
 | 
					  void *__freeme = Insert(_ptr,bytes,Cpu);
 | 
				
			||||||
  if ( __freeme ) { 
 | 
					  if ( __freeme ) { 
 | 
				
			||||||
    acceleratorFreeShared(__freeme);
 | 
					    acceleratorFreeShared(__freeme);
 | 
				
			||||||
 | 
					//    std::cout << GridLogMessage<< "MemoryManager:: CpuFree  total_host= "<<total_host<<" "<< __freeme << std::endl;
 | 
				
			||||||
    total_host-=bytes;
 | 
					    total_host-=bytes;
 | 
				
			||||||
  }
 | 
					  }
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 
 | 
				
			|||||||
@@ -198,7 +198,7 @@ public:
 | 
				
			|||||||
      std::cerr << " nersc_csum  " <<std::hex<< nersc_csum << " " << header.checksum<< std::dec<< std::endl;
 | 
					      std::cerr << " nersc_csum  " <<std::hex<< nersc_csum << " " << header.checksum<< std::dec<< std::endl;
 | 
				
			||||||
      exit(0);
 | 
					      exit(0);
 | 
				
			||||||
    }
 | 
					    }
 | 
				
			||||||
    assert(fabs(clone.plaquette -header.plaquette ) < 1.0e-5 );
 | 
					    assert(fabs(clone.plaquette -header.plaquette ) < 1.0e-1 );
 | 
				
			||||||
    assert(fabs(clone.link_trace-header.link_trace) < 1.0e-6 );
 | 
					    assert(fabs(clone.link_trace-header.link_trace) < 1.0e-6 );
 | 
				
			||||||
    assert(nersc_csum == header.checksum );
 | 
					    assert(nersc_csum == header.checksum );
 | 
				
			||||||
      
 | 
					      
 | 
				
			||||||
 
 | 
				
			|||||||
@@ -198,6 +198,9 @@ inline void *acceleratorAllocShared(size_t bytes)
 | 
				
			|||||||
    ptr = (void *) NULL;
 | 
					    ptr = (void *) NULL;
 | 
				
			||||||
    printf(" cudaMallocManaged failed for %d %s \n",bytes,cudaGetErrorString(err));
 | 
					    printf(" cudaMallocManaged failed for %d %s \n",bytes,cudaGetErrorString(err));
 | 
				
			||||||
  }
 | 
					  }
 | 
				
			||||||
 | 
					  size_t free,total;
 | 
				
			||||||
 | 
					  cudaMemGetInfo(&free,&total);
 | 
				
			||||||
 | 
					  std::cout<<"cudaMemGetInfo  "<<free<<" / "<<total<<std::endl;
 | 
				
			||||||
  return ptr;
 | 
					  return ptr;
 | 
				
			||||||
};
 | 
					};
 | 
				
			||||||
inline void *acceleratorAllocDevice(size_t bytes)
 | 
					inline void *acceleratorAllocDevice(size_t bytes)
 | 
				
			||||||
@@ -208,6 +211,9 @@ inline void *acceleratorAllocDevice(size_t bytes)
 | 
				
			|||||||
    ptr = (void *) NULL;
 | 
					    ptr = (void *) NULL;
 | 
				
			||||||
    printf(" cudaMalloc failed for %d %s \n",bytes,cudaGetErrorString(err));
 | 
					    printf(" cudaMalloc failed for %d %s \n",bytes,cudaGetErrorString(err));
 | 
				
			||||||
  }
 | 
					  }
 | 
				
			||||||
 | 
					  size_t free,total;
 | 
				
			||||||
 | 
					  cudaMemGetInfo(&free,&total);
 | 
				
			||||||
 | 
					  std::cout<<"cudaMemGetInfo  "<<free<<" / "<<total<<std::endl;
 | 
				
			||||||
  return ptr;
 | 
					  return ptr;
 | 
				
			||||||
};
 | 
					};
 | 
				
			||||||
inline void acceleratorFreeShared(void *ptr){ cudaFree(ptr);};
 | 
					inline void acceleratorFreeShared(void *ptr){ cudaFree(ptr);};
 | 
				
			||||||
 
 | 
				
			|||||||
@@ -167,6 +167,13 @@ void GridCmdOptionInt(std::string &str,int & val)
 | 
				
			|||||||
  return;
 | 
					  return;
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					// ypj [add]
 | 
				
			||||||
 | 
					void GridCmdOptionFloat(std::string &str,double & val)
 | 
				
			||||||
 | 
					{
 | 
				
			||||||
 | 
					  std::stringstream ss(str);
 | 
				
			||||||
 | 
					  ss>>val;
 | 
				
			||||||
 | 
					  return;
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
void GridParseLayout(char **argv,int argc,
 | 
					void GridParseLayout(char **argv,int argc,
 | 
				
			||||||
		     Coordinate &latt_c,
 | 
							     Coordinate &latt_c,
 | 
				
			||||||
 
 | 
				
			|||||||
@@ -57,7 +57,8 @@ void GridCmdOptionCSL(std::string str,std::vector<std::string> & vec);
 | 
				
			|||||||
template<class VectorInt>
 | 
					template<class VectorInt>
 | 
				
			||||||
void GridCmdOptionIntVector(const std::string &str,VectorInt & vec);
 | 
					void GridCmdOptionIntVector(const std::string &str,VectorInt & vec);
 | 
				
			||||||
void GridCmdOptionInt(std::string &str,int & val);
 | 
					void GridCmdOptionInt(std::string &str,int & val);
 | 
				
			||||||
 | 
					// ypj [add]
 | 
				
			||||||
 | 
					void GridCmdOptionFloat(std::string &str,double & val);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
void GridParseLayout(char **argv,int argc,
 | 
					void GridParseLayout(char **argv,int argc,
 | 
				
			||||||
		     std::vector<int> &latt,
 | 
							     std::vector<int> &latt,
 | 
				
			||||||
 
 | 
				
			|||||||
							
								
								
									
										73
									
								
								tests/lanczos/Test_dwf_block_lanczos.README
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										73
									
								
								tests/lanczos/Test_dwf_block_lanczos.README
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,73 @@
 | 
				
			|||||||
 | 
					#Example script 
 | 
				
			||||||
 | 
					DIR=/gpfs/alpine/phy157/proj-shared/phy157dwf/chulwoo/Grid/BL/build/tests/lanczos
 | 
				
			||||||
 | 
					BIN=${DIR}/Test_dwf_block_lanczos
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					VOL='--grid 16.16.16.32 '
 | 
				
			||||||
 | 
					GRID='--mpi 1.1.1.4 ' 
 | 
				
			||||||
 | 
					CONF='--gconf ckpoint_lat.IEEE64BIG.2000 '
 | 
				
			||||||
 | 
					OPT='--mass 0.01 --M5 1.8 --phase in.params --omega in.params --shm 4096' 
 | 
				
			||||||
 | 
					#BL='--rbl 16.1024.128.1000.10 --split 1.1.4.4 --check_int 100 --resid 1.0e-5 --cheby_l 0.007 --cheby_u 7 --cheby_n 51'
 | 
				
			||||||
 | 
					BL='--rbl 4.128.16.100.10 --split 1.1.1.4 --check_int 25 --resid 1.0e-5 --cheby_l 0.007 --cheby_u 7 --cheby_n 51'
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					ARGS=${CONF}" "${OPT}" "${BL}" "${VOL}" "${GRID}
 | 
				
			||||||
 | 
					export APP="${BIN}  ${ARGS}"
 | 
				
			||||||
 | 
					echo APP=${APP}
 | 
				
			||||||
 | 
					#export JS="jsrun --nrs 32 -a4 -g4 -c42 -dpacked -b packed:7 --smpiargs="-gpu" "
 | 
				
			||||||
 | 
					export JS="jsrun --nrs 1 -a4 -g4 -c42 -dpacked -b  packed:10  --smpiargs="-gpu" "
 | 
				
			||||||
 | 
					$JS  $APP
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					#sample in.param 
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					boundary_phase 0 1 0
 | 
				
			||||||
 | 
					boundary_phase 1 1 0
 | 
				
			||||||
 | 
					boundary_phase 2 1 0
 | 
				
			||||||
 | 
					boundary_phase 3 -1 0
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					omega 0 0.5 0
 | 
				
			||||||
 | 
					omega 1 0.5 0
 | 
				
			||||||
 | 
					omega 2 0.5 0
 | 
				
			||||||
 | 
					omega 3 0.5 0
 | 
				
			||||||
 | 
					omega 4 0.5 0
 | 
				
			||||||
 | 
					omega 5 0.5 0
 | 
				
			||||||
 | 
					omega 6 0.5 0
 | 
				
			||||||
 | 
					omega 7 0.5 0
 | 
				
			||||||
 | 
					omega 8 0.5 0
 | 
				
			||||||
 | 
					omega 9 0.5 0
 | 
				
			||||||
 | 
					omega 10 0.5 0
 | 
				
			||||||
 | 
					omega 11 0.5 0
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					#output 
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					Grid : Message : 1.717474 s :  Gauge Configuration ckpoint_lat.IEEE64BIG.2000
 | 
				
			||||||
 | 
					Grid : Message : 1.717478 s :  boundary_phase[0] = (1,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717497 s :  boundary_phase[1] = (1,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717500 s :  boundary_phase[2] = (1,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717503 s :  boundary_phase[3] = (-1,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717506 s :  Ls 12
 | 
				
			||||||
 | 
					Grid : Message : 1.717507 s :  mass 0.01
 | 
				
			||||||
 | 
					Grid : Message : 1.717510 s :  M5 1.8
 | 
				
			||||||
 | 
					Grid : Message : 1.717512 s :  mob_b 1.5
 | 
				
			||||||
 | 
					Grid : Message : 1.717514 s :  omega[0] = (0.5,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717517 s :  omega[1] = (0.5,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717520 s :  omega[2] = (0.5,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717523 s :  omega[3] = (0.5,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717526 s :  omega[4] = (0.5,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717529 s :  omega[5] = (0.5,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717532 s :  omega[6] = (0.5,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717535 s :  omega[7] = (0.5,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717538 s :  omega[8] = (0.5,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717541 s :  omega[9] = (0.5,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717544 s :  omega[10] = (0.5,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717547 s :  omega[11] = (0.5,0)
 | 
				
			||||||
 | 
					Grid : Message : 1.717550 s :  Nu 4
 | 
				
			||||||
 | 
					Grid : Message : 1.717551 s :  Nk 128
 | 
				
			||||||
 | 
					Grid : Message : 1.717552 s :  Np 16
 | 
				
			||||||
 | 
					Grid : Message : 1.717553 s :  Nm 288
 | 
				
			||||||
 | 
					Grid : Message : 1.717554 s :  Nstop 100
 | 
				
			||||||
 | 
					Grid : Message : 1.717555 s :  Ntest 25
 | 
				
			||||||
 | 
					Grid : Message : 1.717557 s :  MaxIter 10
 | 
				
			||||||
 | 
					Grid : Message : 1.717558 s :  resid 1e-05
 | 
				
			||||||
 | 
					Grid : Message : 1.717560 s :  Cheby Poly 0.007,7,51
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
							
								
								
									
										403
									
								
								tests/lanczos/Test_dwf_block_lanczos.cc
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										403
									
								
								tests/lanczos/Test_dwf_block_lanczos.cc
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,403 @@
 | 
				
			|||||||
 | 
					    /*************************************************************************************
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    Grid physics library, www.github.com/paboyle/Grid 
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    Source file: ./tests/Test_dwf_block_lanczos.cc
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    Copyright (C) 2015
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					Author: Peter Boyle <paboyle@ph.ed.ac.uk>
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    This program is free software; you can redistribute it and/or modify
 | 
				
			||||||
 | 
					    it under the terms of the GNU General Public License as published by
 | 
				
			||||||
 | 
					    the Free Software Foundation; either version 2 of the License, or
 | 
				
			||||||
 | 
					    (at your option) any later version.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    This program is distributed in the hope that it will be useful,
 | 
				
			||||||
 | 
					    but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
				
			||||||
 | 
					    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
				
			||||||
 | 
					    GNU General Public License for more details.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    You should have received a copy of the GNU General Public License along
 | 
				
			||||||
 | 
					    with this program; if not, write to the Free Software Foundation, Inc.,
 | 
				
			||||||
 | 
					    51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    See the full license in the file "LICENSE" in the top level distribution directory
 | 
				
			||||||
 | 
					    *************************************************************************************/
 | 
				
			||||||
 | 
					    /*  END LEGAL */
 | 
				
			||||||
 | 
					#include <Grid/Grid.h>
 | 
				
			||||||
 | 
					#include <Grid/util/Init.h>
 | 
				
			||||||
 | 
					#include <Grid/algorithms/iterative/ImplicitlyRestartedBlockLanczos.h>
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					using namespace std;
 | 
				
			||||||
 | 
					using namespace Grid;
 | 
				
			||||||
 | 
					//using namespace Grid::QCD;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					//typedef typename GparityDomainWallFermionR::FermionField FermionField;
 | 
				
			||||||
 | 
					typedef typename ZMobiusFermionF::FermionField FermionField;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					RealD AllZero(RealD x){ return 0.;}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					class CmdJobParams 
 | 
				
			||||||
 | 
					{
 | 
				
			||||||
 | 
					  public:
 | 
				
			||||||
 | 
					    std::string gaugefile;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    int Ls;
 | 
				
			||||||
 | 
					    double mass;
 | 
				
			||||||
 | 
					    double M5;
 | 
				
			||||||
 | 
					    double mob_b;
 | 
				
			||||||
 | 
					    std::vector<ComplexD> omega;
 | 
				
			||||||
 | 
					    std::vector<Complex> boundary_phase;
 | 
				
			||||||
 | 
					    std::vector<int> mpi_split;
 | 
				
			||||||
 | 
					    
 | 
				
			||||||
 | 
					    LanczosType Impl;
 | 
				
			||||||
 | 
					    int Nu;
 | 
				
			||||||
 | 
					    int Nk;
 | 
				
			||||||
 | 
					    int Np;
 | 
				
			||||||
 | 
					    int Nm;
 | 
				
			||||||
 | 
					    int Nstop;
 | 
				
			||||||
 | 
					    int Ntest;
 | 
				
			||||||
 | 
					    int MaxIter;
 | 
				
			||||||
 | 
					    double resid;
 | 
				
			||||||
 | 
					    
 | 
				
			||||||
 | 
					    double low;
 | 
				
			||||||
 | 
					    double high;
 | 
				
			||||||
 | 
					    int order;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    CmdJobParams()
 | 
				
			||||||
 | 
					      : gaugefile("Hot"),
 | 
				
			||||||
 | 
					        Ls(8), mass(0.01), M5(1.8), mob_b(1.5),
 | 
				
			||||||
 | 
					        Impl(LanczosType::irbl),mpi_split(4,1),
 | 
				
			||||||
 | 
					        Nu(4), Nk(200), Np(200), Nstop(100), Ntest(1), MaxIter(10), resid(1.0e-8), 
 | 
				
			||||||
 | 
					        low(0.2), high(5.5), order(11)
 | 
				
			||||||
 | 
					    {Nm=Nk+Np;};
 | 
				
			||||||
 | 
					    
 | 
				
			||||||
 | 
					    void Parse(char **argv, int argc);
 | 
				
			||||||
 | 
					};
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					void CmdJobParams::Parse(char **argv,int argc)
 | 
				
			||||||
 | 
					{
 | 
				
			||||||
 | 
					  std::string arg;
 | 
				
			||||||
 | 
					  std::vector<int> vi;
 | 
				
			||||||
 | 
					  double re,im;
 | 
				
			||||||
 | 
					  int expect, idx;
 | 
				
			||||||
 | 
					  std::string vstr;
 | 
				
			||||||
 | 
					  std::ifstream pfile;
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--gconf") ){
 | 
				
			||||||
 | 
					    gaugefile = GridCmdOptionPayload(argv,argv+argc,"--gconf");
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--phase") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--phase");
 | 
				
			||||||
 | 
					    pfile.open(arg);
 | 
				
			||||||
 | 
					    assert(pfile);
 | 
				
			||||||
 | 
					    expect = 0;
 | 
				
			||||||
 | 
					    while( pfile >> vstr ) {
 | 
				
			||||||
 | 
					      if ( vstr.compare("boundary_phase") == 0 ) {
 | 
				
			||||||
 | 
					        pfile >> vstr;
 | 
				
			||||||
 | 
					        GridCmdOptionInt(vstr,idx);
 | 
				
			||||||
 | 
					        assert(expect==idx);
 | 
				
			||||||
 | 
					        pfile >> vstr;
 | 
				
			||||||
 | 
					        GridCmdOptionFloat(vstr,re);
 | 
				
			||||||
 | 
					        pfile >> vstr;
 | 
				
			||||||
 | 
					        GridCmdOptionFloat(vstr,im);
 | 
				
			||||||
 | 
					        boundary_phase.push_back({re,im});
 | 
				
			||||||
 | 
					        expect++;
 | 
				
			||||||
 | 
					      }
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					    pfile.close();
 | 
				
			||||||
 | 
					  } else {
 | 
				
			||||||
 | 
					    for (int i=0; i<4; ++i) boundary_phase.push_back({1.,0.});
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--omega") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--omega");
 | 
				
			||||||
 | 
					    pfile.open(arg);
 | 
				
			||||||
 | 
					    assert(pfile);
 | 
				
			||||||
 | 
					    Ls = 0;
 | 
				
			||||||
 | 
					    while( pfile >> vstr ) {
 | 
				
			||||||
 | 
					      if ( vstr.compare("omega") == 0 ) {
 | 
				
			||||||
 | 
					        pfile >> vstr;
 | 
				
			||||||
 | 
					        GridCmdOptionInt(vstr,idx);
 | 
				
			||||||
 | 
					        assert(Ls==idx);
 | 
				
			||||||
 | 
					        pfile >> vstr;
 | 
				
			||||||
 | 
					        GridCmdOptionFloat(vstr,re);
 | 
				
			||||||
 | 
					        pfile >> vstr;
 | 
				
			||||||
 | 
					        GridCmdOptionFloat(vstr,im);
 | 
				
			||||||
 | 
					        omega.push_back({re,im});
 | 
				
			||||||
 | 
					        Ls++;
 | 
				
			||||||
 | 
					      }
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					    pfile.close();
 | 
				
			||||||
 | 
					  } else {
 | 
				
			||||||
 | 
					    if( GridCmdOptionExists(argv,argv+argc,"--Ls") ){
 | 
				
			||||||
 | 
					      arg = GridCmdOptionPayload(argv,argv+argc,"--Ls");
 | 
				
			||||||
 | 
					      GridCmdOptionInt(arg,Ls);
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--mass") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--mass");
 | 
				
			||||||
 | 
					    GridCmdOptionFloat(arg,mass);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--M5") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--M5");
 | 
				
			||||||
 | 
					    GridCmdOptionFloat(arg,M5);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--mob_b") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--mob_b");
 | 
				
			||||||
 | 
					    GridCmdOptionFloat(arg,mob_b);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--irbl") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--irbl");
 | 
				
			||||||
 | 
					    GridCmdOptionIntVector(arg,vi);
 | 
				
			||||||
 | 
					    Nu = vi[0];
 | 
				
			||||||
 | 
					    Nk = vi[1];
 | 
				
			||||||
 | 
					    Np = vi[2];
 | 
				
			||||||
 | 
					    Nstop = vi[3];
 | 
				
			||||||
 | 
					    MaxIter = vi[4];
 | 
				
			||||||
 | 
					    // ypj[fixme] mode overriding message is needed.
 | 
				
			||||||
 | 
					    Impl = LanczosType::irbl;
 | 
				
			||||||
 | 
					    Nm = Nk+Np;
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  // block Lanczos with explicit extension of its dimensions
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--rbl") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--rbl");
 | 
				
			||||||
 | 
					    GridCmdOptionIntVector(arg,vi);
 | 
				
			||||||
 | 
					    Nu = vi[0];
 | 
				
			||||||
 | 
					    Nk = vi[1];
 | 
				
			||||||
 | 
					    Np = vi[2]; // vector space is enlarged by adding Np vectors
 | 
				
			||||||
 | 
					    Nstop = vi[3];
 | 
				
			||||||
 | 
					    MaxIter = vi[4];
 | 
				
			||||||
 | 
					    // ypj[fixme] mode overriding message is needed.
 | 
				
			||||||
 | 
					    Impl = LanczosType::rbl;
 | 
				
			||||||
 | 
					    Nm = Nk+Np*MaxIter;
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					#if 1
 | 
				
			||||||
 | 
					  // block Lanczos with explicit extension of its dimensions
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--split") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--split");
 | 
				
			||||||
 | 
					    GridCmdOptionIntVector(arg,vi);
 | 
				
			||||||
 | 
					    for(int i=0;i<mpi_split.size();i++)
 | 
				
			||||||
 | 
					    mpi_split[i] = vi[i];
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					#endif
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--check_int") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--check_int");
 | 
				
			||||||
 | 
					    GridCmdOptionInt(arg,Ntest);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--resid") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--resid");
 | 
				
			||||||
 | 
					    GridCmdOptionFloat(arg,resid);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--cheby_l") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--cheby_l");
 | 
				
			||||||
 | 
					    GridCmdOptionFloat(arg,low);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--cheby_u") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--cheby_u");
 | 
				
			||||||
 | 
					    GridCmdOptionFloat(arg,high);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if( GridCmdOptionExists(argv,argv+argc,"--cheby_n") ){
 | 
				
			||||||
 | 
					    arg = GridCmdOptionPayload(argv,argv+argc,"--cheby_n");
 | 
				
			||||||
 | 
					    GridCmdOptionInt(arg,order);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if ( CartesianCommunicator::RankWorld() == 0 ) {
 | 
				
			||||||
 | 
					    std::streamsize ss = std::cout.precision();
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" Gauge Configuration "<< gaugefile << '\n';
 | 
				
			||||||
 | 
					    std::cout.precision(15);
 | 
				
			||||||
 | 
					    for ( int i=0; i<4; ++i ) std::cout << GridLogMessage <<" boundary_phase["<< i << "] = " << boundary_phase[i] << '\n';
 | 
				
			||||||
 | 
					    std::cout.precision(ss);
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" Ls "<< Ls << '\n';
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" mass "<< mass << '\n';
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" M5 "<< M5 << '\n';
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" mob_b "<< mob_b << '\n';
 | 
				
			||||||
 | 
					    std::cout.precision(15);
 | 
				
			||||||
 | 
					    for ( int i=0; i<Ls; ++i ) std::cout << GridLogMessage <<" omega["<< i << "] = " << omega[i] << '\n';
 | 
				
			||||||
 | 
					    std::cout.precision(ss);
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" Nu "<< Nu << '\n'; 
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" Nk "<< Nk << '\n'; 
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" Np "<< Np << '\n'; 
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" Nm "<< Nm << '\n'; 
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" Nstop "<< Nstop << '\n'; 
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" Ntest "<< Ntest << '\n'; 
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" MaxIter "<< MaxIter << '\n'; 
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" resid "<< resid << '\n'; 
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage <<" Cheby Poly "<< low << "," << high << "," << order << std::endl; 
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					int main (int argc, char ** argv)
 | 
				
			||||||
 | 
					{
 | 
				
			||||||
 | 
					  Grid_init(&argc,&argv);
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  CmdJobParams JP;
 | 
				
			||||||
 | 
					  JP.Parse(argv,argc);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  GridCartesian         * UGridD   = SpaceTimeGrid::makeFourDimGrid(GridDefaultLatt(), GridDefaultSimd(Nd,vComplex::Nsimd()),GridDefaultMpi());
 | 
				
			||||||
 | 
					  GridCartesian         * UGrid   = SpaceTimeGrid::makeFourDimGrid(GridDefaultLatt(), GridDefaultSimd(Nd,vComplexF::Nsimd()),GridDefaultMpi());
 | 
				
			||||||
 | 
					  GridRedBlackCartesian * UrbGrid = SpaceTimeGrid::makeFourDimRedBlackGrid(UGrid);
 | 
				
			||||||
 | 
					  GridCartesian         * FGrid   = SpaceTimeGrid::makeFiveDimGrid(JP.Ls,UGrid);
 | 
				
			||||||
 | 
					  GridRedBlackCartesian * FrbGrid = SpaceTimeGrid::makeFiveDimRedBlackGrid(JP.Ls,UGrid);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  std::vector<int> seeds4({1,2,3,4});
 | 
				
			||||||
 | 
					  std::vector<int> seeds5({5,6,7,8});
 | 
				
			||||||
 | 
					  GridParallelRNG          RNG5(FGrid);  RNG5.SeedFixedIntegers(seeds5);
 | 
				
			||||||
 | 
					  GridParallelRNG          RNG4(UGrid);  RNG4.SeedFixedIntegers(seeds4);
 | 
				
			||||||
 | 
					  // ypj [note] why seed RNG5 again? bug? In this case, run with a default seed().
 | 
				
			||||||
 | 
					  GridParallelRNG          RNG5rb(FrbGrid);  RNG5rb.SeedFixedIntegers(seeds5);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  LatticeGaugeField UmuD(UGridD); 
 | 
				
			||||||
 | 
					  LatticeGaugeFieldF Umu(UGrid); 
 | 
				
			||||||
 | 
					  std::vector<LatticeColourMatrixF> U(4,UGrid);
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  if ( JP.gaugefile.compare("Hot") == 0 ) {
 | 
				
			||||||
 | 
					    SU3::HotConfiguration(RNG4, UmuD);
 | 
				
			||||||
 | 
					  } else {
 | 
				
			||||||
 | 
					    FieldMetaData header;
 | 
				
			||||||
 | 
					    NerscIO::readConfiguration(UmuD,header,JP.gaugefile);
 | 
				
			||||||
 | 
					    // ypj [fixme] additional checks for the loaded configuration?
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  precisionChange(Umu,UmuD);
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  for(int mu=0;mu<Nd;mu++){
 | 
				
			||||||
 | 
					    U[mu] = PeekIndex<LorentzIndex>(Umu,mu);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  RealD mass = JP.mass;
 | 
				
			||||||
 | 
					  RealD M5 = JP.M5;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					// ypj [fixme] flexible support for a various Fermions
 | 
				
			||||||
 | 
					//  RealD mob_b = JP.mob_b;      // Gparity
 | 
				
			||||||
 | 
					//  std::vector<ComplexD> omega; // ZMobius
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					//  GparityMobiusFermionD ::ImplParams params;
 | 
				
			||||||
 | 
					//  std::vector<int> twists({1,1,1,0});
 | 
				
			||||||
 | 
					//  params.twists = twists;
 | 
				
			||||||
 | 
					//  GparityMobiusFermionR  Ddwf(Umu,*FGrid,*FrbGrid,*UGrid,*UrbGrid,mass,M5,mob_b,mob_b-1.,params);
 | 
				
			||||||
 | 
					//  SchurDiagTwoOperator<GparityMobiusFermionR,FermionField> HermOp(Ddwf);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					//  int mrhs = JP.Nu;
 | 
				
			||||||
 | 
					  int Ndir=4;
 | 
				
			||||||
 | 
					  auto mpi_layout  = GridDefaultMpi();
 | 
				
			||||||
 | 
					  std::vector<int> mpi_split (Ndir,1);
 | 
				
			||||||
 | 
					#if 0
 | 
				
			||||||
 | 
					    int tmp=mrhs, dir=0;
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage  << "dir= "<<dir <<"tmp= "<<tmp<<"mpi_split= "<<mpi_split[dir]<<"mpi_layout= "<<mpi_split[dir]<<std::endl;
 | 
				
			||||||
 | 
					    while ( tmp> 1) {
 | 
				
			||||||
 | 
					    if ((mpi_split[dir]*2) <= mpi_layout[dir]){
 | 
				
			||||||
 | 
					        mpi_split[dir] *=2;
 | 
				
			||||||
 | 
					        tmp = tmp/2;
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage  << "dir= "<<dir <<"tmp= "<<tmp<<"mpi_split= "<<mpi_split[dir]<<"mpi_layout= "<<mpi_layout[dir]<<std::endl;
 | 
				
			||||||
 | 
					        dir = (dir+1)%Ndir;
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					#endif
 | 
				
			||||||
 | 
					    int mrhs=1;
 | 
				
			||||||
 | 
					    for(int i =0;i<Ndir;i++){
 | 
				
			||||||
 | 
					      mpi_split[i] = mpi_layout[i] / JP.mpi_split[i] ;
 | 
				
			||||||
 | 
					      mrhs *= JP.mpi_split[i];
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage  << "mpi_layout= " << mpi_layout << std::endl;
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage  << "mpi_split= " << mpi_split << std::endl;
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage  << "mrhs= " << mrhs << std::endl;
 | 
				
			||||||
 | 
					//    assert(JP.Nu==tmp);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  /////////////////////////////////////////////
 | 
				
			||||||
 | 
					  // Split into 1^4 mpi communicators
 | 
				
			||||||
 | 
					  /////////////////////////////////////////////
 | 
				
			||||||
 | 
					  GridCartesian         * SGrid = new GridCartesian(GridDefaultLatt(),
 | 
				
			||||||
 | 
					                                                    GridDefaultSimd(Nd,vComplexF::Nsimd()),
 | 
				
			||||||
 | 
					                                                    mpi_split,
 | 
				
			||||||
 | 
					                                                    *UGrid);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  GridCartesian         * SFGrid   = SpaceTimeGrid::makeFiveDimGrid(JP.Ls,SGrid);
 | 
				
			||||||
 | 
					  GridRedBlackCartesian * SrbGrid  = SpaceTimeGrid::makeFourDimRedBlackGrid(SGrid);
 | 
				
			||||||
 | 
					  GridRedBlackCartesian * SFrbGrid = SpaceTimeGrid::makeFiveDimRedBlackGrid(JP.Ls,SGrid);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  LatticeGaugeFieldF s_Umu(SGrid);
 | 
				
			||||||
 | 
					  Grid_split  (Umu,s_Umu);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  //WilsonFermionR::ImplParams params;
 | 
				
			||||||
 | 
					  ZMobiusFermionF::ImplParams params;
 | 
				
			||||||
 | 
					  params.overlapCommsCompute = true;
 | 
				
			||||||
 | 
					  params.boundary_phases = JP.boundary_phase;
 | 
				
			||||||
 | 
					  ZMobiusFermionF  Ddwf(Umu,*FGrid,*FrbGrid,*UGrid,*UrbGrid,mass,M5,JP.omega,1.,0.,params);
 | 
				
			||||||
 | 
					//  SchurDiagTwoOperator<ZMobiusFermionR,FermionField> HermOp(Ddwf);
 | 
				
			||||||
 | 
					  SchurDiagOneOperator<ZMobiusFermionF,FermionField> HermOp(Ddwf);
 | 
				
			||||||
 | 
					  ZMobiusFermionF  Dsplit(s_Umu,*SFGrid,*SFrbGrid,*SGrid,*SrbGrid,mass,M5,JP.omega,1.,0.,params);
 | 
				
			||||||
 | 
					//  SchurDiagTwoOperator<ZMobiusFermionR,FermionField> SHermOp(Dsplit);
 | 
				
			||||||
 | 
					  SchurDiagOneOperator<ZMobiusFermionF,FermionField> SHermOp(Dsplit);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  //std::vector<double> Coeffs { 0.,-1.}; 
 | 
				
			||||||
 | 
					  // ypj [note] this may not be supported by some compilers
 | 
				
			||||||
 | 
					  std::vector<double> Coeffs({ 0.,-1.}); 
 | 
				
			||||||
 | 
					  Polynomial<FermionField> PolyX(Coeffs);
 | 
				
			||||||
 | 
					  //Chebyshev<FermionField> Cheb(0.2,5.5,11);
 | 
				
			||||||
 | 
					  Chebyshev<FermionField> Cheb(JP.low,JP.high,JP.order);
 | 
				
			||||||
 | 
					//  Cheb.csv(std::cout);
 | 
				
			||||||
 | 
					  ImplicitlyRestartedBlockLanczos<FermionField> IRBL(HermOp, SHermOp,
 | 
				
			||||||
 | 
											     FrbGrid,SFrbGrid,mrhs,
 | 
				
			||||||
 | 
					                                                     Cheb,
 | 
				
			||||||
 | 
					                                                     JP.Nstop, JP.Ntest,
 | 
				
			||||||
 | 
					                                                     JP.Nu, JP.Nk, JP.Nm,
 | 
				
			||||||
 | 
					                                                     JP.resid,
 | 
				
			||||||
 | 
					                                                     JP.MaxIter,
 | 
				
			||||||
 | 
											     IRBLdiagonaliseWithEigen);
 | 
				
			||||||
 | 
					//						     IRBLdiagonaliseWithLAPACK);
 | 
				
			||||||
 | 
					  IRBL.split_test=0;
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  std::vector<RealD> eval(JP.Nm);
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  std::vector<FermionField> src(JP.Nu,FrbGrid);
 | 
				
			||||||
 | 
					if (0)
 | 
				
			||||||
 | 
					{
 | 
				
			||||||
 | 
					// in case RNG is too slow
 | 
				
			||||||
 | 
					  std::cout << GridLogMessage << "Using RNG5"<<std::endl;
 | 
				
			||||||
 | 
					  FermionField src_tmp(FGrid);
 | 
				
			||||||
 | 
					  for ( int i=0; i<JP.Nu; ++i ){
 | 
				
			||||||
 | 
					//    gaussian(RNG5,src_tmp);
 | 
				
			||||||
 | 
					     ComplexD rnd;
 | 
				
			||||||
 | 
					     RealD re;
 | 
				
			||||||
 | 
					     fillScalar(re,RNG5._gaussian[0],RNG5._generators[0]);
 | 
				
			||||||
 | 
					    std::cout << i <<" / "<< JP.Nm  <<" re "<< re  << std::endl;
 | 
				
			||||||
 | 
					// printf("%d / %d re %e\n",i,FGrid->_processor,re);
 | 
				
			||||||
 | 
					    src_tmp=re;
 | 
				
			||||||
 | 
					    pickCheckerboard(Odd,src[i],src_tmp);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  RNG5.Report();
 | 
				
			||||||
 | 
					} else {
 | 
				
			||||||
 | 
					  std::cout << GridLogMessage << "Using RNG5rb"<<std::endl;
 | 
				
			||||||
 | 
					  for ( int i=0; i<JP.Nu; ++i )
 | 
				
			||||||
 | 
					    gaussian(RNG5rb,src[i]);
 | 
				
			||||||
 | 
					  RNG5rb.Report();
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					  
 | 
				
			||||||
 | 
					  std::vector<FermionField> evec(JP.Nm,FrbGrid);
 | 
				
			||||||
 | 
					  for(int i=0;i<1;++i){
 | 
				
			||||||
 | 
					    std::cout << GridLogMessage << i <<" / "<< JP.Nm <<" grid pointer "<< evec[i].Grid() << std::endl;
 | 
				
			||||||
 | 
					  };
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  int Nconv;
 | 
				
			||||||
 | 
					  IRBL.calc(eval,evec,src,Nconv,JP.Impl);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  Grid_finalize();
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
							
								
								
									
										27
									
								
								tests/lanczos/dwf.batch
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										27
									
								
								tests/lanczos/dwf.batch
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,27 @@
 | 
				
			|||||||
 | 
					# run script on Cori
 | 
				
			||||||
 | 
					#!/bin/bash
 | 
				
			||||||
 | 
					#SBATCH  -t 30
 | 
				
			||||||
 | 
					#SBATCH  -N 16
 | 
				
			||||||
 | 
					#SBATCH  -C knl
 | 
				
			||||||
 | 
					#SBATCH  -A mp13
 | 
				
			||||||
 | 
					#SBATCH  --ntasks-per-node=1
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					export OMP_PROC_BIND=true
 | 
				
			||||||
 | 
					export OMP_PLACES=threads
 | 
				
			||||||
 | 
					export OMP_NUM_THREADS=64
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					#BIN=benchmarks/Benchmark_ITT
 | 
				
			||||||
 | 
					#OPT='--cpu-bind=cores' 
 | 
				
			||||||
 | 
					BIN=./Test_dwf_block_lanczos
 | 
				
			||||||
 | 
					rundir=.
 | 
				
			||||||
 | 
					CONF='--gconf '${rundir}'/ckpoint_lat.IEEE64BIG.5000'
 | 
				
			||||||
 | 
					VOL='--grid 16.16.16.32'
 | 
				
			||||||
 | 
					GRID='--mpi 1.2.2.4'
 | 
				
			||||||
 | 
					OPT='--mass 0.00054 --M5 1.8 --phase in.params --omega in.params --shm 4096'
 | 
				
			||||||
 | 
					BL='--rbl 4.32.32.30.7 --split 1.2.2.1 --check_int 8 --resid 1.0e-5 --cheby_l 0.0027 --cheby_u 7 --cheby_n 51'
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					#echo srun $OPT $BIN $gridoptions $jobparams
 | 
				
			||||||
 | 
					#srun $OPT $BIN $gridoptions $jobparams
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					echo srun $BIN $CONF $OPT $BL $VOL $GRID
 | 
				
			||||||
 | 
					srun $BIN $CONF $OPT $BL $VOL $GRID
 | 
				
			||||||
							
								
								
									
										17
									
								
								tests/lanczos/in.params
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										17
									
								
								tests/lanczos/in.params
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,17 @@
 | 
				
			|||||||
 | 
					boundary_phase 0 1 0
 | 
				
			||||||
 | 
					boundary_phase 1 1 0
 | 
				
			||||||
 | 
					boundary_phase 2 1 0
 | 
				
			||||||
 | 
					boundary_phase 3 -1 0
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					omega 0 0.375 0
 | 
				
			||||||
 | 
					omega 1 0.375 0
 | 
				
			||||||
 | 
					omega 2 0.375 0
 | 
				
			||||||
 | 
					omega 3 0.375 0
 | 
				
			||||||
 | 
					omega 4 0.375 0
 | 
				
			||||||
 | 
					omega 5 0.375 0
 | 
				
			||||||
 | 
					omega 6 0.375 0
 | 
				
			||||||
 | 
					omega 7 0.375 0
 | 
				
			||||||
 | 
					omega 8 0.375 0
 | 
				
			||||||
 | 
					omega 9 0.375 0
 | 
				
			||||||
 | 
					omega 10 0.375 0
 | 
				
			||||||
 | 
					omega 11 0.375 0
 | 
				
			||||||
		Reference in New Issue
	
	Block a user