mirror of
				https://github.com/paboyle/Grid.git
				synced 2025-10-23 09:14:48 +01:00 
			
		
		
		
	More verbosity. The 16-bit limit on Grid.y and Grid.z is annoying.
This commit is contained in:
		| @@ -53,7 +53,6 @@ void acceleratorInit(void) | ||||
|     prop = gpu_props[i]; | ||||
|     totalDeviceMem = prop.totalGlobalMem; | ||||
|     if ( world_rank == 0) { | ||||
| #ifndef GRID_DEFAULT_GPU | ||||
|       if ( i==rank ) { | ||||
| 	printf("AcceleratorCudaInit[%d]: ========================\n",rank); | ||||
| 	printf("AcceleratorCudaInit[%d]: Device Number    : %d\n", rank,i); | ||||
| @@ -67,8 +66,8 @@ void acceleratorInit(void) | ||||
| 	GPU_PROP(warpSize); | ||||
| 	GPU_PROP(pciBusID); | ||||
| 	GPU_PROP(pciDeviceID); | ||||
|  	printf("AcceleratorCudaInit[%d]: maxGridSize (%d,%d,%d)\n",rank,prop.maxGridSize[0],prop.maxGridSize[1],prop.maxGridSize[2]); | ||||
|       } | ||||
| #endif | ||||
|       //      GPU_PROP(unifiedAddressing); | ||||
|       //      GPU_PROP(l2CacheSize); | ||||
|       //      GPU_PROP(singleToDoublePrecisionPerfRatio); | ||||
|   | ||||
| @@ -178,9 +178,10 @@ void Lambda6Apply(uint64_t num1, uint64_t num2, uint64_t num3, | ||||
|     cudaDeviceSynchronize();						\ | ||||
|     cudaError err = cudaGetLastError();					\ | ||||
|     if ( cudaSuccess != err ) {						\ | ||||
|       printf("Cuda error %s \n", cudaGetErrorString( err ));		\ | ||||
|       puts(__FILE__);							\ | ||||
|       printf("Line %d\n",__LINE__);					\ | ||||
|       printf("accelerator_barrier(): Cuda error %s \n",			\ | ||||
| 	     cudaGetErrorString( err ));				\ | ||||
|       printf("File %s Line %d\n",__FILE__,__LINE__);			\ | ||||
|       fflush(stdout);							\ | ||||
|       if (acceleratorAbortOnGpuError) assert(err==cudaSuccess);		\ | ||||
|     }									\ | ||||
|   } | ||||
|   | ||||
		Reference in New Issue
	
	Block a user