diff --git a/Grid/algorithms/iterative/ImplicitlyRestartedBlockLanczos.h b/Grid/algorithms/iterative/ImplicitlyRestartedBlockLanczos.h index fe388c19..c5d00722 100644 --- a/Grid/algorithms/iterative/ImplicitlyRestartedBlockLanczos.h +++ b/Grid/algorithms/iterative/ImplicitlyRestartedBlockLanczos.h @@ -7,9 +7,8 @@ Copyright (C) 2015 Author: Peter Boyle -Author: Chulwoo Jung Author: Yong-Chull Jang -Author: Guido Cossu +Author: Chulwoo Jung This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by @@ -185,10 +184,6 @@ public: { RealD nn = norm2(v); nn = sqrt(nn); -#if 0 - if(if_print && nn < 1e20) - Glog<<"normalize: "< 1e-14) - Glog<<"orthogonalize before: "< 1e-14) - Glog<<"orthogonalize after: "<GlobalSumVector((CUDA_FLOAT*)c_acc,2*Nu*Nevec_acc); -#if 0 - for (int i=0; i[" << j << "," << i << "] = " - << z.x << " + i " << z.y << std::endl; - } - w[i] = w[i] - ip * evec[b*Nevec_acc+j]; - } - } -#else alpha = MAKE_CUDA_COMPLEX(-1.0,0.0); beta = MAKE_CUDA_COMPLEX(1.0,0.0); stat = CUDA_GEMM(handle, CUBLAS_OP_N, CUBLAS_OP_N, 12*sites, Nu, Nevec_acc, @@ -340,9 +292,7 @@ public: &beta, w_acc, 12*sites); //Glog << stat << std::endl; -#endif } -#if 1 for (int col=0; col &inner, std::vector& lhs, int llhs, std::vector& rhs, int lrhs) -{ - typedef typename Field:vector_object vobj; - typedef typename vobj::scalar_type scalar_type; - typedef typename vobj::vector_typeD vector_type; - GridBase *grid = lhs[0]._grid; - assert(grid == rhs[0]._grid; - const int pad = 8; - int total = llhs*lrhs; - assert(inner.size()==total); - int sum_size=grid->SumArraySize(); - -// std::vector inner(total); - Vector sumarray(sum_size*pad*total); - - parallel_for(int thr=0;throSites(),thr,mywork,myoff); - - std::vector< decltype(innerProductD(lhs[0]._odata[0],rhs[0]._odata[0])) > vinner(total,zero); // private to thread; sub summation - for(int ss=myoff;ssGlobalSum(tmp); - inner[i]=tmp; - } -// return inner; -} -#endif - void orthogonalize_blockhead(Field& w, std::vector& evec, int k, int Nu) { @@ -839,14 +738,6 @@ cudaStat = cudaMallocManaged((void **)&evec_acc, Nevec_acc*sites*12*sizeof(CUDA_ Glog << fname + " CONVERGED ; Summary :\n"; // Sort convered eigenpairs. std::vector Btmp(Nstop,grid); // waste of space replicating -#if 0 - for(int i=0; i0) { - for (int u=0; u0) { - // orthogonalize_blockhead(w[0],evec,b,Nu); - // for (int u=1; uGlobalSumVector((double*)evec_tmp,2*NN*NN); } } - // Safer to sort instead of just reversing it, - // but the document of the routine says evals are sorted in increasing order. - // qr gives evals in decreasing order. -// for(int i=0;i +Author: Yong-Chull Jang +Author: Chulwoo Jung This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by