From 9e48b7dfdafdf19d63a1f8ce8d140f21b3ffbb31 Mon Sep 17 00:00:00 2001 From: Chulwoo Jung Date: Thu, 6 Apr 2017 22:21:56 -0400 Subject: [PATCH] MEM_SAVE in Lanczos seems to be working, but not pretty --- .../iterative/ImplicitlyRestartedLanczos.h | 130 ++++++++++++++++-- 1 file changed, 118 insertions(+), 12 deletions(-) diff --git a/lib/algorithms/iterative/ImplicitlyRestartedLanczos.h b/lib/algorithms/iterative/ImplicitlyRestartedLanczos.h index aa4dfd19..2ca8d765 100644 --- a/lib/algorithms/iterative/ImplicitlyRestartedLanczos.h +++ b/lib/algorithms/iterative/ImplicitlyRestartedLanczos.h @@ -494,6 +494,10 @@ repeat →AVK =VKHK +fKe†K † Extend to an M = K + P step factorization AVM = VMHM + fMeM until convergence */ + +// alternate implementation for minimizing memory usage. May affect the performance +#define MEM_SAVE +#undef MEM_SAVE2 void calc(DenseVector& eval, DenseVector& evec, const Field& src, @@ -516,11 +520,13 @@ until convergence DenseVector Qt(Nm*Nm); DenseVector Iconv(Nm); +#if (!defined MEM_SAVE ) || (!defined MEM_SAVE2) DenseVector B(Nm,grid); // waste of space replicating -// DenseVector Btemp(Nm,grid); // waste of space replicating +#endif Field f(grid); Field v(grid); +// auto B2 = evec[0]._odata[0]; int k1 = 1; int k2 = Nk; @@ -603,6 +609,9 @@ until convergence } t1=usecond()/1e6; std::cout<oSites();ss++){ - for(int jj=k1-1; jj0); +// DenseVector < decltype(B2) > B(Nm); +// std::vector < decltype( B2 ) > B(Nm*thr,B2); + Field B(grid); +PARALLEL_FOR_LOOP + for(int ss=0;ss < grid->oSites();ss++){ + int thr=GridThread::GetThreads(); + int me = GridThread::ThreadBarrier(); + printf("thr=%d ss=%d me=%d\n",thr,ss,me);fflush(stdout); + for(int j=0; joSites();ss++){ + auto B2 = evec[0]._odata[0]; + std::vector < decltype( B2 ) > B(Nm,B2); + for(int j=0; j