1
0
mirror of https://github.com/paboyle/Grid.git synced 2024-11-15 10:15:36 +00:00
Grid/lib/allocator/AlignedAllocator.h

240 lines
7.4 KiB
C
Raw Normal View History

/*************************************************************************************
Grid physics library, www.github.com/paboyle/Grid
Source file: ./lib/AlignedAllocator.h
Copyright (C) 2015
Author: Azusa Yamaguchi <ayamaguc@staffmail.ed.ac.uk>
Author: Peter Boyle <paboyle@ph.ed.ac.uk>
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License along
with this program; if not, write to the Free Software Foundation, Inc.,
51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
See the full license in the file "LICENSE" in the top level distribution directory
2018-01-13 00:19:19 +00:00
*************************************************************************************/
/* END LEGAL */
2015-03-04 05:31:44 +00:00
#ifndef GRID_ALIGNED_ALLOCATOR_H
#define GRID_ALIGNED_ALLOCATOR_H
#ifdef HAVE_MALLOC_MALLOC_H
#include <malloc/malloc.h>
#endif
#ifdef HAVE_MALLOC_H
#include <malloc.h>
#endif
2015-05-15 11:32:11 +01:00
#ifdef HAVE_MM_MALLOC_H
#include <mm_malloc.h>
#endif
2018-03-18 14:44:46 +00:00
// When defined, the PointerCache class is declared and alignedAllocator routes
// allocate()/deallocate() through PointerCache::Lookup()/Insert().
#define POINTER_CACHE
// Alignment in bytes (2*1024*1024 = 2 MiB) passed to _mm_malloc/memalign by
// alignedAllocator::allocate().
#define GRID_ALLOC_ALIGN (2*1024*1024)
2018-01-13 00:19:19 +00:00
NAMESPACE_BEGIN(Grid);
2015-03-04 05:31:44 +00:00
// Move control to configure.ac and Config.h?
#ifdef POINTER_CACHE
2018-01-13 00:19:19 +00:00
// Static-only table of up to Ncache (pointer, size) entries.
//  - alignedAllocator::deallocate() passes each pointer to Insert() and frees
//    whatever pointer Insert() returns, if it is non-null.
//  - alignedAllocator::allocate() calls Lookup() first and only allocates fresh
//    memory when Lookup() returns null.
// Insert(), Lookup() and the static data members are defined outside this header.
class PointerCache {
public:

  static void *Insert(void *ptr,size_t bytes) ;
  static void *Lookup(size_t bytes) ;

private:

  // One slot of the table.
  struct PointerCacheEntry {
    void  *address;
    size_t bytes;
    int    valid;
  };

  static const int Ncache=8;
  static int victim;

  static PointerCacheEntry Entries[Ncache];
};
#endif
2018-01-13 00:19:19 +00:00
// Returns a string for a byte count; the definition is not in this header.
// The memString macro uses it for the parenthesised part of its output.
std::string sizeString(size_t bytes);
2018-01-13 00:19:19 +00:00
// Byte counters maintained by the profilerAllocate / profilerFree macros while
// MemoryProfiler::stats points at an instance. All counters start at zero.
struct MemoryStats
{
  size_t totalAllocated{0};      // running sum of bytes given to profilerAllocate
  size_t maxAllocated{0};        // largest value currentlyAllocated has reached
  size_t currentlyAllocated{0};  // bytes allocated minus bytes freed
  size_t totalFreed{0};          // running sum of bytes given to profilerFree
};
2017-09-22 14:21:18 +01:00
2018-01-13 00:19:19 +00:00
// Global switches read by the profilerAllocate / profilerFree /
// profilerDebugPrint macros. Both members are only declared here.
class MemoryProfiler
{
public:
// When non-null, the profiler macros update (and print) the counters it points to.
static MemoryStats *stats;
// When true, profilerAllocate/profilerFree print a message and the current stats.
static bool debug;
};
2017-12-06 15:50:25 +00:00
2018-01-13 00:19:19 +00:00
// Expands to a std::string of the form "<bytes> (<sizeString(bytes)>)".
// The expansion is parenthesised so it stays a single operand whatever
// expression it is pasted into (e.g. memString(n).size()).
// Note: the argument is evaluated twice, so it must not have side effects.
#define memString(bytes) (std::to_string(bytes) + " (" + sizeString(bytes) + ")")
// Prints the MemoryProfiler::stats pointer and its four counters to std::cout
// under GridLogDebug. Does nothing when MemoryProfiler::stats is null.
// Wrapped in do { } while (0) so that `profilerDebugPrint;` is exactly one
// statement: it is safe under an unbraced if/else and cannot capture a
// following `else`. Use it with a trailing semicolon.
#define profilerDebugPrint \
  do { \
    if (MemoryProfiler::stats) \
    { \
      auto s = MemoryProfiler::stats; \
      std::cout << GridLogDebug << "[Memory debug] Stats " << MemoryProfiler::stats << std::endl; \
      std::cout << GridLogDebug << "[Memory debug] total : " << memString(s->totalAllocated) \
                << std::endl; \
      std::cout << GridLogDebug << "[Memory debug] max : " << memString(s->maxAllocated) \
                << std::endl; \
      std::cout << GridLogDebug << "[Memory debug] current: " << memString(s->currentlyAllocated) \
                << std::endl; \
      std::cout << GridLogDebug << "[Memory debug] freed : " << memString(s->totalFreed) \
                << std::endl; \
    } \
  } while (0)
2017-12-06 15:50:25 +00:00
2018-01-13 00:19:19 +00:00
// Records an allocation of `bytes` bytes.
//  - If MemoryProfiler::stats is non-null: adds `bytes` to totalAllocated and
//    currentlyAllocated, and raises maxAllocated to the new current value if needed.
//  - If MemoryProfiler::debug is true: logs the allocation and prints the stats.
// Wrapped in do { } while (0) so both checks form ONE statement; previously the
// second `if` escaped any unbraced if/for guarding the macro call.
// Use with a trailing semicolon. `bytes` is evaluated more than once.
#define profilerAllocate(bytes) \
  do { \
    if (MemoryProfiler::stats) \
    { \
      auto s = MemoryProfiler::stats; \
      s->totalAllocated += (bytes); \
      s->currentlyAllocated += (bytes); \
      s->maxAllocated = std::max(s->maxAllocated, s->currentlyAllocated); \
    } \
    if (MemoryProfiler::debug) \
    { \
      std::cout << GridLogDebug << "[Memory debug] allocating " << memString(bytes) << std::endl; \
      profilerDebugPrint; \
    } \
  } while (0)
2017-12-06 15:50:25 +00:00
2018-01-13 00:19:19 +00:00
// Records a release of `bytes` bytes.
//  - If MemoryProfiler::stats is non-null: adds `bytes` to totalFreed and
//    subtracts it from currentlyAllocated.
//  - If MemoryProfiler::debug is true: logs the release and prints the stats.
// Wrapped in do { } while (0) so both checks form ONE statement; previously the
// second `if` escaped any unbraced if/for guarding the macro call.
// Use with a trailing semicolon. `bytes` is evaluated more than once.
#define profilerFree(bytes) \
  do { \
    if (MemoryProfiler::stats) \
    { \
      auto s = MemoryProfiler::stats; \
      s->totalFreed += (bytes); \
      s->currentlyAllocated -= (bytes); \
    } \
    if (MemoryProfiler::debug) \
    { \
      std::cout << GridLogDebug << "[Memory debug] freeing " << memString(bytes) << std::endl; \
      profilerDebugPrint; \
    } \
  } while (0)
// Declared here, defined elsewhere; takes a buffer pointer and a byte count.
// NOTE(review): presumably checks whether the buffer is backed by huge pages —
// confirm against the definition. Not called anywhere in this header.
void check_huge_pages(void *Buf,uint64_t BYTES);
2015-03-04 05:31:44 +00:00
////////////////////////////////////////////////////////////////////
// A lattice of something, but assume the something is SIMDized.
////////////////////////////////////////////////////////////////////
2015-03-04 05:31:44 +00:00
template<typename _Tp>
class alignedAllocator {
public:
typedef std::size_t size_type;
typedef std::ptrdiff_t difference_type;
typedef _Tp* pointer;
typedef const _Tp* const_pointer;
typedef _Tp& reference;
typedef const _Tp& const_reference;
typedef _Tp value_type;
template<typename _Tp1> struct rebind { typedef alignedAllocator<_Tp1> other; };
alignedAllocator() throw() { }
alignedAllocator(const alignedAllocator&) throw() { }
template<typename _Tp1> alignedAllocator(const alignedAllocator<_Tp1>&) throw() { }
~alignedAllocator() throw() { }
pointer address(reference __x) const { return &__x; }
2015-03-04 05:31:44 +00:00
size_type max_size() const throw() { return size_t(-1) / sizeof(_Tp); }
pointer allocate(size_type __n, const void* _p= 0)
2015-03-04 05:31:44 +00:00
{
size_type bytes = __n*sizeof(_Tp);
2017-12-06 15:50:25 +00:00
profilerAllocate(bytes);
2017-09-22 14:21:18 +01:00
#ifdef POINTER_CACHE
_Tp *ptr = (_Tp *) PointerCache::Lookup(bytes);
#else
pointer ptr = nullptr;
#endif
2017-08-25 09:25:54 +01:00
2018-03-18 14:44:46 +00:00
#ifdef GRID_NVCC
2018-03-20 10:33:59 +00:00
////////////////////////////////////
// Unified (managed) memory
////////////////////////////////////
2018-03-18 14:44:46 +00:00
if ( ptr == (_Tp *) NULL ) {
if( cudaMallocManaged((void **)&ptr,bytes) != cudaSuccess ) {
ptr = (_Tp *) NULL;
assert(0);
}
}
#else
2018-03-20 10:33:59 +00:00
//////////////////////////////////////////////////////////////////////////////////////////
// 2MB align; could make option probably doesn't need configurability
//////////////////////////////////////////////////////////////////////////////////////////
2018-03-18 14:44:46 +00:00
#ifdef HAVE_MM_MALLOC_H
2017-07-29 18:06:53 +01:00
if ( ptr == (_Tp *) NULL ) ptr = (_Tp *) _mm_malloc(bytes,GRID_ALLOC_ALIGN);
2018-03-18 14:44:46 +00:00
#else
2017-07-29 18:06:53 +01:00
if ( ptr == (_Tp *) NULL ) ptr = (_Tp *) memalign(GRID_ALLOC_ALIGN,bytes);
2018-03-18 14:44:46 +00:00
#endif
#endif
2018-03-18 14:44:46 +00:00
assert( ptr != (_Tp *)NULL);
2018-03-20 10:33:59 +00:00
2018-03-18 14:44:46 +00:00
/////////////////////////////////////////
// First touch optimise in threaded loop
2018-03-18 14:44:46 +00:00
/////////////////////////////////////////
uint8_t *cp = (uint8_t *)ptr;
2018-01-24 13:49:39 +00:00
thread_loop( (size_type n=0;n<bytes;n+=4096) , {
cp[n]=0;
2018-01-24 13:49:39 +00:00
});
return ptr;
}
void deallocate(pointer __p, size_type __n) {
size_type bytes = __n * sizeof(_Tp);
2017-08-25 09:25:54 +01:00
2017-12-06 15:50:25 +00:00
profilerFree(bytes);
2017-09-22 14:21:18 +01:00
#ifdef POINTER_CACHE
pointer __freeme = (pointer)PointerCache::Insert((void *)__p,bytes);
#else
pointer __freeme = __p;
#endif
2018-03-18 14:44:46 +00:00
#ifdef GRID_NVCC
if ( __freeme ) cudaFree((void *)__freeme);
#else
#ifdef HAVE_MM_MALLOC_H
if ( __freeme ) _mm_free((void *)__freeme);
2018-03-18 14:44:46 +00:00
#else
if ( __freeme ) free((void *)__freeme);
2018-03-18 14:44:46 +00:00
#endif
#endif
2018-03-18 14:44:46 +00:00
}
void construct(pointer __p, const _Tp& __val) { };
void construct(pointer __p) { };
void destroy(pointer __p) { };
};
// alignedAllocator has no data members, so any two instances compare equal,
// including instances rebound to different value types. Two template
// parameters make the rebound comparison compile.
template<typename _Tp, typename _Tp1> inline bool operator==(const alignedAllocator<_Tp>&, const alignedAllocator<_Tp1>&) noexcept { return true; }
// alignedAllocator has no data members, so two instances are never unequal,
// including instances rebound to different value types. Two template
// parameters make the rebound comparison compile.
template<typename _Tp, typename _Tp1> inline bool operator!=(const alignedAllocator<_Tp>&, const alignedAllocator<_Tp1>&) noexcept { return false; }
////////////////////////////////////////////////////////////////////////////////
// Template typedefs
////////////////////////////////////////////////////////////////////////////////
// commAllocator<T> is an alias for alignedAllocator<T> (same type).
template<class T> using commAllocator = alignedAllocator<T>;
2016-10-20 17:09:40 +01:00
// Vector<T> and commVector<T> both name std::vector<T> with alignedAllocator<T>
// as the allocator, so they are the same type.
template<class T> using Vector = std::vector<T,alignedAllocator<T> >;
template<class T> using commVector = std::vector<T,alignedAllocator<T> >;
2016-10-20 17:09:40 +01:00
// Matrix<T>: a std::vector of aligned rows. Only the inner vectors use
// alignedAllocator; the outer vector uses the default std::allocator.
template<class T> using Matrix = std::vector<std::vector<T,alignedAllocator<T> > >;
2018-01-13 00:19:19 +00:00
NAMESPACE_END(Grid);
2015-03-04 05:31:44 +00:00
#endif