2018-01-02 18:12:05 +01:00
|
|
|
// Copyright (c) 2016-2017 The Bitcoin Core developers
|
2016-09-18 09:55:14 +02:00
|
|
|
// Distributed under the MIT software license, see the accompanying
|
|
|
|
// file COPYING or http://www.opensource.org/licenses/mit-license.php.
|
|
|
|
|
2017-11-10 01:57:53 +01:00
|
|
|
#include <support/lockedpool.h>
|
|
|
|
#include <support/cleanse.h>
|
2016-09-18 09:55:14 +02:00
|
|
|
|
|
|
|
#if defined(HAVE_CONFIG_H)
|
2017-11-10 01:57:53 +01:00
|
|
|
#include <config/bitcoin-config.h>
|
2016-09-18 09:55:14 +02:00
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifdef WIN32
|
|
|
|
#ifdef _WIN32_WINNT
|
|
|
|
#undef _WIN32_WINNT
|
|
|
|
#endif
|
|
|
|
#define _WIN32_WINNT 0x0501
|
|
|
|
#define WIN32_LEAN_AND_MEAN 1
|
|
|
|
#ifndef NOMINMAX
|
|
|
|
#define NOMINMAX
|
|
|
|
#endif
|
|
|
|
#include <windows.h>
|
|
|
|
#else
|
|
|
|
#include <sys/mman.h> // for mmap
|
|
|
|
#include <sys/resource.h> // for getrlimit
|
|
|
|
#include <limits.h> // for PAGESIZE
|
|
|
|
#include <unistd.h> // for sysconf
|
|
|
|
#endif
|
|
|
|
|
2016-11-02 22:09:03 +01:00
|
|
|
#include <algorithm>
|
|
|
|
|
2017-08-07 07:36:37 +02:00
|
|
|
// Pointer to the process-wide pool manager; null until CreateInstance() assigns it.
LockedPoolManager* LockedPoolManager::_instance = nullptr;
|
2016-09-18 09:55:14 +02:00
|
|
|
// NOTE(review): presumably passed to std::call_once so that CreateInstance() runs only once;
// the call site is not in this file -- confirm against the header.
std::once_flag LockedPoolManager::init_flag;
|
|
|
|
|
|
|
|
/*******************************************************************************/
|
|
|
|
// Utilities
|
|
|
|
//
|
|
|
|
/**
 * Round x up to the next multiple of align.
 * The bit-mask trick below only works when align is a power of 2.
 */
static inline size_t align_up(size_t x, size_t align)
{
    const size_t mask = align - 1;
    return (x + mask) & ~mask;
}
|
|
|
|
|
|
|
|
/*******************************************************************************/
|
|
|
|
// Implementation: Arena
|
|
|
|
|
|
|
|
/**
 * Construct an arena over the caller-supplied range [base_in, base_in + size_in).
 *
 * @param base_in       start of the memory range managed by this arena
 * @param size_in       length of the range in bytes
 * @param alignment_in  granularity to which alloc() rounds request sizes
 */
Arena::Arena(void *base_in, size_t size_in, size_t alignment_in)
    : base(static_cast<char*>(base_in)),
      end(static_cast<char*>(base_in) + size_in),
      alignment(alignment_in)
{
    // The whole range begins as one free chunk. It is registered in all three
    // free-chunk indexes: by size, by start address and by end address.
    const auto whole = size_to_free_chunk.emplace(size_in, base);
    chunks_free.emplace(base, whole);
    chunks_free_end.emplace(base + size_in, whole);
}
|
|
|
|
|
|
|
|
// Nothing to release explicitly: the destructor body is empty.
Arena::~Arena() = default;
|
|
|
|
|
|
|
|
void* Arena::alloc(size_t size)
|
|
|
|
{
|
|
|
|
// Round to next multiple of alignment
|
|
|
|
size = align_up(size, alignment);
|
|
|
|
|
2016-11-02 22:09:03 +01:00
|
|
|
// Don't handle zero-sized chunks
|
|
|
|
if (size == 0)
|
2016-09-18 09:55:14 +02:00
|
|
|
return nullptr;
|
|
|
|
|
Use best-fit strategy in Arena, now O(log(n)) instead O(n)
This replaces the first-fit algorithm used in the Arena with a best-fit. According to "Dynamic Storage Allocation: A Survey and Critical Review", Wilson et. al. 1995, http://www.scs.stanford.edu/14wi-cs140/sched/readings/wilson.pdf, both startegies work well in practice.
The advantage of using best-fit is that we can switch the slow O(n) algorithm to O(log(n)) operations. Additionally, some previously O(log(n)) operations are now replaced with O(1) operations by using a hash map. The end effect is that the benchmark runs about 2.5 times faster on my machine:
old: BenchLockedPool, 5, 530, 5.25749, 0.00196938, 0.00199755, 0.00198172
new: BenchLockedPool, 5, 1300, 5.11313, 0.000781493, 0.000793314, 0.00078606
I've run all unit tests and benchmarks.
2017-12-29 11:36:11 +01:00
|
|
|
// Pick a large enough free-chunk. Returns an iterator pointing to the first element that is not less than key.
|
|
|
|
// This allocation strategy is best-fit. According to "Dynamic Storage Allocation: A Survey and Critical Review",
|
|
|
|
// Wilson et. al. 1995, http://www.scs.stanford.edu/14wi-cs140/sched/readings/wilson.pdf, best-fit and first-fit
|
|
|
|
// policies seem to work well in practice.
|
2018-01-06 09:13:41 +01:00
|
|
|
auto size_ptr_it = size_to_free_chunk.lower_bound(size);
|
|
|
|
if (size_ptr_it == size_to_free_chunk.end())
|
2016-11-02 22:09:03 +01:00
|
|
|
return nullptr;
|
|
|
|
|
|
|
|
// Create the used-chunk, taking its space from the end of the free-chunk
|
2018-01-06 09:13:41 +01:00
|
|
|
const size_t size_remaining = size_ptr_it->first - size;
|
|
|
|
auto alloced = chunks_used.emplace(size_ptr_it->second + size_remaining, size).first;
|
|
|
|
chunks_free_end.erase(size_ptr_it->second + size_ptr_it->first);
|
|
|
|
if (size_ptr_it->first == size) {
|
Use best-fit strategy in Arena, now O(log(n)) instead O(n)
This replaces the first-fit algorithm used in the Arena with a best-fit. According to "Dynamic Storage Allocation: A Survey and Critical Review", Wilson et. al. 1995, http://www.scs.stanford.edu/14wi-cs140/sched/readings/wilson.pdf, both startegies work well in practice.
The advantage of using best-fit is that we can switch the slow O(n) algorithm to O(log(n)) operations. Additionally, some previously O(log(n)) operations are now replaced with O(1) operations by using a hash map. The end effect is that the benchmark runs about 2.5 times faster on my machine:
old: BenchLockedPool, 5, 530, 5.25749, 0.00196938, 0.00199755, 0.00198172
new: BenchLockedPool, 5, 1300, 5.11313, 0.000781493, 0.000793314, 0.00078606
I've run all unit tests and benchmarks.
2017-12-29 11:36:11 +01:00
|
|
|
// whole chunk is used up
|
2018-01-06 09:13:41 +01:00
|
|
|
chunks_free.erase(size_ptr_it->second);
|
Use best-fit strategy in Arena, now O(log(n)) instead O(n)
This replaces the first-fit algorithm used in the Arena with a best-fit. According to "Dynamic Storage Allocation: A Survey and Critical Review", Wilson et. al. 1995, http://www.scs.stanford.edu/14wi-cs140/sched/readings/wilson.pdf, both startegies work well in practice.
The advantage of using best-fit is that we can switch the slow O(n) algorithm to O(log(n)) operations. Additionally, some previously O(log(n)) operations are now replaced with O(1) operations by using a hash map. The end effect is that the benchmark runs about 2.5 times faster on my machine:
old: BenchLockedPool, 5, 530, 5.25749, 0.00196938, 0.00199755, 0.00198172
new: BenchLockedPool, 5, 1300, 5.11313, 0.000781493, 0.000793314, 0.00078606
I've run all unit tests and benchmarks.
2017-12-29 11:36:11 +01:00
|
|
|
} else {
|
|
|
|
// still some memory left in the chunk
|
2018-01-06 09:13:41 +01:00
|
|
|
auto it_remaining = size_to_free_chunk.emplace(size_remaining, size_ptr_it->second);
|
|
|
|
chunks_free[size_ptr_it->second] = it_remaining;
|
|
|
|
chunks_free_end.emplace(size_ptr_it->second + size_remaining, it_remaining);
|
2016-09-18 09:55:14 +02:00
|
|
|
}
|
2018-01-06 09:13:41 +01:00
|
|
|
size_to_free_chunk.erase(size_ptr_it);
|
Use best-fit strategy in Arena, now O(log(n)) instead O(n)
This replaces the first-fit algorithm used in the Arena with a best-fit. According to "Dynamic Storage Allocation: A Survey and Critical Review", Wilson et. al. 1995, http://www.scs.stanford.edu/14wi-cs140/sched/readings/wilson.pdf, both startegies work well in practice.
The advantage of using best-fit is that we can switch the slow O(n) algorithm to O(log(n)) operations. Additionally, some previously O(log(n)) operations are now replaced with O(1) operations by using a hash map. The end effect is that the benchmark runs about 2.5 times faster on my machine:
old: BenchLockedPool, 5, 530, 5.25749, 0.00196938, 0.00199755, 0.00198172
new: BenchLockedPool, 5, 1300, 5.11313, 0.000781493, 0.000793314, 0.00078606
I've run all unit tests and benchmarks.
2017-12-29 11:36:11 +01:00
|
|
|
|
|
|
|
return reinterpret_cast<void*>(alloced->first);
|
2016-09-18 09:55:14 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
void Arena::free(void *ptr)
|
|
|
|
{
|
2017-08-07 07:36:37 +02:00
|
|
|
// Freeing the nullptr pointer is OK.
|
2016-09-18 09:55:14 +02:00
|
|
|
if (ptr == nullptr) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-11-02 22:09:03 +01:00
|
|
|
// Remove chunk from used map
|
|
|
|
auto i = chunks_used.find(static_cast<char*>(ptr));
|
|
|
|
if (i == chunks_used.end()) {
|
|
|
|
throw std::runtime_error("Arena: invalid or double free");
|
2016-09-18 09:55:14 +02:00
|
|
|
}
|
Use best-fit strategy in Arena, now O(log(n)) instead O(n)
This replaces the first-fit algorithm used in the Arena with a best-fit. According to "Dynamic Storage Allocation: A Survey and Critical Review", Wilson et. al. 1995, http://www.scs.stanford.edu/14wi-cs140/sched/readings/wilson.pdf, both startegies work well in practice.
The advantage of using best-fit is that we can switch the slow O(n) algorithm to O(log(n)) operations. Additionally, some previously O(log(n)) operations are now replaced with O(1) operations by using a hash map. The end effect is that the benchmark runs about 2.5 times faster on my machine:
old: BenchLockedPool, 5, 530, 5.25749, 0.00196938, 0.00199755, 0.00198172
new: BenchLockedPool, 5, 1300, 5.11313, 0.000781493, 0.000793314, 0.00078606
I've run all unit tests and benchmarks.
2017-12-29 11:36:11 +01:00
|
|
|
std::pair<char*, size_t> freed = *i;
|
2016-11-02 22:09:03 +01:00
|
|
|
chunks_used.erase(i);
|
|
|
|
|
2018-01-06 09:13:41 +01:00
|
|
|
// coalesce freed with previous chunk
|
Use best-fit strategy in Arena, now O(log(n)) instead O(n)
This replaces the first-fit algorithm used in the Arena with a best-fit. According to "Dynamic Storage Allocation: A Survey and Critical Review", Wilson et. al. 1995, http://www.scs.stanford.edu/14wi-cs140/sched/readings/wilson.pdf, both startegies work well in practice.
The advantage of using best-fit is that we can switch the slow O(n) algorithm to O(log(n)) operations. Additionally, some previously O(log(n)) operations are now replaced with O(1) operations by using a hash map. The end effect is that the benchmark runs about 2.5 times faster on my machine:
old: BenchLockedPool, 5, 530, 5.25749, 0.00196938, 0.00199755, 0.00198172
new: BenchLockedPool, 5, 1300, 5.11313, 0.000781493, 0.000793314, 0.00078606
I've run all unit tests and benchmarks.
2017-12-29 11:36:11 +01:00
|
|
|
auto prev = chunks_free_end.find(freed.first);
|
|
|
|
if (prev != chunks_free_end.end()) {
|
|
|
|
freed.first -= prev->second->first;
|
|
|
|
freed.second += prev->second->first;
|
|
|
|
size_to_free_chunk.erase(prev->second);
|
|
|
|
chunks_free_end.erase(prev);
|
|
|
|
}
|
|
|
|
|
2018-01-06 09:13:41 +01:00
|
|
|
// coalesce freed with chunk after freed
|
Use best-fit strategy in Arena, now O(log(n)) instead O(n)
This replaces the first-fit algorithm used in the Arena with a best-fit. According to "Dynamic Storage Allocation: A Survey and Critical Review", Wilson et. al. 1995, http://www.scs.stanford.edu/14wi-cs140/sched/readings/wilson.pdf, both startegies work well in practice.
The advantage of using best-fit is that we can switch the slow O(n) algorithm to O(log(n)) operations. Additionally, some previously O(log(n)) operations are now replaced with O(1) operations by using a hash map. The end effect is that the benchmark runs about 2.5 times faster on my machine:
old: BenchLockedPool, 5, 530, 5.25749, 0.00196938, 0.00199755, 0.00198172
new: BenchLockedPool, 5, 1300, 5.11313, 0.000781493, 0.000793314, 0.00078606
I've run all unit tests and benchmarks.
2017-12-29 11:36:11 +01:00
|
|
|
auto next = chunks_free.find(freed.first + freed.second);
|
|
|
|
if (next != chunks_free.end()) {
|
|
|
|
freed.second += next->second->first;
|
|
|
|
size_to_free_chunk.erase(next->second);
|
2016-11-02 22:09:03 +01:00
|
|
|
chunks_free.erase(next);
|
Use best-fit strategy in Arena, now O(log(n)) instead O(n)
This replaces the first-fit algorithm used in the Arena with a best-fit. According to "Dynamic Storage Allocation: A Survey and Critical Review", Wilson et. al. 1995, http://www.scs.stanford.edu/14wi-cs140/sched/readings/wilson.pdf, both startegies work well in practice.
The advantage of using best-fit is that we can switch the slow O(n) algorithm to O(log(n)) operations. Additionally, some previously O(log(n)) operations are now replaced with O(1) operations by using a hash map. The end effect is that the benchmark runs about 2.5 times faster on my machine:
old: BenchLockedPool, 5, 530, 5.25749, 0.00196938, 0.00199755, 0.00198172
new: BenchLockedPool, 5, 1300, 5.11313, 0.000781493, 0.000793314, 0.00078606
I've run all unit tests and benchmarks.
2017-12-29 11:36:11 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// Add/set space with coalesced free chunk
|
|
|
|
auto it = size_to_free_chunk.emplace(freed.second, freed.first);
|
|
|
|
chunks_free[freed.first] = it;
|
|
|
|
chunks_free_end[freed.first + freed.second] = it;
|
2016-09-18 09:55:14 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
 * Summarize arena usage.
 *
 * @return byte totals for used and free chunks, their sum, and the number of
 *         used and free chunks.
 */
Arena::Stats Arena::stats() const
{
    Arena::Stats summary{ 0, 0, 0, chunks_used.size(), chunks_free.size() };

    // Used chunks store their size directly as the mapped value.
    for (auto it = chunks_used.begin(); it != chunks_used.end(); ++it) {
        summary.used += it->second;
    }
    // Free chunks map to an iterator into the size index; the size is that entry's key.
    for (auto it = chunks_free.begin(); it != chunks_free.end(); ++it) {
        summary.free += it->second->first;
    }

    summary.total = summary.used + summary.free;
    return summary;
}
|
|
|
|
|
|
|
|
#ifdef ARENA_DEBUG
|
2018-05-02 17:14:48 +02:00
|
|
|
/**
 * Debug helper: print one chunk as "<address> <size> <used flag>" on std::cout.
 *
 * @param base  start address of the chunk
 * @param sz    chunk size in bytes (printed as 16 zero-padded hex digits)
 * @param used  whether the chunk is currently allocated
 */
static void printchunk(char* base, size_t sz, bool used) {
    // Cast to const void* before streaming: operator<< on a char* prints the
    // bytes it points at as a C string (reading until a NUL) instead of the
    // address. The textual form of a streamed pointer is implementation-defined.
    std::cout <<
        "0x" << std::hex << std::setw(16) << std::setfill('0') << static_cast<const void*>(base) <<
        " 0x" << std::hex << std::setw(16) << std::setfill('0') << sz <<
        " 0x" << used << std::endl;
}
|
2016-09-18 09:55:14 +02:00
|
|
|
void Arena::walk() const
|
|
|
|
{
|
2016-11-02 22:09:03 +01:00
|
|
|
for (const auto& chunk: chunks_used)
|
|
|
|
printchunk(chunk.first, chunk.second, true);
|
|
|
|
std::cout << std::endl;
|
|
|
|
for (const auto& chunk: chunks_free)
|
|
|
|
printchunk(chunk.first, chunk.second, false);
|
2016-09-18 09:55:14 +02:00
|
|
|
std::cout << std::endl;
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/*******************************************************************************/
|
|
|
|
// Implementation: Win32LockedPageAllocator
|
|
|
|
|
|
|
|
#ifdef WIN32
|
|
|
|
/** LockedPageAllocator specialized for Windows.
|
|
|
|
*/
|
|
|
|
class Win32LockedPageAllocator: public LockedPageAllocator
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
Win32LockedPageAllocator();
|
2017-06-20 21:58:56 +02:00
|
|
|
void* AllocateLocked(size_t len, bool *lockingSuccess) override;
|
|
|
|
void FreeLocked(void* addr, size_t len) override;
|
|
|
|
size_t GetLimit() override;
|
2016-09-18 09:55:14 +02:00
|
|
|
private:
|
|
|
|
size_t page_size;
|
|
|
|
};
|
|
|
|
|
|
|
|
/** Query the system page size (in bytes) and remember it for length rounding. */
Win32LockedPageAllocator::Win32LockedPageAllocator()
{
    SYSTEM_INFO system_info;
    GetSystemInfo(&system_info);
    page_size = system_info.dwPageSize;
}
|
|
|
|
void *Win32LockedPageAllocator::AllocateLocked(size_t len, bool *lockingSuccess)
|
|
|
|
{
|
|
|
|
len = align_up(len, page_size);
|
|
|
|
void *addr = VirtualAlloc(nullptr, len, MEM_COMMIT | MEM_RESERVE, PAGE_READWRITE);
|
|
|
|
if (addr) {
|
|
|
|
// VirtualLock is used to attempt to keep keying material out of swap. Note
|
|
|
|
// that it does not provide this as a guarantee, but, in practice, memory
|
|
|
|
// that has been VirtualLock'd almost never gets written to the pagefile
|
|
|
|
// except in rare circumstances where memory is extremely low.
|
|
|
|
*lockingSuccess = VirtualLock(const_cast<void*>(addr), len) != 0;
|
|
|
|
}
|
|
|
|
return addr;
|
|
|
|
}
|
|
|
|
void Win32LockedPageAllocator::FreeLocked(void* addr, size_t len)
|
|
|
|
{
|
|
|
|
len = align_up(len, page_size);
|
|
|
|
memory_cleanse(addr, len);
|
|
|
|
VirtualUnlock(const_cast<void*>(addr), len);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
 * Report how many bytes this process may lock.
 * No limit is queried on Windows, so "unlimited" (the largest size_t) is returned.
 */
size_t Win32LockedPageAllocator::GetLimit()
{
    // TODO is there a limit on Windows, how to get it?
    const size_t unlimited = std::numeric_limits<size_t>::max();
    return unlimited;
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/*******************************************************************************/
|
|
|
|
// Implementation: PosixLockedPageAllocator
|
|
|
|
|
|
|
|
#ifndef WIN32
|
|
|
|
/** LockedPageAllocator specialized for OSes that don't try to be
|
|
|
|
* special snowflakes.
|
|
|
|
*/
|
|
|
|
class PosixLockedPageAllocator: public LockedPageAllocator
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
PosixLockedPageAllocator();
|
2017-06-20 21:58:56 +02:00
|
|
|
void* AllocateLocked(size_t len, bool *lockingSuccess) override;
|
|
|
|
void FreeLocked(void* addr, size_t len) override;
|
|
|
|
size_t GetLimit() override;
|
2016-09-18 09:55:14 +02:00
|
|
|
private:
|
|
|
|
size_t page_size;
|
|
|
|
};
|
|
|
|
|
|
|
|
/** Determine the system page size (in bytes) and remember it for length rounding. */
PosixLockedPageAllocator::PosixLockedPageAllocator()
{
#ifdef PAGESIZE
    // Compile-time constant from limits.h, when the platform provides one.
    page_size = PAGESIZE;
#else
    // Otherwise ask at run time; assumes some POSIX OS.
    page_size = sysconf(_SC_PAGESIZE);
#endif
}
|
2016-11-02 14:18:19 +01:00
|
|
|
|
|
|
|
// Some systems (at least OS X) only provide the deprecated MAP_ANON spelling
// and do not define MAP_ANONYMOUS yet; alias it so the code below can use the
// standard name everywhere.
#if !defined(MAP_ANONYMOUS)
#define MAP_ANONYMOUS MAP_ANON
#endif
|
|
|
|
|
2016-09-18 09:55:14 +02:00
|
|
|
void *PosixLockedPageAllocator::AllocateLocked(size_t len, bool *lockingSuccess)
|
|
|
|
{
|
|
|
|
void *addr;
|
|
|
|
len = align_up(len, page_size);
|
|
|
|
addr = mmap(nullptr, len, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0);
|
|
|
|
if (addr) {
|
|
|
|
*lockingSuccess = mlock(addr, len) == 0;
|
|
|
|
}
|
|
|
|
return addr;
|
|
|
|
}
|
|
|
|
void PosixLockedPageAllocator::FreeLocked(void* addr, size_t len)
|
|
|
|
{
|
|
|
|
len = align_up(len, page_size);
|
|
|
|
memory_cleanse(addr, len);
|
|
|
|
munlock(addr, len);
|
|
|
|
munmap(addr, len);
|
|
|
|
}
|
|
|
|
/**
 * Report how many bytes this process may lock.
 *
 * @return the soft RLIMIT_MEMLOCK limit when it can be read and is finite;
 *         otherwise the largest size_t, meaning "no known limit".
 */
size_t PosixLockedPageAllocator::GetLimit()
{
#ifdef RLIMIT_MEMLOCK
    struct rlimit memlock;
    const bool have_limit = getrlimit(RLIMIT_MEMLOCK, &memlock) == 0;
    if (have_limit && memlock.rlim_cur != RLIM_INFINITY) {
        return memlock.rlim_cur;
    }
#endif
    return std::numeric_limits<size_t>::max();
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/*******************************************************************************/
|
|
|
|
// Implementation: LockedPool
|
|
|
|
|
|
|
|
/**
 * Create an empty pool.
 *
 * @param allocator_in  page allocator; ownership moves into the pool
 * @param lf_cb_in      callback consulted by new_arena() when locking fails
 */
LockedPool::LockedPool(std::unique_ptr<LockedPageAllocator> allocator_in, LockingFailed_Callback lf_cb_in)
    : allocator(std::move(allocator_in)),
      lf_cb(lf_cb_in),
      cumulative_bytes_locked(0)
{
}
|
|
|
|
|
|
|
|
// No explicit teardown: the destructor body is empty, so only the members'
// own destructors run.
LockedPool::~LockedPool() = default;
|
|
|
|
void* LockedPool::alloc(size_t size)
|
|
|
|
{
|
|
|
|
std::lock_guard<std::mutex> lock(mutex);
|
2016-11-02 22:11:07 +01:00
|
|
|
|
|
|
|
// Don't handle impossible sizes
|
|
|
|
if (size == 0 || size > ARENA_SIZE)
|
|
|
|
return nullptr;
|
|
|
|
|
2016-09-18 09:55:14 +02:00
|
|
|
// Try allocating from each current arena
|
|
|
|
for (auto &arena: arenas) {
|
|
|
|
void *addr = arena.alloc(size);
|
|
|
|
if (addr) {
|
|
|
|
return addr;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// If that fails, create a new one
|
|
|
|
if (new_arena(ARENA_SIZE, ARENA_ALIGN)) {
|
|
|
|
return arenas.back().alloc(size);
|
|
|
|
}
|
|
|
|
return nullptr;
|
|
|
|
}
|
|
|
|
|
|
|
|
void LockedPool::free(void *ptr)
|
|
|
|
{
|
|
|
|
std::lock_guard<std::mutex> lock(mutex);
|
|
|
|
// TODO we can do better than this linear search by keeping a map of arena
|
|
|
|
// extents to arena, and looking up the address.
|
|
|
|
for (auto &arena: arenas) {
|
|
|
|
if (arena.addressInArena(ptr)) {
|
|
|
|
arena.free(ptr);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
throw std::runtime_error("LockedPool: invalid address not pointing to any arena");
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
 * Aggregate usage statistics over all arenas. The pool mutex is held while
 * the arenas are walked.
 *
 * @return per-arena figures summed, plus the pool's cumulative locked-byte counter.
 */
LockedPool::Stats LockedPool::stats() const
{
    std::lock_guard<std::mutex> lock(mutex);

    LockedPool::Stats totals{0, 0, 0, cumulative_bytes_locked, 0, 0};
    for (auto it = arenas.begin(); it != arenas.end(); ++it) {
        const Arena::Stats one = it->stats();
        totals.used        += one.used;
        totals.free        += one.free;
        totals.total       += one.total;
        totals.chunks_used += one.chunks_used;
        totals.chunks_free += one.chunks_free;
    }
    return totals;
}
|
|
|
|
|
|
|
|
bool LockedPool::new_arena(size_t size, size_t align)
|
|
|
|
{
|
|
|
|
bool locked;
|
|
|
|
// If this is the first arena, handle this specially: Cap the upper size
|
|
|
|
// by the process limit. This makes sure that the first arena will at least
|
|
|
|
// be locked. An exception to this is if the process limit is 0:
|
|
|
|
// in this case no memory can be locked at all so we'll skip past this logic.
|
|
|
|
if (arenas.empty()) {
|
|
|
|
size_t limit = allocator->GetLimit();
|
|
|
|
if (limit > 0) {
|
|
|
|
size = std::min(size, limit);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
void *addr = allocator->AllocateLocked(size, &locked);
|
|
|
|
if (!addr) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
if (locked) {
|
|
|
|
cumulative_bytes_locked += size;
|
|
|
|
} else if (lf_cb) { // Call the locking-failed callback if locking failed
|
|
|
|
if (!lf_cb()) { // If the callback returns false, free the memory and fail, otherwise consider the user warned and proceed.
|
|
|
|
allocator->FreeLocked(addr, size);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
arenas.emplace_back(allocator.get(), addr, size, align);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
 * Arena that remembers the region it was built on, so the destructor can
 * return it to the allocator.
 *
 * @param allocator_in  allocator the region came from (stored as a raw pointer)
 * @param base_in       start of the region
 * @param size_in       size of the region in bytes
 * @param align_in      chunk alignment forwarded to Arena
 */
LockedPool::LockedPageArena::LockedPageArena(LockedPageAllocator *allocator_in, void *base_in, size_t size_in, size_t align_in)
    : Arena(base_in, size_in, align_in),
      base(base_in),
      size(size_in),
      allocator(allocator_in)
{
}
|
|
|
|
/** Hand the arena's backing region back to the allocator it was obtained from. */
LockedPool::LockedPageArena::~LockedPageArena()
{
    allocator->FreeLocked(base, size);
}
|
|
|
|
|
|
|
|
/*******************************************************************************/
|
|
|
|
// Implementation: LockedPoolManager
|
|
|
|
//
|
2016-11-10 08:00:05 +01:00
|
|
|
/**
 * Build the manager on top of LockedPool, installing LockingFailed as the
 * locking-failed callback.
 *
 * @param allocator_in  page allocator; ownership moves into the pool
 */
LockedPoolManager::LockedPoolManager(std::unique_ptr<LockedPageAllocator> allocator_in)
    : LockedPool(std::move(allocator_in), &LockedPoolManager::LockingFailed)
{
}
|
|
|
|
|
|
|
|
/**
 * Locking-failed callback installed by the constructor.
 *
 * @return always true, which tells LockedPool::new_arena() to keep using the
 *         memory even though it could not be locked.
 */
bool LockedPoolManager::LockingFailed()
{
    // TODO: log something but how? without including util.h
    const bool proceed_unlocked = true;
    return proceed_unlocked;
}
|
|
|
|
|
|
|
|
void LockedPoolManager::CreateInstance()
|
|
|
|
{
|
|
|
|
// Using a local static instance guarantees that the object is initialized
|
|
|
|
// when it's first needed and also deinitialized after all objects that use
|
|
|
|
// it are done with it. I can think of one unlikely scenario where we may
|
|
|
|
// have a static deinitialization order/problem, but the check in
|
|
|
|
// LockedPoolManagerBase's destructor helps us detect if that ever happens.
|
|
|
|
#ifdef WIN32
|
|
|
|
std::unique_ptr<LockedPageAllocator> allocator(new Win32LockedPageAllocator());
|
|
|
|
#else
|
|
|
|
std::unique_ptr<LockedPageAllocator> allocator(new PosixLockedPageAllocator());
|
|
|
|
#endif
|
|
|
|
static LockedPoolManager instance(std::move(allocator));
|
|
|
|
LockedPoolManager::_instance = &instance;
|
|
|
|
}
|