You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 

129 lines
4.4 KiB

#ifndef ALGOIM_SPARKSTACK_HPP
#define ALGOIM_SPARKSTACK_HPP
// algoim::SparkStack<T> implements a fast, thread-safe, stack-based allocator,
// similar in function to alloca() but with additional guarantees regarding
// portability, alignment, and type consistency.
#include <vector>
#include "uvector.hpp"
namespace algoim
{
template <typename T, int N>
class xarray;
template <typename T>
class SparkStack
{
static constexpr size_t capacity = 1u << 23;
static constexpr int capacity_line = __LINE__ - 1;
template <typename... R>
static size_t alloc(T** ptr, size_t len, R... rest)
{
if (pos() + len > capacity) {
std::cerr << "SparkStack<T = " << typeid(T).name() << ">: capacity=" << capacity << " and pos=" << pos()
<< " insufficient for request len=" << len << '\n';
std::cerr << " consider increasing const 'capacity', defined on line " << capacity_line << " in file "
<< __FILE__ << '\n';
throw std::bad_alloc();
}
// std::cout << "Before alloc, the **ptr pointing to nullptr is not nullptr: " << ptr << std::endl;
*ptr = base() + pos();
// std::cout << "pos before += len:" << pos() << std::endl;
pos() += len;
// std::cout << "pos after += len:" << pos() << std::endl;
// std::cout << "base: " << base() << std::endl;
// std::cout << "ptr: " << ptr << std::endl;
// std::cout << "*ptr: " << *ptr << std::endl;
// std::cout << "==========" << std::endl;
if constexpr (sizeof...(rest) == 0)
return len;
else
return len + alloc(rest...);
}
static T* base()
{
static thread_local std::vector<T> buff(capacity);
return buff.data();
}
static ptrdiff_t& pos()
{
static thread_local ptrdiff_t pos_ = 0;
return pos_;
};
size_t len_;
SparkStack(const SparkStack&) = delete;
SparkStack(SparkStack&&) = delete;
SparkStack& operator=(const SparkStack&) = delete;
SparkStack& operator=(SparkStack&&) = delete;
public:
// With parameters x0, n0, x1, n1, x2, n2, ..., allocate n0 elements and assign to x0, etc.
template <typename... R>
explicit SparkStack(T** ptr, size_t len, R&&... rest)
{
len_ = alloc(ptr, len, rest...);
}
// With parameters value, x0, n0, x1, n1, x2, n2, ..., allocate n0 elements and assign to x0, ...,
// and assign the given value to all n0*n1*n2*... values allocated
template <typename... R>
explicit SparkStack(T value, T** ptr, size_t len, R&&... rest)
{
T* start = base() + pos();
len_ = alloc(ptr, len, rest...);
for (int i = 0; i < len_; ++i) *(start + i) = value;
}
// For each i, allocate ext(i) elements and assign to ptr(i)
template <int N>
explicit SparkStack(uvector<T*, N>& ptr, const uvector<int, N>& ext)
{
len_ = 0;
for (int i = 0; i < N; ++i) len_ += alloc(&ptr(i), ext(i));
}
// Allocate enough elements for one or more xarray's having pre-set extent
template <int... N>
explicit SparkStack(xarray<T, N>&... a)
{
len_ = (alloc(&a.data_, a.size()) + ...);
}
template <int N>
explicit SparkStack(std::vector<xarray<T, N>>& as)
{
len_ = 0;
for (auto& a : as) len_ += alloc(&a.data_, a.size());
}
// Release memory when the SparkStack object goes out of scope
~SparkStack()
{
pos() -= len_;
// std::cout << "Here! len = " << len_ << std::endl;
}
};
#define algoim_CONCAT2(x, y) x##y
#define algoim_CONCAT(x, y) algoim_CONCAT2(x, y)
#define algoim_spark_alloc(T, ...) SparkStack<T> algoim_CONCAT(spark_alloc_var_, __LINE__)(__VA_ARGS__)
#define algoim_spark_alloc_def(T, val, ...) SparkStack<T> algoim_CONCAT(spark_alloc_var_, __LINE__)(val, __VA_ARGS__)
#define algoim_spark_alloc_vec(T, ptr, ext) SparkStack<T> algoim_CONCAT(spark_alloc_var_, __LINE__)(ptr, ext)
#define algoim_spark_alloc_heap(T, ...) new SparkStack<T>(__VA_ARGS__)
#define algoim_spark_release_heap(SparkStackPtr) delete SparkStackPtr
void algoimSparkAllocHeapVector(std::vector<SparkStack<real>*>& sparkStackPtrs, std::vector<xarray<real, 3>>& tensors)
{
for (int i = 0; i < tensors.size(); ++i) { sparkStackPtrs.push_back(algoim_spark_alloc_heap(real, tensors[i])); }
}
} // namespace algoim
#endif