Commit 67943c23 authored by Kevin Modzelewski's avatar Kevin Modzelewski

Avoid allocations in pyElements()

I had added an allocation to deal with the requirements refcounting
added.  To remove that allocation, I added a "SmallUniquePtr" class
which is similar to unique_ptr but it allocates the object in-line.

It's a bit tricky to use since if the containing object gets moved around
then the pointers become invalid.
parent a0f0cb72
...@@ -591,20 +591,70 @@ public: ...@@ -591,20 +591,70 @@ public:
Box* operator*() { return impl->getValue(); } Box* operator*() { return impl->getValue(); }
}; };
template <typename T, int N> class SmallUniquePtr {
private:
char _data[N];
bool owned;
#ifndef NDEBUG
bool address_taken = false;
#endif
template <typename ConcreteType, typename... Args> SmallUniquePtr(ConcreteType* dummy, Args... args) {
static_assert(sizeof(ConcreteType) <= N, "SmallUniquePtr not large enough to contain this object");
new (_data) ConcreteType(std::forward<Args>(args)...);
owned = true;
}
public:
template <typename ConcreteType, typename... Args> static SmallUniquePtr emplace(Args... args) {
return SmallUniquePtr<T, N>((ConcreteType*)nullptr, args...);
}
SmallUniquePtr(const SmallUniquePtr&) = delete;
SmallUniquePtr(SmallUniquePtr&& rhs) { *this = std::move(rhs); }
void operator=(const SmallUniquePtr&) = delete;
void operator=(SmallUniquePtr&& rhs) {
assert(!rhs.address_taken && "Invalid copy after being converted to a pointer");
std::swap(_data, rhs._data);
owned = false;
std::swap(owned, rhs.owned);
}
~SmallUniquePtr() {
if (owned)
((T*)this)->~T();
}
operator T*() {
#ifndef NDEBUG
address_taken = true;
#endif
return reinterpret_cast<T*>(_data);
}
};
// A custom "range" container that helps manage lifetimes. We need to free the underlying Impl object // A custom "range" container that helps manage lifetimes. We need to free the underlying Impl object
// when the range loop is done; previously we had the iterator itself handle this, but that started // when the range loop is done; previously we had the iterator itself handle this, but that started
// to get complicated since they get copied around, and the management of the begin() and end() iterators // to get complicated since they get copied around, and the management of the begin() and end() iterators
// is slightly different. // is slightly different.
// So to simplify, have the range object take care of it. // So to simplify, have the range object take care of it.
//
// Note: be careful when explicitly calling begin(). The returned iterator points into this BoxIteratorRange
// object, so once you call begin() it is a bug to move/copy this BoxIteratorRange object (the SmallUniquePtr
// should complain).
class BoxIteratorRange { class BoxIteratorRange {
private: private:
std::unique_ptr<BoxIteratorImpl> begin_impl; // std::unique_ptr<BoxIteratorImpl> begin_impl;
// char _data[32];
typedef SmallUniquePtr<BoxIteratorImpl, 32> UniquePtr;
UniquePtr begin_impl;
BoxIteratorImpl* end_impl; BoxIteratorImpl* end_impl;
public: public:
BoxIteratorRange(std::unique_ptr<BoxIteratorImpl> begin, BoxIteratorImpl* end) template <typename ImplType, typename T>
: begin_impl(std::move(begin)), end_impl(end) {} BoxIteratorRange(BoxIteratorImpl* end, T&& arg, ImplType* dummy)
BoxIterator begin() { return BoxIterator(begin_impl.get()); } : begin_impl(UniquePtr::emplace<ImplType, T>(arg)), end_impl(end) {}
BoxIterator begin() { return BoxIterator(begin_impl); }
BoxIterator end() { return BoxIterator(end_impl); } BoxIterator end() { return BoxIterator(end_impl); }
int traverse(visitproc visit, void* arg) { int traverse(visitproc visit, void* arg) {
......
...@@ -803,15 +803,15 @@ Box* map(Box* f, BoxedTuple* args) { ...@@ -803,15 +803,15 @@ Box* map(Box* f, BoxedTuple* args) {
if (num_iterable == 1) if (num_iterable == 1)
return map2(f, args->elts[0]); return map2(f, args->elts[0]);
std::vector<BoxIteratorRange> ranges; std::deque<BoxIteratorRange> ranges;
std::vector<BoxIterator> args_it; std::vector<BoxIterator> args_it;
std::vector<BoxIterator> args_end; std::vector<BoxIterator> args_end;
for (auto e : *args) { for (auto e : *args) {
auto range = e->pyElements(); auto range = e->pyElements();
args_it.emplace_back(range.begin());
args_end.emplace_back(range.end());
ranges.push_back(std::move(range)); ranges.push_back(std::move(range));
args_it.emplace_back(ranges.back().begin());
args_end.emplace_back(ranges.back().end());
} }
assert(args_it.size() == num_iterable); assert(args_it.size() == num_iterable);
assert(args_end.size() == num_iterable); assert(args_end.size() == num_iterable);
...@@ -1221,11 +1221,13 @@ Box* zip(BoxedTuple* containers) { ...@@ -1221,11 +1221,13 @@ Box* zip(BoxedTuple* containers) {
return incref(rtn); return incref(rtn);
std::vector<BoxIteratorRange> ranges; std::vector<BoxIteratorRange> ranges;
ranges.reserve(containers->size());
for (auto container : *containers) { for (auto container : *containers) {
ranges.push_back(std::move(container->pyElements())); ranges.push_back(container->pyElements());
} }
std::vector<BoxIterator> iterators; std::vector<BoxIterator> iterators;
iterators.reserve(containers->size());
for (auto&& range : ranges) { for (auto&& range : ranges) {
iterators.push_back(std::move(range.begin())); iterators.push_back(std::move(range.begin()));
} }
......
...@@ -45,7 +45,7 @@ static std::deque<uint64_t> available_addrs; ...@@ -45,7 +45,7 @@ static std::deque<uint64_t> available_addrs;
#define STACK_REDZONE_SIZE PAGE_SIZE #define STACK_REDZONE_SIZE PAGE_SIZE
#define MAX_STACK_SIZE (4 * 1024 * 1024) #define MAX_STACK_SIZE (4 * 1024 * 1024)
static std::unordered_map<void*, BoxedGenerator*> s_generator_map; static llvm::DenseMap<void*, BoxedGenerator*> s_generator_map;
static_assert(THREADING_USE_GIL, "have to make the generator map thread safe!"); static_assert(THREADING_USE_GIL, "have to make the generator map thread safe!");
class RegisterHelper { class RegisterHelper {
......
...@@ -165,23 +165,19 @@ public: ...@@ -165,23 +165,19 @@ public:
BoxIteratorRange Box::pyElements() { BoxIteratorRange Box::pyElements() {
if (this->cls == list_cls) { if (this->cls == list_cls) {
using BoxIteratorList = BoxIteratorIndex<BoxedList>; using BoxIteratorList = BoxIteratorIndex<BoxedList>;
std::unique_ptr<BoxIteratorImpl> begin(new BoxIteratorList((BoxedList*)this));
BoxIteratorImpl* end = BoxIteratorList::end(); BoxIteratorImpl* end = BoxIteratorList::end();
return BoxIteratorRange(std::move(begin), end); return BoxIteratorRange(end, (BoxedList*)this, (BoxIteratorList*)nullptr);
} else if (this->cls == tuple_cls) { } else if (this->cls == tuple_cls) {
using BoxIteratorTuple = BoxIteratorIndex<BoxedTuple>; using BoxIteratorTuple = BoxIteratorIndex<BoxedTuple>;
std::unique_ptr<BoxIteratorImpl> begin(new BoxIteratorTuple((BoxedTuple*)this));
BoxIteratorImpl* end = BoxIteratorTuple::end(); BoxIteratorImpl* end = BoxIteratorTuple::end();
return BoxIteratorRange(std::move(begin), end); return BoxIteratorRange(end, (BoxedTuple*)this, (BoxIteratorTuple*)nullptr);
} else if (this->cls == str_cls) { } else if (this->cls == str_cls) {
using BoxIteratorString = BoxIteratorIndex<BoxedString>; using BoxIteratorString = BoxIteratorIndex<BoxedString>;
std::unique_ptr<BoxIteratorImpl> begin(new BoxIteratorString((BoxedString*)this));
BoxIteratorImpl* end = BoxIteratorString::end(); BoxIteratorImpl* end = BoxIteratorString::end();
return BoxIteratorRange(std::move(begin), end); return BoxIteratorRange(end, (BoxedString*)this, (BoxIteratorString*)nullptr);
} else { } else {
std::unique_ptr<BoxIteratorImpl> begin(new BoxIteratorGeneric(this));
BoxIteratorImpl* end = BoxIteratorGeneric::end(); BoxIteratorImpl* end = BoxIteratorGeneric::end();
return BoxIteratorRange(std::move(begin), end); return BoxIteratorRange(end, this, (BoxIteratorGeneric*)nullptr);
} }
} }
} }
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment