From 0ef8ce0d60996be2467fd4ccff324d4786243f27 Mon Sep 17 00:00:00 2001 From: Nick Terrell Date: Wed, 26 Apr 2017 10:32:25 -0700 Subject: [PATCH] small_vector improvements Summary: 1. `emplace_back()` is broken when there are at least two arguments and one is a reference to inside the vector. See the `ForwardingEmplaceInsideVector` test. 2. Only `push_back(value_type&&)` did exponential growth, every other function grew linearly. The bug is hidden inside of facebook because `goodMallocSize()` grows fast enough to not be horribly slow. When not using jemalloc, it will grow one element at a time. 3. `push_back(value_type const& t)` performed a copy and a move on `t` when `size() == capacity()`. Remove the extra move. Fixes https://github.com/facebook/folly/issues/541. Reviewed By: luciang Differential Revision: D4875084 fbshipit-source-id: eefa76028c6bfd9d7c73af65e8bb9d4baf49b8cb --- folly/small_vector.h | 184 ++++++++++++++++--------------- folly/test/small_vector_test.cpp | 140 +++++++++++++++++++++++ 2 files changed, 235 insertions(+), 89 deletions(-) diff --git a/folly/small_vector.h b/folly/small_vector.h index 1cb111e3..12eba17f 100644 --- a/folly/small_vector.h +++ b/folly/small_vector.h @@ -43,6 +43,7 @@ #include #include +#include #include #include #include @@ -120,6 +121,42 @@ namespace detail { std::memmove(out, first, (last - first) * sizeof *first); } + /* + * Move a range to a range of uninitialized memory. Assumes the + * ranges don't overlap. Inserts an element at out + pos using emplaceFunc(). + * out will contain (end - begin) + 1 elements on success and none on failure. + * If emplaceFunc() throws [begin, end) is unmodified. + */ + template + void moveToUninitializedEmplace( + T* begin, + T* end, + T* out, + Size pos, + EmplaceFunc&& emplaceFunc) { + // Must be called first so that if it throws [begin, end) is unmodified. + // We have to support the strong exception guarantee for emplace_back(). + emplaceFunc(out + pos); + // move old elements to the left of the new one + try { + detail::moveToUninitialized(begin, begin + pos, out); + } catch (...) { + out[pos].~T(); + throw; + } + // move old elements to the right of the new one + try { + if (begin + pos < end) { + detail::moveToUninitialized(begin + pos, end, out + pos + 1); + } + } catch (...) { + for (Size i = 0; i <= pos; ++i) { + out[i].~T(); + } + throw; + } + } + /* * Move objects in memory to the right into some uninitialized * memory, where the region overlaps. This doesn't just use @@ -638,44 +675,28 @@ class small_vector tmp.swap(*this); } - template + template void emplace_back(Args&&... args) { - // call helper function for static dispatch of special cases - emplaceBack(std::forward(args)...); - } - - void emplace_back(const value_type& t) { - push_back(t); - } - void emplace_back(value_type& t) { - push_back(t); - } - - void emplace_back(value_type&& t) { - push_back(std::move(t)); - } - - void push_back(value_type&& t) { if (capacity() == size()) { - makeSize(std::max(size_type(2), 3 * size() / 2), &t, size()); + // Any of args may be references into the vector. + // When we are reallocating, we have to be careful to construct the new + // element before modifying the data in the old buffer. + makeSize( + size() + 1, + [&](void* p) { new (p) value_type(std::forward(args)...); }, + size()); } else { - new (end()) value_type(std::move(t)); + new (end()) value_type(std::forward(args)...); } this->setSize(size() + 1); } + void push_back(value_type&& t) { + return emplace_back(std::move(t)); + } + void push_back(value_type const& t) { - // TODO: we'd like to make use of makeSize (it can be optimized better, - // because it manipulates the internals) - // unfortunately the current implementation only supports moving from - // a supplied rvalue, and doing an extra move just to reuse it is a perf - // net loss - if (size() == capacity()) {// && isInside(&t)) { - value_type tmp(t); - emplaceBack(std::move(tmp)); - } else { - emplaceBack(t); - } + emplace_back(t); } void pop_back() { @@ -693,10 +714,12 @@ class small_vector auto offset = p - begin(); if (capacity() == size()) { - makeSize(size() + 1, &t, offset); + makeSize( + size() + 1, + [&t](void* ptr) { new (ptr) value_type(std::move(t)); }, + offset); this->setSize(this->size() + 1); } else { - makeSize(size() + 1); detail::moveObjectsRight(data() + offset, data() + size(), data() + size() + 1); @@ -803,17 +826,6 @@ class small_vector private: - /* - * This is doing the same like emplace_back, but we need this helper - * to catch the special case - see the next overload function.. - */ - template - void emplaceBack(Args&&... args) { - makeSize(size() + 1); - new (end()) value_type(std::forward(args)...); - this->setSize(size() + 1); - } - static iterator unconst(const_iterator it) { return const_cast(it); } @@ -900,30 +912,50 @@ private: doConstruct(n, [&](void* p) { new (p) value_type(val); }); } - void makeSize(size_type size, value_type* v = nullptr) { - makeSize(size, v, size - 1); + /* + * Compute the size after growth. + */ + size_type computeNewSize() const { + return std::min((3 * capacity()) / 2 + 1, max_size()); + } + + void makeSize(size_type newSize) { + makeSizeInternal(newSize, false, [](void*) { assume_unreachable(); }, 0); + } + + template + void makeSize(size_type newSize, EmplaceFunc&& emplaceFunc, size_type pos) { + assert(size() == capacity()); + makeSizeInternal( + newSize, true, std::forward(emplaceFunc), pos); } /* - * Ensure we have a large enough memory region to be size `size'. + * Ensure we have a large enough memory region to be size `newSize'. * Will move/copy elements if we are spilling to heap_ or needed to * allocate a new region, but if resized in place doesn't initialize * anything in the new region. In any case doesn't change size(). * Supports insertion of new element during reallocation by given * pointer to new element and position of new element. - * NOTE: If reallocation is not needed, and new element should be - * inserted in the middle of vector (not at the end), do the move - * objects and insertion outside the function, otherwise exception is thrown. + * NOTE: If reallocation is not needed, insert must be false, + * because we only know how to emplace elements into new memory. */ - void makeSize(size_type size, value_type* v, size_type pos) { - if (size > this->max_size()) { + template + void makeSizeInternal( + size_type newSize, + bool insert, + EmplaceFunc&& emplaceFunc, + size_type pos) { + if (newSize > max_size()) { throw std::length_error("max_size exceeded in small_vector"); } - if (size <= this->capacity()) { + if (newSize <= capacity()) { + assert(!insert); return; } + newSize = std::max(newSize, computeNewSize()); - auto needBytes = size * sizeof(value_type); + auto needBytes = newSize * sizeof(value_type); // If the capacity isn't explicitly stored inline, but the heap // allocation is grown to over some threshold, we should store // a capacity at the front of the heap allocation. @@ -943,44 +975,18 @@ private: detail::shiftPointer(newh, kHeapifyCapacitySize) : newh); - if (v != nullptr) { - // move new element - try { - new (&newp[pos]) value_type(std::move(*v)); - } catch (...) { - free(newh); - throw; - } - - // move old elements to the left of the new one - try { - detail::moveToUninitialized(begin(), begin() + pos, newp); - } catch (...) { - newp[pos].~value_type(); - free(newh); - throw; - } - - // move old elements to the right of the new one - try { - if (pos < size-1) { - detail::moveToUninitialized(begin() + pos, end(), newp + pos + 1); - } - } catch (...) { - for (size_type i = 0; i <= pos; ++i) { - newp[i].~value_type(); - } - free(newh); - throw; - } - } else { - // move without inserting new element - try { + try { + if (insert) { + // move and insert the new element + detail::moveToUninitializedEmplace( + begin(), end(), newp, pos, std::forward(emplaceFunc)); + } else { + // move without inserting new element detail::moveToUninitialized(begin(), end(), newp); - } catch (...) { - free(newh); - throw; } + } catch (...) { + free(newh); + throw; } for (auto& val : *this) { val.~value_type(); diff --git a/folly/test/small_vector_test.cpp b/folly/test/small_vector_test.cpp index db63d491..38e1d37b 100644 --- a/folly/test/small_vector_test.cpp +++ b/folly/test/small_vector_test.cpp @@ -739,6 +739,7 @@ struct CheckedInt { static const int DEFAULT_VALUE = (int)0xdeadbeef; CheckedInt(): value(DEFAULT_VALUE) {} explicit CheckedInt(int value): value(value) {} + CheckedInt(const CheckedInt& rhs, int) : value(rhs.value) {} CheckedInt(const CheckedInt& rhs): value(rhs.value) {} CheckedInt(CheckedInt&& rhs) noexcept: value(rhs.value) { rhs.value = DEFAULT_VALUE; @@ -756,6 +757,15 @@ struct CheckedInt { int value; }; +TEST(small_vector, ForwardingEmplaceInsideVector) { + folly::small_vector v; + v.push_back(CheckedInt(1)); + for (int i = 1; i < 20; ++i) { + v.emplace_back(v[0], 42); + ASSERT_EQ(1, v.back().value); + } +} + TEST(small_vector, LVEmplaceInsideVector) { folly::small_vector v; v.push_back(CheckedInt(1)); @@ -856,3 +866,133 @@ TEST(small_vector, ZeroInitializable) { EXPECT_EQ(element, 0); } } + +TEST(small_vector, InsertMoreThanGrowth) { + small_vector test; + test.insert(test.end(), 30, 0); + for (auto element : test) { + EXPECT_EQ(element, 0); + } +} + +TEST(small_vector, EmplaceBackExponentialGrowth) { + small_vector> test; + std::vector capacities; + capacities.push_back(test.capacity()); + for (int i = 0; i < 10000; ++i) { + test.emplace_back(0, 0); + if (test.capacity() != capacities.back()) { + capacities.push_back(test.capacity()); + } + } + EXPECT_LE(capacities.size(), 25); +} + +TEST(small_vector, InsertExponentialGrowth) { + small_vector> test; + std::vector capacities; + capacities.push_back(test.capacity()); + for (int i = 0; i < 10000; ++i) { + test.insert(test.begin(), std::make_pair(0, 0)); + if (test.capacity() != capacities.back()) { + capacities.push_back(test.capacity()); + } + } + EXPECT_LE(capacities.size(), 25); +} + +TEST(small_vector, InsertNExponentialGrowth) { + small_vector test; + std::vector capacities; + capacities.push_back(test.capacity()); + for (int i = 0; i < 10000; ++i) { + test.insert(test.begin(), 100, 0); + if (test.capacity() != capacities.back()) { + capacities.push_back(test.capacity()); + } + } + EXPECT_LE(capacities.size(), 25); +} + +namespace { +struct Counts { + size_t copyCount{0}; + size_t moveCount{0}; +}; + +class Counter { + Counts* counts; + + public: + explicit Counter(Counts& counts) : counts(&counts) {} + Counter(Counter const& other) noexcept : counts(other.counts) { + ++counts->copyCount; + } + Counter(Counter&& other) noexcept : counts(other.counts) { + ++counts->moveCount; + } + Counter& operator=(Counter const& rhs) noexcept { + EXPECT_EQ(counts, rhs.counts); + ++counts->copyCount; + return *this; + } + Counter& operator=(Counter&& rhs) noexcept { + EXPECT_EQ(counts, rhs.counts); + ++counts->moveCount; + return *this; + } +}; +} + +TEST(small_vector, EmplaceBackEfficiency) { + small_vector test; + Counts counts; + for (size_t i = 1; i <= test.capacity(); ++i) { + test.emplace_back(counts); + EXPECT_EQ(0, counts.copyCount); + EXPECT_EQ(0, counts.moveCount); + } + EXPECT_EQ(test.size(), test.capacity()); + test.emplace_back(counts); + // Every element except the last has to be moved to the new position + EXPECT_EQ(0, counts.copyCount); + EXPECT_EQ(test.size() - 1, counts.moveCount); + EXPECT_LT(test.size(), test.capacity()); +} + +TEST(small_vector, RVPushBackEfficiency) { + small_vector test; + Counts counts; + for (size_t i = 1; i <= test.capacity(); ++i) { + test.push_back(Counter(counts)); + // 1 copy for each push_back() + EXPECT_EQ(0, counts.copyCount); + EXPECT_EQ(i, counts.moveCount); + } + EXPECT_EQ(test.size(), test.capacity()); + test.push_back(Counter(counts)); + // 1 move for each push_back() + // Every element except the last has to be moved to the new position + EXPECT_EQ(0, counts.copyCount); + EXPECT_EQ(test.size() + test.size() - 1, counts.moveCount); + EXPECT_LT(test.size(), test.capacity()); +} + +TEST(small_vector, CLVPushBackEfficiency) { + small_vector test; + Counts counts; + Counter const counter(counts); + for (size_t i = 1; i <= test.capacity(); ++i) { + test.push_back(counter); + // 1 copy for each push_back() + EXPECT_EQ(i, counts.copyCount); + EXPECT_EQ(0, counts.moveCount); + } + EXPECT_EQ(test.size(), test.capacity()); + test.push_back(counter); + // 1 copy for each push_back() + EXPECT_EQ(test.size(), counts.copyCount); + // Every element except the last has to be moved to the new position + EXPECT_EQ(test.size() - 1, counts.moveCount); + EXPECT_LT(test.size(), test.capacity()); +} -- 2.34.1