/*
 * Copyright 2016 Facebook, Inc.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

/*
 * Nicholas Ormrod      (njormrod)
 * Andrei Alexandrescu  (aalexandre)
 *
 * FBVector is Facebook's drop-in implementation of std::vector. It has
 * special optimizations for use with relocatable types and jemalloc.
 */
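/*
 * Example usage (an illustrative sketch; fbvector mirrors the std::vector
 * interface, so it can be substituted wherever std::vector is used):
 *
 *   folly::fbvector<int> v;
 *   v.reserve(100);
 *   for (int i = 0; i < 100; ++i) {
 *     v.push_back(i);
 *   }
 *   assert(v.size() == 100);
 */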
#pragma once

//=============================================================================
// headers

#include <algorithm>
#include <cassert>
#include <cstring>
#include <iterator>
#include <memory>
#include <stdexcept>
#include <type_traits>
#include <utility>

#include <folly/FormatTraits.h>
#include <folly/Likely.h>
#include <folly/Malloc.h>
#include <folly/Traits.h>

#include <boost/operators.hpp>

//=============================================================================
// forward declaration

namespace folly {
  template <class T, class Allocator = std::allocator<T>>
  class fbvector;
}

//=============================================================================
// unrolling

#define FOLLY_FBV_UNROLL_PTR(first, last, OP) do {  \
  for (; (last) - (first) >= 4; (first) += 4) {     \
    OP(((first) + 0));                              \
    OP(((first) + 1));                              \
    OP(((first) + 2));                              \
    OP(((first) + 3));                              \
  }                                                 \
  for (; (first) != (last); ++(first)) OP((first)); \
} while(0);

//=============================================================================
///////////////////////////////////////////////////////////////////////////////
//                                                                           //
//                              fbvector class                               //
//                                                                           //
///////////////////////////////////////////////////////////////////////////////

namespace folly {

template <class T, class Allocator>
class fbvector : private boost::totally_ordered<fbvector<T, Allocator>> {

  //===========================================================================
  //---------------------------------------------------------------------------
  // implementation
private:

  typedef std::allocator_traits<Allocator> A;

  struct Impl : public Allocator {
    // typedefs
    typedef typename A::pointer pointer;
    typedef typename A::size_type size_type;

    // data
    pointer b_, e_, z_;

    // constructors
    Impl() : Allocator(), b_(nullptr), e_(nullptr), z_(nullptr) {}
    /* implicit */ Impl(const Allocator& a)
      : Allocator(a), b_(nullptr), e_(nullptr), z_(nullptr) {}
    /* implicit */ Impl(Allocator&& a)
      : Allocator(std::move(a)), b_(nullptr), e_(nullptr), z_(nullptr) {}

    /* implicit */ Impl(size_type n, const Allocator& a = Allocator())
      : Allocator(a)
      { init(n); }

    Impl(Impl&& other) noexcept
      : Allocator(std::move(other)),
        b_(other.b_), e_(other.e_), z_(other.z_)
      { other.b_ = other.e_ = other.z_ = nullptr; }

    // destructor
    ~Impl() {
      destroy();
    }

    // allocation
    // note that 'allocate' and 'deallocate' are inherited from Allocator
    T* D_allocate(size_type n) {
      if (usingStdAllocator::value) {
        return static_cast<T*>(malloc(n * sizeof(T)));
      } else {
        return std::allocator_traits<Allocator>::allocate(*this, n);
      }
    }

    void D_deallocate(T* p, size_type n) noexcept {
      if (usingStdAllocator::value) {
        free(p);
      } else {
        std::allocator_traits<Allocator>::deallocate(*this, p, n);
      }
    }

    // helpers
    void swapData(Impl& other) {
      std::swap(b_, other.b_);
      std::swap(e_, other.e_);
      std::swap(z_, other.z_);
    }

    // data ops
    inline void destroy() noexcept {
      if (b_) {
        // THIS DISPATCH CODE IS DUPLICATED IN fbvector::D_destroy_range_a.
        // It has been inlined here for speed. It calls the static fbvector
        //  methods to perform the actual destruction.
        if (usingStdAllocator::value) {
          S_destroy_range(b_, e_);
        } else {
          S_destroy_range_a(*this, b_, e_);
        }

        D_deallocate(b_, z_ - b_);
      }
    }

    void init(size_type n) {
      if (UNLIKELY(n == 0)) {
        b_ = e_ = z_ = nullptr;
      } else {
        size_type sz = folly::goodMallocSize(n * sizeof(T)) / sizeof(T);
        b_ = D_allocate(sz);
        e_ = b_;
        z_ = b_ + sz;
      }
    }

    void set(pointer newB, size_type newSize, size_type newCap) {
      z_ = newB + newCap;
      e_ = newB + newSize;
      b_ = newB;
    }

    void reset(size_type newCap) {
      destroy();
      try {
        init(newCap);
      } catch (...) {
        init(0);
        throw;
      }
    }
    void reset() { // same as reset(0)
      destroy();
      b_ = e_ = z_ = nullptr;
    }
  } impl_;

  static void swap(Impl& a, Impl& b) {
    using std::swap;
    if (!usingStdAllocator::value) swap(a, b);
    a.swapData(b);
  }

  //===========================================================================
  //---------------------------------------------------------------------------
  // types and constants
public:

  typedef T                                           value_type;
  typedef value_type&                                 reference;
  typedef const value_type&                           const_reference;
  typedef T*                                          iterator;
  typedef const T*                                    const_iterator;
  typedef size_t                                      size_type;
  typedef typename std::make_signed<size_type>::type  difference_type;
  typedef Allocator                                   allocator_type;
  typedef typename A::pointer                         pointer;
  typedef typename A::const_pointer                   const_pointer;
  typedef std::reverse_iterator<iterator>             reverse_iterator;
  typedef std::reverse_iterator<const_iterator>       const_reverse_iterator;

private:

  typedef std::integral_constant<bool,
      boost::has_trivial_copy_constructor<T>::value &&
      sizeof(T) <= 16 // don't force large structures to be passed by value
    > should_pass_by_value;
  typedef typename std::conditional<
      should_pass_by_value::value, T, const T&>::type VT;
  typedef typename std::conditional<
      should_pass_by_value::value, T, T&&>::type MT;

  typedef std::integral_constant<bool,
      std::is_same<Allocator, std::allocator<T>>::value> usingStdAllocator;
  typedef std::integral_constant<bool,
      usingStdAllocator::value ||
      A::propagate_on_container_move_assignment::value> moveIsSwap;
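  // Note on the pass-by-value optimization above (an explanatory sketch, not
  //  part of the original interface): for a small trivially-copyable T such
  //  as int, should_pass_by_value holds and VT resolves to plain `int`, so
  //  value parameters can travel in registers. For a type like std::string,
  //  VT resolves to `const std::string&` and MT to `std::string&&`, avoiding
  //  an extra copy.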
  //===========================================================================
  //---------------------------------------------------------------------------
  // allocator helpers
private:

  //---------------------------------------------------------------------------
  // allocate

  T* M_allocate(size_type n) {
    return impl_.D_allocate(n);
  }

  //---------------------------------------------------------------------------
  // deallocate

  void M_deallocate(T* p, size_type n) noexcept {
    impl_.D_deallocate(p, n);
  }

  //---------------------------------------------------------------------------
  // construct

  // GCC is very sensitive to the exact way that construct is called. For
  //  that reason there are several different specializations of construct.

  template <typename U, typename... Args>
  void M_construct(U* p, Args&&... args) {
    if (usingStdAllocator::value) {
      new (p) U(std::forward<Args>(args)...);
    } else {
      std::allocator_traits<Allocator>::construct(
        impl_, p, std::forward<Args>(args)...);
    }
  }

  template <typename U, typename... Args>
  static void S_construct(U* p, Args&&... args) {
    new (p) U(std::forward<Args>(args)...);
  }

  template <typename U, typename... Args>
  static void S_construct_a(Allocator& a, U* p, Args&&... args) {
    std::allocator_traits<Allocator>::construct(
      a, p, std::forward<Args>(args)...);
  }

  // scalar optimization
  // TODO we can expand this optimization to: default copyable and assignable
  template <typename U, typename Enable = typename
    std::enable_if<std::is_scalar<U>::value>::type>
  void M_construct(U* p, U arg) {
    if (usingStdAllocator::value) {
      *p = arg;
    } else {
      std::allocator_traits<Allocator>::construct(impl_, p, arg);
    }
  }

  template <typename U, typename Enable = typename
    std::enable_if<std::is_scalar<U>::value>::type>
  static void S_construct(U* p, U arg) {
    *p = arg;
  }

  template <typename U, typename Enable = typename
    std::enable_if<std::is_scalar<U>::value>::type>
  static void S_construct_a(Allocator& a, U* p, U arg) {
    std::allocator_traits<Allocator>::construct(a, p, arg);
  }

  // const& optimization
  template <typename U, typename Enable = typename
    std::enable_if<!std::is_scalar<U>::value>::type>
  void M_construct(U* p, const U& value) {
    if (usingStdAllocator::value) {
      new (p) U(value);
    } else {
      std::allocator_traits<Allocator>::construct(impl_, p, value);
    }
  }

  template <typename U, typename Enable = typename
    std::enable_if<!std::is_scalar<U>::value>::type>
  static void S_construct(U* p, const U& value) {
    new (p) U(value);
  }

  template <typename U, typename Enable = typename
    std::enable_if<!std::is_scalar<U>::value>::type>
  static void S_construct_a(Allocator& a, U* p, const U& value) {
    std::allocator_traits<Allocator>::construct(a, p, value);
  }

  //---------------------------------------------------------------------------
  // destroy

  void M_destroy(T* p) noexcept {
    if (usingStdAllocator::value) {
      if (!boost::has_trivial_destructor<T>::value) p->~T();
    } else {
      std::allocator_traits<Allocator>::destroy(impl_, p);
    }
  }

  //===========================================================================
  //---------------------------------------------------------------------------
  // algorithmic helpers
private:

  //---------------------------------------------------------------------------
  // destroy_range

  // wrappers
  void M_destroy_range_e(T* pos) noexcept {
    D_destroy_range_a(pos, impl_.e_);
    impl_.e_ = pos;
  }

  // dispatch
  // THIS DISPATCH CODE IS DUPLICATED IN IMPL. SEE IMPL FOR DETAILS.
  void D_destroy_range_a(T* first, T* last) noexcept {
    if (usingStdAllocator::value) {
      S_destroy_range(first, last);
    } else {
      S_destroy_range_a(impl_, first, last);
    }
  }

  // allocator
  static void S_destroy_range_a(Allocator& a, T* first, T* last) noexcept {
    for (; first != last; ++first)
      std::allocator_traits<Allocator>::destroy(a, first);
  }

  // optimized
  static void S_destroy_range(T* first, T* last) noexcept {
    if (!boost::has_trivial_destructor<T>::value) {
      // EXPERIMENTAL DATA on fbvector<vector<int>> (where each vector has
      //  size 0).
      // The unrolled version seems to work faster for small to medium sized
      //  fbvectors. It gets a 10% speedup on fbvectors of size 1024, 64, and
      //  16.
      // The simple loop version seems to work faster for large fbvectors. The
      //  unrolled version is about 6% slower on fbvectors of size 16384.
      // The two methods seem tied for very large fbvectors. The unrolled
      //  version is about 0.5% slower on size 262144.
      // for (; first != last; ++first) first->~T();
      #define FOLLY_FBV_OP(p) (p)->~T()
      FOLLY_FBV_UNROLL_PTR(first, last, FOLLY_FBV_OP)
      #undef FOLLY_FBV_OP
    }
  }

  //---------------------------------------------------------------------------
  // uninitialized_fill_n

  // wrappers
  void M_uninitialized_fill_n_e(size_type sz) {
    D_uninitialized_fill_n_a(impl_.e_, sz);
    impl_.e_ += sz;
  }

  void M_uninitialized_fill_n_e(size_type sz, VT value) {
    D_uninitialized_fill_n_a(impl_.e_, sz, value);
    impl_.e_ += sz;
  }

  // dispatch
  void D_uninitialized_fill_n_a(T* dest, size_type sz) {
    if (usingStdAllocator::value) {
      S_uninitialized_fill_n(dest, sz);
    } else {
      S_uninitialized_fill_n_a(impl_, dest, sz);
    }
  }

  void D_uninitialized_fill_n_a(T* dest, size_type sz, VT value) {
    if (usingStdAllocator::value) {
      S_uninitialized_fill_n(dest, sz, value);
    } else {
      S_uninitialized_fill_n_a(impl_, dest, sz, value);
    }
  }

  // allocator
  template <typename... Args>
  static void S_uninitialized_fill_n_a(Allocator& a, T* dest,
                                       size_type sz, Args&&... args) {
    auto b = dest;
    auto e = dest + sz;
    try {
      for (; b != e; ++b)
        std::allocator_traits<Allocator>::construct(a, b,
          std::forward<Args>(args)...);
    } catch (...) {
      S_destroy_range_a(a, dest, b);
      throw;
    }
  }

  // optimized
  static void S_uninitialized_fill_n(T* dest, size_type n) {
    if (folly::IsZeroInitializable<T>::value) {
      std::memset(dest, 0, sizeof(T) * n);
    } else {
      auto b = dest;
      auto e = dest + n;
      try {
        for (; b != e; ++b) S_construct(b);
      } catch (...) {
        --b;
        for (; b >= dest; --b) b->~T();
        throw;
      }
    }
  }

  static void S_uninitialized_fill_n(T* dest, size_type n, const T& value) {
    auto b = dest;
    auto e = dest + n;
    try {
      for (; b != e; ++b) S_construct(b, value);
    } catch (...) {
      S_destroy_range(dest, b);
      throw;
    }
  }

  //---------------------------------------------------------------------------
  // uninitialized_copy

  // it is possible to add an optimization for the case where
  // It = move(T*) and IsRelocatable<T> and IsZeroInitializable<T>

  // wrappers
  template <typename It>
  void M_uninitialized_copy_e(It first, It last) {
    D_uninitialized_copy_a(impl_.e_, first, last);
    impl_.e_ += std::distance(first, last);
  }

  template <typename It>
  void M_uninitialized_move_e(It first, It last) {
    D_uninitialized_move_a(impl_.e_, first, last);
    impl_.e_ += std::distance(first, last);
  }

  // dispatch
  template <typename It>
  void D_uninitialized_copy_a(T* dest, It first, It last) {
    if (usingStdAllocator::value) {
      if (folly::IsTriviallyCopyable<T>::value) {
        S_uninitialized_copy_bits(dest, first, last);
      } else {
        S_uninitialized_copy(dest, first, last);
      }
    } else {
      S_uninitialized_copy_a(impl_, dest, first, last);
    }
  }

  template <typename It>
  void D_uninitialized_move_a(T* dest, It first, It last) {
    D_uninitialized_copy_a(dest,
      std::make_move_iterator(first), std::make_move_iterator(last));
  }

  // allocator
  template <typename It>
  static void
  S_uninitialized_copy_a(Allocator& a, T* dest, It first, It last) {
    auto b = dest;
    try {
      for (; first != last; ++first, ++b)
        std::allocator_traits<Allocator>::construct(a, b, *first);
    } catch (...) {
      S_destroy_range_a(a, dest, b);
      throw;
    }
  }

  // optimized
  template <typename It>
  static void S_uninitialized_copy(T* dest, It first, It last) {
    auto b = dest;
    try {
      for (; first != last; ++first, ++b)
        S_construct(b, *first);
    } catch (...) {
      S_destroy_range(dest, b);
      throw;
    }
  }

  static void
  S_uninitialized_copy_bits(T* dest, const T* first, const T* last) {
    if (last != first) {
      std::memcpy((void*)dest, (void*)first, (last - first) * sizeof(T));
    }
  }

  static void
  S_uninitialized_copy_bits(T* dest, std::move_iterator<T*> first,
                            std::move_iterator<T*> last) {
    T* bFirst = first.base();
    T* bLast = last.base();
    if (bLast != bFirst) {
      std::memcpy((void*)dest, (void*)bFirst, (bLast - bFirst) * sizeof(T));
    }
  }

  template <typename It>
  static void
  S_uninitialized_copy_bits(T* dest, It first, It last) {
    S_uninitialized_copy(dest, first, last);
  }

  //---------------------------------------------------------------------------
  // copy_n

  // This function is "unsafe": it assumes that the iterator can be advanced at
  //  least n times. However, as a private function, that unsafety is managed
  //  wholly by fbvector itself.

  template <typename It>
  static It S_copy_n(T* dest, It first, size_type n) {
    auto e = dest + n;
    for (; dest != e; ++dest, ++first) *dest = *first;
    return first;
  }

  static const T* S_copy_n(T* dest, const T* first, size_type n) {
    if (folly::IsTriviallyCopyable<T>::value) {
      std::memcpy((void*)dest, (void*)first, n * sizeof(T));
      return first + n;
    } else {
      return S_copy_n<const T*>(dest, first, n);
    }
  }

  static std::move_iterator<T*>
  S_copy_n(T* dest, std::move_iterator<T*> mIt, size_type n) {
    if (folly::IsTriviallyCopyable<T>::value) {
      T* first = mIt.base();
      std::memcpy((void*)dest, (void*)first, n * sizeof(T));
      return std::make_move_iterator(first + n);
    } else {
      return S_copy_n<std::move_iterator<T*>>(dest, mIt, n);
    }
  }

  //===========================================================================
  //---------------------------------------------------------------------------
  // relocation helpers
private:

  // Relocation is divided into three parts:
  //
  //  1: relocate_move
  //     Performs the actual movement of data from point a to point b.
  //
  //  2: relocate_done
  //     Destroys the old data.
  //
  //  3: relocate_undo
  //     Destroys the new data and restores the old data.
  //
  // The three steps are used because there may be an exception after part 1
  //  has completed. If that is the case, then relocate_undo can nullify the
  //  initial move. Otherwise, relocate_done performs the last bit of tidying
  //  up.
  //
  // The relocation trio may use either memcpy, move, or copy. It is decided
  //  by the following case statement:
  //
  //  IsRelocatable && usingStdAllocator    -> memcpy
  //  has_nothrow_move && usingStdAllocator -> move
  //  cannot copy                           -> move
  //  default                               -> copy
  //
  // If the class is non-copyable then it must be movable. However, if the
  //  move constructor is not noexcept, i.e. an error could be thrown, then
  //  relocate_undo will be unable to restore the old data, for fear of a
  //  second exception being thrown. This is a known and unavoidable
  //  deficiency. In lieu of a strong exception guarantee, relocate_undo does
  //  the next best thing: it provides a weak exception guarantee by
  //  destroying the new data, but leaving the old data in an indeterminate
  //  state. Note that the indeterminate state will be valid, since the
  //  old data has not been destroyed; it has merely been the source of a
  //  move, which is required to leave the source in a valid state.
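  // Concrete examples of the dispatch above (an illustrative sketch,
  //  assuming the default std::allocator):
  //
  //  - T = int: folly::IsRelocatable<int> holds, so relocation is a raw
  //    memcpy and relocate_done runs no destructors at all.
  //  - T with a noexcept move constructor (and no relocatable marking):
  //    elements are move-constructed into the new buffer; relocate_done
  //    then destroys the moved-from originals.
  //  - T that is copyable but whose move constructor may throw: elements
  //    are copy-constructed, so relocate_undo can simply destroy the new
  //    copies and the old data remains untouched.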
  // wrappers
  void M_relocate(T* newB) {
    relocate_move(newB, impl_.b_, impl_.e_);
    relocate_done(newB, impl_.b_, impl_.e_);
  }

  // dispatch type trait
  typedef std::integral_constant<bool,
      folly::IsRelocatable<T>::value && usingStdAllocator::value
    > relocate_use_memcpy;

  typedef std::integral_constant<bool,
      (std::is_nothrow_move_constructible<T>::value
       && usingStdAllocator::value)
      || !std::is_copy_constructible<T>::value
    > relocate_use_move;

  // move
  void relocate_move(T* dest, T* first, T* last) {
    relocate_move_or_memcpy(dest, first, last, relocate_use_memcpy());
  }

  void relocate_move_or_memcpy(T* dest, T* first, T* last, std::true_type) {
    if (first != nullptr) {
      std::memcpy((void*)dest, (void*)first, (last - first) * sizeof(T));
    }
  }

  void relocate_move_or_memcpy(T* dest, T* first, T* last, std::false_type) {
    relocate_move_or_copy(dest, first, last, relocate_use_move());
  }

  void relocate_move_or_copy(T* dest, T* first, T* last, std::true_type) {
    D_uninitialized_move_a(dest, first, last);
  }

  void relocate_move_or_copy(T* dest, T* first, T* last, std::false_type) {
    D_uninitialized_copy_a(dest, first, last);
  }

  // done
  void relocate_done(T* /*dest*/, T* first, T* last) noexcept {
    if (folly::IsRelocatable<T>::value && usingStdAllocator::value) {
      // used memcpy; data has been relocated, do not call destructor
    } else {
      D_destroy_range_a(first, last);
    }
  }

  // undo
  void relocate_undo(T* dest, T* first, T* last) noexcept {
    if (folly::IsRelocatable<T>::value && usingStdAllocator::value) {
      // used memcpy, old data is still valid, nothing to do
    } else if (std::is_nothrow_move_constructible<T>::value &&
               usingStdAllocator::value) {
      // noexcept move everything back, aka relocate_move
      relocate_move(first, dest, dest + (last - first));
    } else if (!std::is_copy_constructible<T>::value) {
      // weak guarantee
      D_destroy_range_a(dest, dest + (last - first));
    } else {
      // used copy, old data is still valid
      D_destroy_range_a(dest, dest + (last - first));
    }
  }
  //===========================================================================
  //---------------------------------------------------------------------------
  // construct/copy/destroy
public:

  fbvector() = default;

  explicit fbvector(const Allocator& a) : impl_(a) {}

  explicit fbvector(size_type n, const Allocator& a = Allocator())
    : impl_(n, a)
    { M_uninitialized_fill_n_e(n); }

  fbvector(size_type n, VT value, const Allocator& a = Allocator())
    : impl_(n, a)
    { M_uninitialized_fill_n_e(n, value); }

  template <class It, class Category = typename
            std::iterator_traits<It>::iterator_category>
  fbvector(It first, It last, const Allocator& a = Allocator())
    : fbvector(first, last, a, Category()) {}

  fbvector(const fbvector& other)
    : impl_(other.size(),
            A::select_on_container_copy_construction(other.impl_))
    { M_uninitialized_copy_e(other.begin(), other.end()); }

  fbvector(fbvector&& other) noexcept : impl_(std::move(other.impl_)) {}

  fbvector(const fbvector& other, const Allocator& a)
    : fbvector(other.begin(), other.end(), a) {}

  /* may throw */ fbvector(fbvector&& other, const Allocator& a) : impl_(a) {
    if (impl_ == other.impl_) {
      impl_.swapData(other.impl_);
    } else {
      impl_.init(other.size());
      M_uninitialized_move_e(other.begin(), other.end());
    }
  }

  fbvector(std::initializer_list<T> il, const Allocator& a = Allocator())
    : fbvector(il.begin(), il.end(), a) {}

  ~fbvector() = default; // the cleanup occurs in impl_

  fbvector& operator=(const fbvector& other) {
    if (UNLIKELY(this == &other)) return *this;

    if (!usingStdAllocator::value &&
        A::propagate_on_container_copy_assignment::value) {
      if (impl_ != other.impl_) {
        // can't use other's different allocator to clean up self
        impl_.reset();
      }
      (Allocator&)impl_ = (Allocator&)other.impl_;
    }

    assign(other.begin(), other.end());
    return *this;
  }

  fbvector& operator=(fbvector&& other) {
    if (UNLIKELY(this == &other)) return *this;
    moveFrom(std::move(other), moveIsSwap());
    return *this;
  }

  fbvector& operator=(std::initializer_list<T> il) {
    assign(il.begin(), il.end());
    return *this;
  }

  template <class It, class Category = typename
            std::iterator_traits<It>::iterator_category>
  void assign(It first, It last) {
    assign(first, last, Category());
  }

  void assign(size_type n, VT value) {
    if (n > capacity()) {
      // Not enough space. Do not reserve in place, since we will
      //  discard the old values anyway.
      if (dataIsInternalAndNotVT(value)) {
        T copy(std::move(value));
        impl_.reset(n);
        M_uninitialized_fill_n_e(n, copy);
      } else {
        impl_.reset(n);
        M_uninitialized_fill_n_e(n, value);
      }
    } else if (n <= size()) {
      auto newE = impl_.b_ + n;
      std::fill(impl_.b_, newE, value);
      M_destroy_range_e(newE);
    } else {
      std::fill(impl_.b_, impl_.e_, value);
      M_uninitialized_fill_n_e(n - size(), value);
    }
  }

  void assign(std::initializer_list<T> il) {
    assign(il.begin(), il.end());
  }

  allocator_type get_allocator() const noexcept {
    return impl_;
  }

private:

  // contract dispatch for iterator types fbvector(It first, It last)
  template <class ForwardIterator>
  fbvector(ForwardIterator first, ForwardIterator last,
           const Allocator& a, std::forward_iterator_tag)
    : impl_(std::distance(first, last), a)
    { M_uninitialized_copy_e(first, last); }

  template <class InputIterator>
  fbvector(InputIterator first, InputIterator last,
           const Allocator& a, std::input_iterator_tag)
    : impl_(a)
    { for (; first != last; ++first) emplace_back(*first); }

  // contract dispatch for allocator movement in operator=(fbvector&&)
  void moveFrom(fbvector&& other, std::true_type) {
    swap(impl_, other.impl_);
  }
  void moveFrom(fbvector&& other, std::false_type) {
    if (impl_ == other.impl_) {
      impl_.swapData(other.impl_);
    } else {
      impl_.reset(other.size());
      M_uninitialized_move_e(other.begin(), other.end());
    }
  }

  // contract dispatch for iterator types in assign(It first, It last)
  template <class ForwardIterator>
  void assign(ForwardIterator first, ForwardIterator last,
              std::forward_iterator_tag) {
    const size_t newSize = std::distance(first, last);
    if (newSize > capacity()) {
      impl_.reset(newSize);
      M_uninitialized_copy_e(first, last);
    } else if (newSize <= size()) {
      auto newEnd = std::copy(first, last, impl_.b_);
      M_destroy_range_e(newEnd);
    } else {
      auto mid = S_copy_n(impl_.b_, first, size());
      M_uninitialized_copy_e(mid, last);
    }
  }

  template <class InputIterator>
  void assign(InputIterator first, InputIterator last,
              std::input_iterator_tag) {
    auto p = impl_.b_;
    for (; first != last && p != impl_.e_; ++first, ++p) {
      *p = *first;
    }
    if (p != impl_.e_) {
      M_destroy_range_e(p);
    } else {
      for (; first != last; ++first) emplace_back(*first);
    }
  }

  // contract dispatch for aliasing under VT optimization
  bool dataIsInternalAndNotVT(const T& t) {
    if (should_pass_by_value::value) return false;
    return dataIsInternal(t);
  }
  bool dataIsInternal(const T& t) {
    return UNLIKELY(impl_.b_ <= std::addressof(t) &&
                    std::addressof(t) < impl_.e_);
  }
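  // A sketch of the aliasing hazard this machinery guards against
  //  (illustrative): when T is not passed by value, the reference taken by
  //  assign(n, value) may point into the vector's own storage.
  //
  //    folly::fbvector<std::string> v(3, "x");
  //    v.assign(10, v[0]);  // v[0] lives between b_ and e_, so
  //                         //  dataIsInternalAndNotVT copies it out before
  //                         //  the old storage is reset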
  //===========================================================================
  //---------------------------------------------------------------------------
  // iterators
public:

  iterator begin() noexcept {
    return impl_.b_;
  }
  const_iterator begin() const noexcept {
    return impl_.b_;
  }
  iterator end() noexcept {
    return impl_.e_;
  }
  const_iterator end() const noexcept {
    return impl_.e_;
  }
  reverse_iterator rbegin() noexcept {
    return reverse_iterator(end());
  }
  const_reverse_iterator rbegin() const noexcept {
    return const_reverse_iterator(end());
  }
  reverse_iterator rend() noexcept {
    return reverse_iterator(begin());
  }
  const_reverse_iterator rend() const noexcept {
    return const_reverse_iterator(begin());
  }

  const_iterator cbegin() const noexcept {
    return impl_.b_;
  }
  const_iterator cend() const noexcept {
    return impl_.e_;
  }
  const_reverse_iterator crbegin() const noexcept {
    return const_reverse_iterator(end());
  }
  const_reverse_iterator crend() const noexcept {
    return const_reverse_iterator(begin());
  }

  //===========================================================================
  //---------------------------------------------------------------------------
  // capacity
public:

  size_type size() const noexcept {
    return impl_.e_ - impl_.b_;
  }

  size_type max_size() const noexcept {
    // good luck gettin' there
    return ~size_type(0);
  }

  void resize(size_type n) {
    if (n <= size()) {
      M_destroy_range_e(impl_.b_ + n);
    } else {
      reserve(n);
      M_uninitialized_fill_n_e(n - size());
    }
  }

  void resize(size_type n, VT t) {
    if (n <= size()) {
      M_destroy_range_e(impl_.b_ + n);
    } else if (dataIsInternalAndNotVT(t) && n > capacity()) {
      T copy(t);
      reserve(n);
      M_uninitialized_fill_n_e(n - size(), copy);
    } else {
      reserve(n);
      M_uninitialized_fill_n_e(n - size(), t);
    }
  }

  size_type capacity() const noexcept {
    return impl_.z_ - impl_.b_;
  }

  bool empty() const noexcept {
    return impl_.b_ == impl_.e_;
  }

  void reserve(size_type n) {
    if (n <= capacity()) return;
    if (impl_.b_ && reserve_in_place(n)) return;

    auto newCap = folly::goodMallocSize(n * sizeof(T)) / sizeof(T);
    auto newB = M_allocate(newCap);
    try {
      M_relocate(newB);
    } catch (...) {
      M_deallocate(newB, newCap);
      throw;
    }
    if (impl_.b_)
      M_deallocate(impl_.b_, impl_.z_ - impl_.b_);
    impl_.z_ = newB + newCap;
    impl_.e_ = newB + (impl_.e_ - impl_.b_);
    impl_.b_ = newB;
  }

  void shrink_to_fit() noexcept {
    if (empty()) {
      impl_.reset();
      return;
    }

    auto const newCapacityBytes = folly::goodMallocSize(size() * sizeof(T));
    auto const newCap = newCapacityBytes / sizeof(T);
    auto const oldCap = capacity();

    if (newCap >= oldCap) return;

    void* p = impl_.b_;
    // xallocx() will shrink to precisely newCapacityBytes (which was generated
    //  by goodMallocSize()) if it successfully shrinks in place.
    if ((usingJEMalloc() && usingStdAllocator::value) &&
        newCapacityBytes >= folly::jemallocMinInPlaceExpandable &&
        xallocx(p, newCapacityBytes, 0, 0) == newCapacityBytes) {
      impl_.z_ += newCap - oldCap;
    } else {
      T* newB; // intentionally uninitialized
      try {
        newB = M_allocate(newCap);
        try {
          M_relocate(newB);
        } catch (...) {
          M_deallocate(newB, newCap);
          return; // swallow the error
        }
      } catch (...) {
        return;
      }
      if (impl_.b_)
        M_deallocate(impl_.b_, impl_.z_ - impl_.b_);
      impl_.z_ = newB + newCap;
      impl_.e_ = newB + (impl_.e_ - impl_.b_);
      impl_.b_ = newB;
    }
  }

private:

  bool reserve_in_place(size_type n) {
    if (!usingStdAllocator::value || !usingJEMalloc()) return false;

    // jemalloc can never grow in place blocks smaller than 4096 bytes.
    if ((impl_.z_ - impl_.b_) * sizeof(T) <
        folly::jemallocMinInPlaceExpandable) {
      return false;
    }

    auto const newCapacityBytes = folly::goodMallocSize(n * sizeof(T));
    void* p = impl_.b_;
    if (xallocx(p, newCapacityBytes, 0, 0) == newCapacityBytes) {
      impl_.z_ = impl_.b_ + newCapacityBytes / sizeof(T);
      return true;
    }
    return false;
  }
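  // A sketch of what the in-place path buys us (illustrative, assuming
  //  jemalloc is the active allocator):
  //
  //    folly::fbvector<char> v(5000); // block >= jemallocMinInPlaceExpandable
  //    v.reserve(8000);               // xallocx may extend the same block,
  //                                   //  in which case v.data() is unchanged
  //
  //  xallocx(ptr, size, extra, flags) resizes the allocation at ptr in place
  //  and returns the resulting usable size; if it cannot reach `size`, the
  //  block is left unchanged and fbvector falls back to allocate-and-relocate.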
  //===========================================================================
  //---------------------------------------------------------------------------
  // element access
public:

  reference operator[](size_type n) {
    assert(n < size());
    return impl_.b_[n];
  }
  const_reference operator[](size_type n) const {
    assert(n < size());
    return impl_.b_[n];
  }
  const_reference at(size_type n) const {
    if (UNLIKELY(n >= size())) {
      std::__throw_out_of_range("fbvector: index is greater than size.");
    }
    return (*this)[n];
  }
  reference at(size_type n) {
    auto const& cThis = *this;
    return const_cast<reference>(cThis.at(n));
  }
  reference front() {
    assert(!empty());
    return *impl_.b_;
  }
  const_reference front() const {
    assert(!empty());
    return *impl_.b_;
  }
  reference back()  {
    assert(!empty());
    return impl_.e_[-1];
  }
  const_reference back() const {
    assert(!empty());
    return impl_.e_[-1];
  }

  //===========================================================================
  //---------------------------------------------------------------------------
  // data access
public:

  T* data() noexcept {
    return impl_.b_;
  }
  const T* data() const noexcept {
    return impl_.b_;
  }

  //===========================================================================
  //---------------------------------------------------------------------------
  // modifiers (common)
public:

  template <class... Args>
  void emplace_back(Args&&... args)  {
    if (impl_.e_ != impl_.z_) {
      M_construct(impl_.e_, std::forward<Args>(args)...);
      ++impl_.e_;
    } else {
      emplace_back_aux(std::forward<Args>(args)...);
    }
  }

  void push_back(const T& value) {
    if (impl_.e_ != impl_.z_) {
      M_construct(impl_.e_, value);
      ++impl_.e_;
    } else {
      emplace_back_aux(value);
    }
  }

  void push_back(T&& value) {
    if (impl_.e_ != impl_.z_) {
      M_construct(impl_.e_, std::move(value));
      ++impl_.e_;
    } else {
      emplace_back_aux(std::move(value));
    }
  }

  void pop_back() {
    assert(!empty());
    --impl_.e_;
    M_destroy(impl_.e_);
  }

  void swap(fbvector& other) noexcept {
    if (!usingStdAllocator::value &&
        A::propagate_on_container_swap::value)
      swap(impl_, other.impl_);
    else impl_.swapData(other.impl_);
  }

  void clear() noexcept {
    M_destroy_range_e(impl_.b_);
  }

private:

  // std::vector implements a similar function with a different growth
  //  strategy: empty() ? 1 : capacity() * 2.
  //
  // fbvector grows differently on two counts:
  //
  //  (1) initial size
  //      Instead of growing to size 1 from empty, fbvector allocates at least
  //      64 bytes. You may still use reserve to reserve a lesser amount of
  //      memory.
  //  (2) 1.5x
  //      For medium-sized vectors, the growth strategy is 1.5x. See the docs
  //      for details.
  //      This does not apply to very small or very large fbvectors. This is a
  //      heuristic.
  //      A nice addition to fbvector would be the capability of having a user-
  //      defined growth strategy, probably as part of the allocator.
  //

  size_type computePushBackCapacity() const {
    if (capacity() == 0) {
      return std::max(64 / sizeof(T), size_type(1));
    }
    if (capacity() < folly::jemallocMinInPlaceExpandable / sizeof(T)) {
      return capacity() * 2;
    }
    if (capacity() > 4096 * 32 / sizeof(T)) {
      return capacity() * 2;
    }
    return (capacity() * 3 + 1) / 2;
  }
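  // Worked example of the schedule above (a sketch; assumes sizeof(T) == 4
  //  and jemallocMinInPlaceExpandable == 4096 bytes):
  //
  //    capacity 0             -> 64 / 4 = 16 elements
  //    capacity 16 .. 1023    -> 2x   (16, 32, ..., 1024)
  //    capacity 1024 .. 32768 -> 1.5x (1024, 1536, 2304, ...)
  //    capacity  > 32768      -> 2x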
  template <class... Args>
  void emplace_back_aux(Args&&... args);

  //===========================================================================
  //---------------------------------------------------------------------------
  // modifiers (erase)
public:

  iterator erase(const_iterator position) {
    return erase(position, position + 1);
  }

  iterator erase(const_iterator first, const_iterator last) {
    assert(isValid(first) && isValid(last));
    assert(first <= last);
    if (first != last) {
      if (last == end()) {
        M_destroy_range_e((iterator)first);
      } else {
        if (folly::IsRelocatable<T>::value && usingStdAllocator::value) {
          D_destroy_range_a((iterator)first, (iterator)last);
          if (last - first >= cend() - last) {
            std::memcpy((void*)first, (void*)last,
                        (cend() - last) * sizeof(T));
          } else {
            std::memmove((iterator)first, last, (cend() - last) * sizeof(T));
          }
          impl_.e_ -= (last - first);
        } else {
          std::copy(std::make_move_iterator((iterator)last),
                    std::make_move_iterator(end()), (iterator)first);
          auto newEnd = impl_.e_ - std::distance(first, last);
          M_destroy_range_e(newEnd);
        }
      }
    }
    return (iterator)first;
  }

  //===========================================================================
  //---------------------------------------------------------------------------
  // modifiers (insert)
private: // we have the private section first because it defines some macros

  bool isValid(const_iterator it) {
    return cbegin() <= it && it <= cend();
  }

  size_type computeInsertCapacity(size_type n) {
    size_type nc = std::max(computePushBackCapacity(), size() + n);
    size_type ac = folly::goodMallocSize(nc * sizeof(T)) / sizeof(T);
    return ac;
  }

  //---------------------------------------------------------------------------
  //
  // make_window takes an fbvector, and creates an uninitialized gap (a
  //  window) at the given position, of the given size. The fbvector must
  //  have enough capacity.
  //
  // Explanation by picture.
  //
  //    123456789______
  //        ^
  //        make_window here of size 3
  //
  //    1234___56789___
  //
  // If something goes wrong and the window must be destroyed, use
  //  undo_window to provide a weak exception guarantee. It destroys
  //  the right ledge.
  //
  //    1234___________
  //
  //---------------------------------------------------------------------------
  //
  // wrap_frame takes an inverse window and relocates an fbvector around it.
  //  The fbvector must have at least as many elements as the left ledge.
  //
  // Explanation by picture.
  //
  //        START
  //    fbvector:             inverse window:
  //    123456789______       _____abcde_______
  //                          [idx][ n ]
  //
  //        RESULT
  //    _______________       12345abcde6789___
  //
  //---------------------------------------------------------------------------
  //
  // insert_use_fresh_memory returns true iff the fbvector should use a fresh
  //  block of memory for the insertion. If the fbvector does not have enough
  //  spare capacity, then it must return true. Otherwise either true or false
  //  may be returned.
  //
  //---------------------------------------------------------------------------
  //
  // These three functions, make_window, wrap_frame, and
  //  insert_use_fresh_memory, can be combined into a uniform interface.
  //  Since that interface involves a lot of case-work, it is built into
  //  some macros: FOLLY_FBVECTOR_INSERT_(PRE|START|TRY|END)
  // Macros are used in an attempt to let GCC perform better optimizations,
  //  especially control flow optimization.
  //
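  //---------------------------------------------------------------------------
  //
  // End-to-end sketch of the fresh-memory case (illustrative): inserting
  //  n == 3 elements at idx == 4 of v == 123456789 with no spare capacity:
  //
  //    1. PRE/START: allocate a new block b of computeInsertCapacity(3)
  //    2. construct the new elements abc at b + 4 .. b + 6
  //    3. END: wrap_frame relocates 1234 to b and 56789 to b + 7,
  //       giving 1234abc56789; the old block is then deallocated
  //
  //  In the in-place case, make_window opens the gap inside the existing
  //  block instead, and the new elements are constructed into the window.
  //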
  //---------------------------------------------------------------------------
  // window

  void make_window(iterator position, size_type n) {
    // The result is guaranteed to be non-negative, so use an unsigned type:
    size_type tail = std::distance(position, impl_.e_);

    if (tail <= n) {
      relocate_move(position + n, position, impl_.e_);
      relocate_done(position + n, position, impl_.e_);
      impl_.e_ += n;
    } else {
      if (folly::IsRelocatable<T>::value && usingStdAllocator::value) {
        std::memmove(position + n, position, tail * sizeof(T));
        impl_.e_ += n;
      } else {
        D_uninitialized_move_a(impl_.e_, impl_.e_ - n, impl_.e_);
        try {
          std::copy_backward(std::make_move_iterator(position),
                             std::make_move_iterator(impl_.e_ - n), impl_.e_);
        } catch (...) {
          D_destroy_range_a(impl_.e_ - n, impl_.e_ + n);
          impl_.e_ -= n;
          throw;
        }
        impl_.e_ += n;
        D_destroy_range_a(position, position + n);
      }
    }
  }

  void undo_window(iterator position, size_type n) noexcept {
    D_destroy_range_a(position + n, impl_.e_);
    impl_.e_ = position;
  }

  //---------------------------------------------------------------------------
  // frame

  void wrap_frame(T* ledge, size_type idx, size_type n) {
    assert(size() >= idx);
    assert(n != 0);

    relocate_move(ledge, impl_.b_, impl_.b_ + idx);
    try {
      relocate_move(ledge + idx + n, impl_.b_ + idx, impl_.e_);
    } catch (...) {
      relocate_undo(ledge, impl_.b_, impl_.b_ + idx);
      throw;
    }
    relocate_done(ledge, impl_.b_, impl_.b_ + idx);
    relocate_done(ledge + idx + n, impl_.b_ + idx, impl_.e_);
  }

  //---------------------------------------------------------------------------
  // use fresh?

  bool insert_use_fresh(bool at_end, size_type n) {
    if (at_end) {
      if (size() + n <= capacity()) return false;
      if (reserve_in_place(size() + n)) return false;
      return true;
    }

    if (size() + n > capacity()) return true;

    return false;
  }

  //---------------------------------------------------------------------------
  // interface

  #define FOLLY_FBVECTOR_INSERT_PRE(cpos, n)                                  \
    if (n == 0) return (iterator)cpos;                                        \
    bool at_end = cpos == cend();                                             \
    bool fresh = insert_use_fresh(at_end, n);                                 \
    if (!at_end) {                                                            \
      if (!fresh) {

    // check for internal data (technically not required by the standard)

  #define FOLLY_FBVECTOR_INSERT_START(cpos, n)                                \
      }                                                                       \
      assert(isValid(cpos));                                                  \
    }                                                                         \
    T* position = const_cast<T*>(cpos);                                       \
    size_type idx = std::distance(impl_.b_, position);                        \
    T* b;                                                                     \
    size_type newCap; /* intentionally uninitialized */                       \
                                                                              \
    if (fresh) {                                                              \
      newCap = computeInsertCapacity(n);                                      \
      b = M_allocate(newCap);                                                 \
    } else {                                                                  \
      if (!at_end) {                                                          \
        make_window(position, n);                                             \
      } else {                                                                \
        impl_.e_ += n;                                                        \
      }                                                                       \
      b = impl_.b_;                                                           \
    }                                                                         \
                                                                              \
    T* start = b + idx;                                                       \
                                                                              \
    try {

    // construct the inserted elements

  #define FOLLY_FBVECTOR_INSERT_TRY(cpos, n)                                  \
    } catch (...) {                                                           \
      if (fresh) {                                                            \
        M_deallocate(b, newCap);                                              \
      } else {                                                                \
        if (!at_end) {                                                        \
          undo_window(position, n);                                           \
        } else {                                                              \
          impl_.e_ -= n;                                                      \
        }                                                                     \
      }                                                                       \
      throw;                                                                  \
    }                                                                         \
                                                                              \
    if (fresh) {                                                              \
      try {                                                                   \
        wrap_frame(b, idx, n);                                                \
      } catch (...) {

    // delete the inserted elements (exception has been thrown)

  #define FOLLY_FBVECTOR_INSERT_END(cpos, n)                                  \
        M_deallocate(b, newCap);                                              \
        throw;                                                                \
      }                                                                       \
      if (impl_.b_) M_deallocate(impl_.b_, capacity());                       \
      impl_.set(b, size() + n, newCap);                                       \
      return impl_.b_ + idx;                                                  \
    } else {                                                                  \
      return position;                                                        \
    }                                                                         \
  //---------------------------------------------------------------------------
  // insert functions
public:

  template <class... Args>
  iterator emplace(const_iterator cpos, Args&&... args) {
    FOLLY_FBVECTOR_INSERT_PRE(cpos, 1)
    FOLLY_FBVECTOR_INSERT_START(cpos, 1)
    M_construct(start, std::forward<Args>(args)...);
    FOLLY_FBVECTOR_INSERT_TRY(cpos, 1)
    M_destroy(start);
    FOLLY_FBVECTOR_INSERT_END(cpos, 1)
  }

  iterator insert(const_iterator cpos, const T& value) {
    FOLLY_FBVECTOR_INSERT_PRE(cpos, 1)
    if (dataIsInternal(value)) return insert(cpos, T(value));
    FOLLY_FBVECTOR_INSERT_START(cpos, 1)
    M_construct(start, value);
    FOLLY_FBVECTOR_INSERT_TRY(cpos, 1)
    M_destroy(start);
    FOLLY_FBVECTOR_INSERT_END(cpos, 1)
  }

  iterator insert(const_iterator cpos, T&& value) {
    FOLLY_FBVECTOR_INSERT_PRE(cpos, 1)
    if (dataIsInternal(value)) return insert(cpos, T(std::move(value)));
    FOLLY_FBVECTOR_INSERT_START(cpos, 1)
    M_construct(start, std::move(value));
    FOLLY_FBVECTOR_INSERT_TRY(cpos, 1)
    M_destroy(start);
    FOLLY_FBVECTOR_INSERT_END(cpos, 1)
  }

  iterator insert(const_iterator cpos, size_type n, VT value) {
    FOLLY_FBVECTOR_INSERT_PRE(cpos, n)
    if (dataIsInternalAndNotVT(value)) return insert(cpos, n, T(value));
    FOLLY_FBVECTOR_INSERT_START(cpos, n)
    D_uninitialized_fill_n_a(start, n, value);
    FOLLY_FBVECTOR_INSERT_TRY(cpos, n)
    D_destroy_range_a(start, start + n);
    FOLLY_FBVECTOR_INSERT_END(cpos, n)
  }

  template <class It, class Category = typename
            std::iterator_traits<It>::iterator_category>
  iterator insert(const_iterator cpos, It first, It last) {
    return insert(cpos, first, last, Category());
  }

  iterator insert(const_iterator cpos, std::initializer_list<T> il) {
    return insert(cpos, il.begin(), il.end());
  }

  //---------------------------------------------------------------------------
  // insert dispatch for iterator types
private:

  template <class FIt>
  iterator insert(const_iterator cpos, FIt first, FIt last,
                  std::forward_iterator_tag) {
    size_type n = std::distance(first, last);
    FOLLY_FBVECTOR_INSERT_PRE(cpos, n)
    FOLLY_FBVECTOR_INSERT_START(cpos, n)
    D_uninitialized_copy_a(start, first, last);
    FOLLY_FBVECTOR_INSERT_TRY(cpos, n)
    D_destroy_range_a(start, start + n);
    FOLLY_FBVECTOR_INSERT_END(cpos, n)
  }

  template <class IIt>
  iterator insert(const_iterator cpos, IIt first, IIt last,
                  std::input_iterator_tag) {
    T* position = const_cast<T*>(cpos);
    assert(isValid(position));
    size_type idx = std::distance(begin(), position);

    fbvector storage(std::make_move_iterator(position),
                     std::make_move_iterator(end()),
                     A::select_on_container_copy_construction(impl_));
    M_destroy_range_e(position);
    for (; first != last; ++first) emplace_back(*first);
    insert(cend(), std::make_move_iterator(storage.begin()),
           std::make_move_iterator(storage.end()));
    return impl_.b_ + idx;
  }

  //===========================================================================
  //---------------------------------------------------------------------------
  // lexicographical functions (others from boost::totally_ordered superclass)
public:

  bool operator==(const fbvector& other) const {
    return size() == other.size() && std::equal(begin(), end(), other.begin());
  }

  bool operator<(const fbvector& other) const {
    return std::lexicographical_compare(
      begin(), end(), other.begin(), other.end());
  }

  //===========================================================================
  //---------------------------------------------------------------------------
  // friends
private:

  template <class _T, class _A>
  friend _T* relinquish(fbvector<_T, _A>&);

  template <class _T, class _A>
  friend void attach(fbvector<_T, _A>&, _T* data, size_t sz, size_t cap);

}; // class fbvector
//=============================================================================
//-----------------------------------------------------------------------------
// outlined functions (gcc, you finicky compiler you)

template <class T, class Allocator>
template <class... Args>
void fbvector<T, Allocator>::emplace_back_aux(Args&&... args) {
  size_type byte_sz = folly::goodMallocSize(
    computePushBackCapacity() * sizeof(T));
  if (usingStdAllocator::value && usingJEMalloc() &&
      ((impl_.z_ - impl_.b_) * sizeof(T) >=
       folly::jemallocMinInPlaceExpandable)) {
    // Try to reserve in place.
    // Ask xallocx to allocate in place at least size()+1 and at most sz space.
    // xallocx will allocate as much as possible within that range, which
    //  is the best possible outcome: if sz space is available, take it all,
    //  otherwise take as much as possible. If nothing is available, then fail.
    // In this fashion, we never relocate if there is a possibility of
    //  expanding in place, and we never reallocate by less than the desired
    //  amount unless we cannot expand further. Hence we will not reallocate
    //  sub-optimally twice in a row (modulo the blocking memory being freed).
    size_type lower = folly::goodMallocSize(sizeof(T) + size() * sizeof(T));
    size_type upper = byte_sz;
    size_type extra = upper - lower;

    void* p = impl_.b_;
    size_t actual;

    if ((actual = xallocx(p, lower, extra, 0)) >= lower) {
      impl_.z_ = impl_.b_ + actual / sizeof(T);
      M_construct(impl_.e_, std::forward<Args>(args)...);
      ++impl_.e_;
      return;
    }
  }

  // Reallocation failed. Perform a manual relocation.
  size_type sz = byte_sz / sizeof(T);
  auto newB = M_allocate(sz);
  auto newE = newB + size();
  try {
    if (folly::IsRelocatable<T>::value && usingStdAllocator::value) {
      // For linear memory access, relocate before construction.
      // By the test condition, relocate is noexcept.
      // Note that there is no cleanup to do if M_construct throws - that's
      //  one of the beauties of relocation.
      // Benchmarks for this code have high variance, and seem to be close.
      relocate_move(newB, impl_.b_, impl_.e_);
      M_construct(newE, std::forward<Args>(args)...);
      ++newE;
    } else {
      M_construct(newE, std::forward<Args>(args)...);
      ++newE;
      try {
        M_relocate(newB);
      } catch (...) {
        M_destroy(newE - 1);
        throw;
      }
    }
  } catch (...) {
    M_deallocate(newB, sz);
    throw;
  }
  if (impl_.b_) M_deallocate(impl_.b_, size());
  impl_.b_ = newB;
  impl_.e_ = newE;
  impl_.z_ = newB + sz;
}

//=============================================================================
//-----------------------------------------------------------------------------
// specialized functions

template <class T, class A>
void swap(fbvector<T, A>& lhs, fbvector<T, A>& rhs) noexcept {
  lhs.swap(rhs);
}

//=============================================================================
//-----------------------------------------------------------------------------
// other

namespace detail {

// Format support.
template <class T, class A>
struct IndexableTraits<fbvector<T, A>>
  : public IndexableTraitsSeq<fbvector<T, A>> {
};

} // namespace detail

template <class T, class A>
void compactResize(fbvector<T, A>* v, size_t sz) {
  v->resize(sz);
  v->shrink_to_fit();
}
// DANGER
//
// relinquish and attach are not member functions specifically so that it is
//  awkward to call them. It is very easy to shoot yourself in the foot with
//  these functions.
//
// If you call relinquish, then it is your responsibility to free the data
//  and the storage, both of which may have been generated in a non-standard
//  way through the fbvector's allocator.
//
// If you call attach, it is your responsibility to ensure that the fbvector
//  is fresh (size and capacity both zero), and that the supplied data is
//  capable of being manipulated by the allocator.
// It is acceptable to supply a stack pointer IF:
//  (1) The vector's data does not outlive the stack pointer. This includes
//      extension of the data's life through a move operation.
//  (2) The pointer has enough capacity that the vector will never be
//      relocated.
//  (3) Insert is not called on the vector; these functions have leeway to
//      relocate the vector even if there is enough capacity.
//  (4) A stack pointer is compatible with the fbvector's allocator.
//

template <class T, class A>
T* relinquish(fbvector<T, A>& v) {
  T* ret = v.data();
  v.impl_.b_ = v.impl_.e_ = v.impl_.z_ = nullptr;
  return ret;
}

template <class T, class A>
void attach(fbvector<T, A>& v, T* data, size_t sz, size_t cap) {
  assert(v.data() == nullptr);
  v.impl_.b_ = data;
  v.impl_.e_ = data + sz;
  v.impl_.z_ = data + cap;
}

} // namespace folly
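// Example handoff via relinquish (an illustrative sketch; with the default
//  allocator the buffer came from malloc, so after destroying the elements
//  it must be released with free()):
//
//   folly::fbvector<int> v = {1, 2, 3};
//   size_t n = v.size();
//   int* p = relinquish(v);   // v is now empty; the caller owns p
//   // ... use p[0] .. p[n-1] ...
//   free(p);                  // int is trivially destructible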