Skip to content

Commit ceaf011

Browse files
committed
Revert "Revert "ADT: Fix reference invalidation in SmallVector...""
This reverts commit 33be50d, effectively reapplying: - 260a856 - 3043e5a - 4914299 ... with a fix to skip a call to `SmallVector::isReferenceToStorage()` when we know the parameter had been taken by value for small, POD-like `T`. See https://reviews.llvm.org/D93779 for the discussion on the revert. At a high-level, these commits fix reference invalidation in SmallVector's push_back, append, insert (one or N), and resize operations. For more details, please see the original commit messages. This commit fixes a bug that crept into `SmallVectorTemplateCommon::reserveForAndGetAddress()` during the review process after performance analysis was done. That function is now called `reserveForParamAndGetAddress()`, clarifying that it only works for parameter values. It uses that knowledge to bypass `SmallVector::isReferenceToStorage()` when `TakesParamByValue`. This is `constexpr` and avoids adding overhead for "small enough", trivially copyable `T`. Performance could potentially be tuned further by increasing the threshold for `TakesParamByValue`, which is currently defined as: ``` bool TakesParamByValue = sizeof(T) <= 2 * sizeof(void *); ``` in the POD-like version of SmallVectorTemplateBase (else, `false`). Differential Revision: https://reviews.llvm.org/D94800
1 parent ceb3cdc commit ceaf011

File tree

2 files changed

+245
-75
lines changed

2 files changed

+245
-75
lines changed

llvm/include/llvm/ADT/SmallVector.h

+121-47
Original file line numberDiff line numberDiff line change
@@ -220,6 +220,27 @@ class SmallVectorTemplateCommon
220220
}
221221
void assertSafeToEmplace() {}
222222

223+
/// Reserve enough space to add one element, and return the updated element
224+
/// pointer in case it was a reference to the storage.
225+
template <class U>
226+
static const T *reserveForParamAndGetAddressImpl(U *This, const T &Elt,
227+
size_t N) {
228+
size_t NewSize = This->size() + N;
229+
if (LLVM_LIKELY(NewSize <= This->capacity()))
230+
return &Elt;
231+
232+
bool ReferencesStorage = false;
233+
int64_t Index = -1;
234+
if (!U::TakesParamByValue) {
235+
if (LLVM_UNLIKELY(This->isReferenceToStorage(&Elt))) {
236+
ReferencesStorage = true;
237+
Index = &Elt - This->begin();
238+
}
239+
}
240+
This->grow(NewSize);
241+
return ReferencesStorage ? This->begin() + Index : &Elt;
242+
}
243+
223244
public:
224245
using size_type = size_t;
225246
using difference_type = ptrdiff_t;
@@ -303,7 +324,12 @@ template <typename T, bool = (is_trivially_copy_constructible<T>::value) &&
303324
(is_trivially_move_constructible<T>::value) &&
304325
std::is_trivially_destructible<T>::value>
305326
class SmallVectorTemplateBase : public SmallVectorTemplateCommon<T> {
327+
friend class SmallVectorTemplateCommon<T>;
328+
306329
protected:
330+
static constexpr bool TakesParamByValue = false;
331+
using ValueParamT = const T &;
332+
307333
SmallVectorTemplateBase(size_t Size) : SmallVectorTemplateCommon<T>(Size) {}
308334

309335
static void destroy_range(T *S, T *E) {
@@ -333,20 +359,32 @@ class SmallVectorTemplateBase : public SmallVectorTemplateCommon<T> {
333359
/// element, or MinSize more elements if specified.
334360
void grow(size_t MinSize = 0);
335361

362+
/// Reserve enough space to add one element, and return the updated element
363+
/// pointer in case it was a reference to the storage.
364+
const T *reserveForParamAndGetAddress(const T &Elt, size_t N = 1) {
365+
return this->reserveForParamAndGetAddressImpl(this, Elt, N);
366+
}
367+
368+
/// Reserve enough space to add one element, and return the updated element
369+
/// pointer in case it was a reference to the storage.
370+
T *reserveForParamAndGetAddress(T &Elt, size_t N = 1) {
371+
return const_cast<T *>(
372+
this->reserveForParamAndGetAddressImpl(this, Elt, N));
373+
}
374+
375+
static T &&forward_value_param(T &&V) { return std::move(V); }
376+
static const T &forward_value_param(const T &V) { return V; }
377+
336378
public:
337379
void push_back(const T &Elt) {
338-
this->assertSafeToAdd(&Elt);
339-
if (LLVM_UNLIKELY(this->size() >= this->capacity()))
340-
this->grow();
341-
::new ((void*) this->end()) T(Elt);
380+
const T *EltPtr = reserveForParamAndGetAddress(Elt);
381+
::new ((void *)this->end()) T(*EltPtr);
342382
this->set_size(this->size() + 1);
343383
}
344384

345385
void push_back(T &&Elt) {
346-
this->assertSafeToAdd(&Elt);
347-
if (LLVM_UNLIKELY(this->size() >= this->capacity()))
348-
this->grow();
349-
::new ((void*) this->end()) T(::std::move(Elt));
386+
T *EltPtr = reserveForParamAndGetAddress(Elt);
387+
::new ((void *)this->end()) T(::std::move(*EltPtr));
350388
this->set_size(this->size() + 1);
351389
}
352390

@@ -396,7 +434,18 @@ void SmallVectorTemplateBase<T, TriviallyCopyable>::grow(size_t MinSize) {
396434
/// skipping destruction.
397435
template <typename T>
398436
class SmallVectorTemplateBase<T, true> : public SmallVectorTemplateCommon<T> {
437+
friend class SmallVectorTemplateCommon<T>;
438+
399439
protected:
440+
/// True if it's cheap enough to take parameters by value. Doing so avoids
441+
/// overhead related to mitigations for reference invalidation.
442+
static constexpr bool TakesParamByValue = sizeof(T) <= 2 * sizeof(void *);
443+
444+
/// Either const T& or T, depending on whether it's cheap enough to take
445+
/// parameters by value.
446+
using ValueParamT =
447+
typename std::conditional<TakesParamByValue, T, const T &>::type;
448+
400449
SmallVectorTemplateBase(size_t Size) : SmallVectorTemplateCommon<T>(Size) {}
401450

402451
// No need to do a destroy loop for POD's.
@@ -437,12 +486,26 @@ class SmallVectorTemplateBase<T, true> : public SmallVectorTemplateCommon<T> {
437486
/// least one more element or MinSize if specified.
438487
void grow(size_t MinSize = 0) { this->grow_pod(MinSize, sizeof(T)); }
439488

489+
/// Reserve enough space to add one element, and return the updated element
490+
/// pointer in case it was a reference to the storage.
491+
const T *reserveForParamAndGetAddress(const T &Elt, size_t N = 1) {
492+
return this->reserveForParamAndGetAddressImpl(this, Elt, N);
493+
}
494+
495+
/// Reserve enough space to add one element, and return the updated element
496+
/// pointer in case it was a reference to the storage.
497+
T *reserveForParamAndGetAddress(T &Elt, size_t N = 1) {
498+
return const_cast<T *>(
499+
this->reserveForParamAndGetAddressImpl(this, Elt, N));
500+
}
501+
502+
/// Copy \p V or return a reference, depending on \a ValueParamT.
503+
static ValueParamT forward_value_param(ValueParamT V) { return V; }
504+
440505
public:
441-
void push_back(const T &Elt) {
442-
this->assertSafeToAdd(&Elt);
443-
if (LLVM_UNLIKELY(this->size() >= this->capacity()))
444-
this->grow();
445-
memcpy(reinterpret_cast<void *>(this->end()), &Elt, sizeof(T));
506+
void push_back(ValueParamT Elt) {
507+
const T *EltPtr = reserveForParamAndGetAddress(Elt);
508+
memcpy(reinterpret_cast<void *>(this->end()), EltPtr, sizeof(T));
446509
this->set_size(this->size() + 1);
447510
}
448511

@@ -462,6 +525,9 @@ class SmallVectorImpl : public SmallVectorTemplateBase<T> {
462525
using size_type = typename SuperClass::size_type;
463526

464527
protected:
528+
using SmallVectorTemplateBase<T>::TakesParamByValue;
529+
using ValueParamT = typename SuperClass::ValueParamT;
530+
465531
// Default ctor - Initialize to empty.
466532
explicit SmallVectorImpl(unsigned N)
467533
: SmallVectorTemplateBase<T>(N) {}
@@ -502,7 +568,7 @@ class SmallVectorImpl : public SmallVectorTemplateBase<T> {
502568
/// Like resize, but \ref T is POD, the new values won't be initialized.
503569
void resize_for_overwrite(size_type N) { resizeImpl<true>(N); }
504570

505-
void resize(size_type N, const T &NV) {
571+
void resize(size_type N, ValueParamT NV) {
506572
if (N == this->size())
507573
return;
508574

@@ -511,11 +577,8 @@ class SmallVectorImpl : public SmallVectorTemplateBase<T> {
511577
return;
512578
}
513579

514-
this->assertSafeToReferenceAfterResize(&NV, N);
515-
if (this->capacity() < N)
516-
this->grow(N);
517-
std::uninitialized_fill(this->end(), this->begin() + N, NV);
518-
this->set_size(N);
580+
// N > this->size(). Defer to append.
581+
this->append(N - this->size(), NV);
519582
}
520583

521584
void reserve(size_type N) {
@@ -551,12 +614,9 @@ class SmallVectorImpl : public SmallVectorTemplateBase<T> {
551614
}
552615

553616
/// Append \p NumInputs copies of \p Elt to the end.
554-
void append(size_type NumInputs, const T &Elt) {
555-
this->assertSafeToAdd(&Elt, NumInputs);
556-
if (NumInputs > this->capacity() - this->size())
557-
this->grow(this->size()+NumInputs);
558-
559-
std::uninitialized_fill_n(this->end(), NumInputs, Elt);
617+
void append(size_type NumInputs, ValueParamT Elt) {
618+
const T *EltPtr = this->reserveForParamAndGetAddress(Elt, NumInputs);
619+
std::uninitialized_fill_n(this->end(), NumInputs, *EltPtr);
560620
this->set_size(this->size() + NumInputs);
561621
}
562622

@@ -622,31 +682,35 @@ class SmallVectorImpl : public SmallVectorTemplateBase<T> {
622682

623683
private:
624684
template <class ArgType> iterator insert_one_impl(iterator I, ArgType &&Elt) {
685+
// Callers ensure that ArgType is derived from T.
686+
static_assert(
687+
std::is_same<std::remove_const_t<std::remove_reference_t<ArgType>>,
688+
T>::value,
689+
"ArgType must be derived from T!");
690+
625691
if (I == this->end()) { // Important special case for empty vector.
626692
this->push_back(::std::forward<ArgType>(Elt));
627693
return this->end()-1;
628694
}
629695

630696
assert(this->isReferenceToStorage(I) && "Insertion iterator is out of bounds.");
631697

632-
// Check that adding an element won't invalidate Elt.
633-
this->assertSafeToAdd(&Elt);
634-
635-
if (this->size() >= this->capacity()) {
636-
size_t EltNo = I-this->begin();
637-
this->grow();
638-
I = this->begin()+EltNo;
639-
}
698+
// Grow if necessary.
699+
size_t Index = I - this->begin();
700+
std::remove_reference_t<ArgType> *EltPtr =
701+
this->reserveForParamAndGetAddress(Elt);
702+
I = this->begin() + Index;
640703

641704
::new ((void*) this->end()) T(::std::move(this->back()));
642705
// Push everything else over.
643706
std::move_backward(I, this->end()-1, this->end());
644707
this->set_size(this->size() + 1);
645708

646709
// If we just moved the element we're inserting, be sure to update
647-
// the reference.
648-
std::remove_reference_t<ArgType> *EltPtr = &Elt;
649-
if (this->isReferenceToRange(EltPtr, I, this->end()))
710+
// the reference (never happens if TakesParamByValue).
711+
static_assert(!TakesParamByValue || std::is_same<ArgType, T>::value,
712+
"ArgType must be 'T' when taking by value!");
713+
if (!TakesParamByValue && this->isReferenceToRange(EltPtr, I, this->end()))
650714
++EltPtr;
651715

652716
*I = ::std::forward<ArgType>(*EltPtr);
@@ -655,12 +719,14 @@ class SmallVectorImpl : public SmallVectorTemplateBase<T> {
655719

656720
public:
657721
iterator insert(iterator I, T &&Elt) {
658-
return insert_one_impl(I, std::move(Elt));
722+
return insert_one_impl(I, this->forward_value_param(std::move(Elt)));
659723
}
660724

661-
iterator insert(iterator I, const T &Elt) { return insert_one_impl(I, Elt); }
725+
iterator insert(iterator I, const T &Elt) {
726+
return insert_one_impl(I, this->forward_value_param(Elt));
727+
}
662728

663-
iterator insert(iterator I, size_type NumToInsert, const T &Elt) {
729+
iterator insert(iterator I, size_type NumToInsert, ValueParamT Elt) {
664730
// Convert iterator to elt# to avoid invalidating iterator when we reserve()
665731
size_t InsertElt = I - this->begin();
666732

@@ -671,11 +737,9 @@ class SmallVectorImpl : public SmallVectorTemplateBase<T> {
671737

672738
assert(this->isReferenceToStorage(I) && "Insertion iterator is out of bounds.");
673739

674-
// Check that adding NumToInsert elements won't invalidate Elt.
675-
this->assertSafeToAdd(&Elt, NumToInsert);
676-
677-
// Ensure there is enough space.
678-
reserve(this->size() + NumToInsert);
740+
// Ensure there is enough space, and get the (maybe updated) address of
741+
// Elt.
742+
const T *EltPtr = this->reserveForParamAndGetAddress(Elt, NumToInsert);
679743

680744
// Uninvalidate the iterator.
681745
I = this->begin()+InsertElt;
@@ -692,7 +756,12 @@ class SmallVectorImpl : public SmallVectorTemplateBase<T> {
692756
// Copy the existing elements that get replaced.
693757
std::move_backward(I, OldEnd-NumToInsert, OldEnd);
694758

695-
std::fill_n(I, NumToInsert, Elt);
759+
// If we just moved the element we're inserting, be sure to update
760+
// the reference (never happens if TakesParamByValue).
761+
if (!TakesParamByValue && I <= EltPtr && EltPtr < this->end())
762+
EltPtr += NumToInsert;
763+
764+
std::fill_n(I, NumToInsert, *EltPtr);
696765
return I;
697766
}
698767

@@ -705,11 +774,16 @@ class SmallVectorImpl : public SmallVectorTemplateBase<T> {
705774
size_t NumOverwritten = OldEnd-I;
706775
this->uninitialized_move(I, OldEnd, this->end()-NumOverwritten);
707776

777+
// If we just moved the element we're inserting, be sure to update
778+
// the reference (never happens if TakesParamByValue).
779+
if (!TakesParamByValue && I <= EltPtr && EltPtr < this->end())
780+
EltPtr += NumToInsert;
781+
708782
// Replace the overwritten part.
709-
std::fill_n(I, NumOverwritten, Elt);
783+
std::fill_n(I, NumOverwritten, *EltPtr);
710784

711785
// Insert the non-overwritten middle part.
712-
std::uninitialized_fill_n(OldEnd, NumToInsert-NumOverwritten, Elt);
786+
std::uninitialized_fill_n(OldEnd, NumToInsert - NumOverwritten, *EltPtr);
713787
return I;
714788
}
715789

0 commit comments

Comments
 (0)