From 8dd9615dfbd148993964ea6f2de6c6a94f49660c Mon Sep 17 00:00:00 2001 From: ChiaHungDuan Date: Mon, 9 Oct 2023 13:54:27 -0700 Subject: [PATCH] =?UTF-8?q?Revert=20"[scudo]=20Make=20local=20cache=20be?= =?UTF-8?q?=20agnostic=20to=20the=20type=20of=20node=20in=20f=E2=80=A6=20(?= =?UTF-8?q?#68626)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit …reelist (#67379)" This reverts commit b9c6737ba7307308ecb6ec4cecc4c07e48e7c141. --- .../lib/scudo/standalone/CMakeLists.txt | 1 - .../lib/scudo/standalone/allocator_common.h | 85 -------------- .../lib/scudo/standalone/local_cache.h | 110 +++++++++++++++--- compiler-rt/lib/scudo/standalone/primary32.h | 41 ++----- compiler-rt/lib/scudo/standalone/primary64.h | 41 ++----- .../scudo/standalone/tests/primary_test.cpp | 7 +- 6 files changed, 118 insertions(+), 167 deletions(-) delete mode 100644 compiler-rt/lib/scudo/standalone/allocator_common.h diff --git a/compiler-rt/lib/scudo/standalone/CMakeLists.txt b/compiler-rt/lib/scudo/standalone/CMakeLists.txt index c4d3ea1e4f05ba..2b7a613066b83b 100644 --- a/compiler-rt/lib/scudo/standalone/CMakeLists.txt +++ b/compiler-rt/lib/scudo/standalone/CMakeLists.txt @@ -56,7 +56,6 @@ if(ANDROID) endif() set(SCUDO_HEADERS - allocator_common.h allocator_config.h atomic_helpers.h bytemap.h diff --git a/compiler-rt/lib/scudo/standalone/allocator_common.h b/compiler-rt/lib/scudo/standalone/allocator_common.h deleted file mode 100644 index 95f4776ac596dc..00000000000000 --- a/compiler-rt/lib/scudo/standalone/allocator_common.h +++ /dev/null @@ -1,85 +0,0 @@ -//===-- allocator_common.h --------------------------------------*- C++ -*-===// -// -// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. -// See https://llvm.org/LICENSE.txt for license information. -// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception -// -//===----------------------------------------------------------------------===// - -#ifndef SCUDO_ALLOCATOR_COMMON_H_ -#define SCUDO_ALLOCATOR_COMMON_H_ - -#include "common.h" -#include "list.h" - -namespace scudo { - -template struct TransferBatch { - typedef typename SizeClassAllocator::SizeClassMap SizeClassMap; - typedef typename SizeClassAllocator::CompactPtrT CompactPtrT; - - static const u16 MaxNumCached = SizeClassMap::MaxNumCachedHint; - void setFromArray(CompactPtrT *Array, u16 N) { - DCHECK_LE(N, MaxNumCached); - Count = N; - memcpy(Batch, Array, sizeof(Batch[0]) * Count); - } - void appendFromArray(CompactPtrT *Array, u16 N) { - DCHECK_LE(N, MaxNumCached - Count); - memcpy(Batch + Count, Array, sizeof(Batch[0]) * N); - // u16 will be promoted to int by arithmetic type conversion. - Count = static_cast(Count + N); - } - void appendFromTransferBatch(TransferBatch *B, u16 N) { - DCHECK_LE(N, MaxNumCached - Count); - DCHECK_GE(B->Count, N); - // Append from the back of `B`. - memcpy(Batch + Count, B->Batch + (B->Count - N), sizeof(Batch[0]) * N); - // u16 will be promoted to int by arithmetic type conversion. - Count = static_cast(Count + N); - B->Count = static_cast(B->Count - N); - } - void clear() { Count = 0; } - void add(CompactPtrT P) { - DCHECK_LT(Count, MaxNumCached); - Batch[Count++] = P; - } - void moveToArray(CompactPtrT *Array) { - memcpy(Array, Batch, sizeof(Batch[0]) * Count); - clear(); - } - u16 getCount() const { return Count; } - bool isEmpty() const { return Count == 0U; } - CompactPtrT get(u16 I) const { - DCHECK_LE(I, Count); - return Batch[I]; - } - TransferBatch *Next; - -private: - CompactPtrT Batch[MaxNumCached]; - u16 Count; -}; - -// A BatchGroup is used to collect blocks. Each group has a group id to -// identify the group kind of contained blocks. -template struct BatchGroup { - // `Next` is used by IntrusiveList. - BatchGroup *Next; - // The compact base address of each group - uptr CompactPtrGroupBase; - // Cache value of SizeClassAllocatorLocalCache::getMaxCached() - u16 MaxCachedPerBatch; - // Number of blocks pushed into this group. This is an increment-only - // counter. - uptr PushedBlocks; - // This is used to track how many bytes are not in-use since last time we - // tried to release pages. - uptr BytesInBGAtLastCheckpoint; - // Blocks are managed by TransferBatch in a list. - SinglyLinkedList> Batches; -}; - -} // namespace scudo - -#endif // SCUDO_ALLOCATOR_COMMON_H_ diff --git a/compiler-rt/lib/scudo/standalone/local_cache.h b/compiler-rt/lib/scudo/standalone/local_cache.h index 8cb02abd16fd75..1095eb5f186d1e 100644 --- a/compiler-rt/lib/scudo/standalone/local_cache.h +++ b/compiler-rt/lib/scudo/standalone/local_cache.h @@ -22,6 +22,74 @@ template struct SizeClassAllocatorLocalCache { typedef typename SizeClassAllocator::SizeClassMap SizeClassMap; typedef typename SizeClassAllocator::CompactPtrT CompactPtrT; + struct TransferBatch { + static const u16 MaxNumCached = SizeClassMap::MaxNumCachedHint; + void setFromArray(CompactPtrT *Array, u16 N) { + DCHECK_LE(N, MaxNumCached); + Count = N; + memcpy(Batch, Array, sizeof(Batch[0]) * Count); + } + void appendFromArray(CompactPtrT *Array, u16 N) { + DCHECK_LE(N, MaxNumCached - Count); + memcpy(Batch + Count, Array, sizeof(Batch[0]) * N); + // u16 will be promoted to int by arithmetic type conversion. + Count = static_cast(Count + N); + } + void appendFromTransferBatch(TransferBatch *B, u16 N) { + DCHECK_LE(N, MaxNumCached - Count); + DCHECK_GE(B->Count, N); + // Append from the back of `B`. + memcpy(Batch + Count, B->Batch + (B->Count - N), sizeof(Batch[0]) * N); + // u16 will be promoted to int by arithmetic type conversion. + Count = static_cast(Count + N); + B->Count = static_cast(B->Count - N); + } + void clear() { Count = 0; } + void add(CompactPtrT P) { + DCHECK_LT(Count, MaxNumCached); + Batch[Count++] = P; + } + void copyToArray(CompactPtrT *Array) const { + memcpy(Array, Batch, sizeof(Batch[0]) * Count); + } + u16 getCount() const { return Count; } + bool isEmpty() const { return Count == 0U; } + CompactPtrT get(u16 I) const { + DCHECK_LE(I, Count); + return Batch[I]; + } + static u16 getMaxCached(uptr Size) { + return Min(MaxNumCached, SizeClassMap::getMaxCachedHint(Size)); + } + TransferBatch *Next; + + private: + CompactPtrT Batch[MaxNumCached]; + u16 Count; + }; + + // A BatchGroup is used to collect blocks. Each group has a group id to + // identify the group kind of contained blocks. + struct BatchGroup { + // `Next` is used by IntrusiveList. + BatchGroup *Next; + // The compact base address of each group + uptr CompactPtrGroupBase; + // Cache value of TransferBatch::getMaxCached() + u16 MaxCachedPerBatch; + // Number of blocks pushed into this group. This is an increment-only + // counter. + uptr PushedBlocks; + // This is used to track how many bytes are not in-use since last time we + // tried to release pages. + uptr BytesInBGAtLastCheckpoint; + // Blocks are managed by TransferBatch in a list. + SinglyLinkedList Batches; + }; + + static_assert(sizeof(BatchGroup) <= sizeof(TransferBatch), + "BatchGroup uses the same class size as TransferBatch"); + void init(GlobalStats *S, SizeClassAllocator *A) { DCHECK(isEmpty()); Stats.init(); @@ -83,7 +151,7 @@ template struct SizeClassAllocatorLocalCache { } void drain() { - // Drain BatchClassId last as it may be needed while draining normal blocks. + // Drain BatchClassId last as createBatch can refill it. for (uptr I = 0; I < NumClasses; ++I) { if (I == BatchClassId) continue; @@ -95,11 +163,19 @@ template struct SizeClassAllocatorLocalCache { DCHECK(isEmpty()); } - void *getBatchClassBlock() { - void *B = allocate(BatchClassId); + TransferBatch *createBatch(uptr ClassId, void *B) { + if (ClassId != BatchClassId) + B = allocate(BatchClassId); if (UNLIKELY(!B)) reportOutOfMemory(SizeClassAllocator::getSizeByClassId(BatchClassId)); - return B; + return reinterpret_cast(B); + } + + BatchGroup *createGroup() { + void *Ptr = allocate(BatchClassId); + if (UNLIKELY(!Ptr)) + reportOutOfMemory(SizeClassAllocator::getSizeByClassId(BatchClassId)); + return reinterpret_cast(Ptr); } LocalStats &getStats() { return Stats; } @@ -127,11 +203,6 @@ template struct SizeClassAllocatorLocalCache { Str->append(" No block is cached.\n"); } - static u16 getMaxCached(uptr Size) { - return Min(SizeClassMap::MaxNumCachedHint, - SizeClassMap::getMaxCachedHint(Size)); - } - private: static const uptr NumClasses = SizeClassMap::NumClasses; static const uptr BatchClassId = SizeClassMap::BatchClassId; @@ -140,7 +211,7 @@ template struct SizeClassAllocatorLocalCache { u16 MaxCount; // Note: ClassSize is zero for the transfer batch. uptr ClassSize; - CompactPtrT Chunks[2 * SizeClassMap::MaxNumCachedHint]; + CompactPtrT Chunks[2 * TransferBatch::MaxNumCached]; }; PerClass PerClassArray[NumClasses] = {}; LocalStats Stats; @@ -157,7 +228,7 @@ template struct SizeClassAllocatorLocalCache { for (uptr I = 0; I < NumClasses; I++) { PerClass *P = &PerClassArray[I]; const uptr Size = SizeClassAllocator::getSizeByClassId(I); - P->MaxCount = static_cast(2 * getMaxCached(Size)); + P->MaxCount = static_cast(2 * TransferBatch::getMaxCached(Size)); if (I != BatchClassId) { P->ClassSize = Size; } else { @@ -175,14 +246,15 @@ template struct SizeClassAllocatorLocalCache { NOINLINE bool refill(PerClass *C, uptr ClassId) { initCacheMaybe(C); - - // TODO(chiahungduan): Pass the max number cached for each size class. - const u16 NumBlocksRefilled = - Allocator->popBlocks(this, ClassId, C->Chunks); - DCHECK_LE(NumBlocksRefilled, - getMaxCached(SizeClassAllocator::getSizeByClassId(ClassId))); - C->Count += NumBlocksRefilled; - return NumBlocksRefilled != 0; + TransferBatch *B = Allocator->popBatch(this, ClassId); + if (UNLIKELY(!B)) + return false; + DCHECK_GT(B->getCount(), 0); + C->Count = B->getCount(); + B->copyToArray(C->Chunks); + B->clear(); + destroyBatch(ClassId, B); + return true; } NOINLINE void drain(PerClass *C, uptr ClassId) { diff --git a/compiler-rt/lib/scudo/standalone/primary32.h b/compiler-rt/lib/scudo/standalone/primary32.h index e153a3bf871cb9..533615ad3816d0 100644 --- a/compiler-rt/lib/scudo/standalone/primary32.h +++ b/compiler-rt/lib/scudo/standalone/primary32.h @@ -9,7 +9,6 @@ #ifndef SCUDO_PRIMARY32_H_ #define SCUDO_PRIMARY32_H_ -#include "allocator_common.h" #include "bytemap.h" #include "common.h" #include "list.h" @@ -54,11 +53,8 @@ template class SizeClassAllocator32 { ""); typedef SizeClassAllocator32 ThisT; typedef SizeClassAllocatorLocalCache CacheT; - typedef TransferBatch TransferBatch; - typedef BatchGroup BatchGroup; - - static_assert(sizeof(BatchGroup) <= sizeof(TransferBatch), - "BatchGroup uses the same class size as TransferBatch"); + typedef typename CacheT::TransferBatch TransferBatch; + typedef typename CacheT::BatchGroup BatchGroup; static uptr getSizeByClassId(uptr ClassId) { return (ClassId == SizeClassMap::BatchClassId) @@ -191,21 +187,6 @@ template class SizeClassAllocator32 { return BlockSize > PageSize; } - u16 popBlocks(CacheT *C, uptr ClassId, CompactPtrT *ToArray) { - TransferBatch *B = popBatch(C, ClassId); - if (!B) - return 0; - - const u16 Count = B->getCount(); - DCHECK_GT(Count, 0U); - B->moveToArray(ToArray); - - if (ClassId != SizeClassMap::BatchClassId) - C->deallocate(SizeClassMap::BatchClassId, B); - - return Count; - } - TransferBatch *popBatch(CacheT *C, uptr ClassId) { DCHECK_LT(ClassId, NumClasses); SizeClassInfo *Sci = getSizeClassInfo(ClassId); @@ -539,8 +520,8 @@ template class SizeClassAllocator32 { // from `CreateGroup` in `pushBlocksImpl` BG->PushedBlocks = 1; BG->BytesInBGAtLastCheckpoint = 0; - BG->MaxCachedPerBatch = - CacheT::getMaxCached(getSizeByClassId(SizeClassMap::BatchClassId)); + BG->MaxCachedPerBatch = TransferBatch::getMaxCached( + getSizeByClassId(SizeClassMap::BatchClassId)); Sci->FreeListInfo.BlockList.push_front(BG); } @@ -619,17 +600,17 @@ template class SizeClassAllocator32 { DCHECK_GT(Size, 0U); auto CreateGroup = [&](uptr CompactPtrGroupBase) { - BatchGroup *BG = reinterpret_cast(C->getBatchClassBlock()); + BatchGroup *BG = C->createGroup(); BG->Batches.clear(); - TransferBatch *TB = - reinterpret_cast(C->getBatchClassBlock()); + TransferBatch *TB = C->createBatch(ClassId, nullptr); TB->clear(); BG->CompactPtrGroupBase = CompactPtrGroupBase; BG->Batches.push_front(TB); BG->PushedBlocks = 0; BG->BytesInBGAtLastCheckpoint = 0; - BG->MaxCachedPerBatch = CacheT::getMaxCached(getSizeByClassId(ClassId)); + BG->MaxCachedPerBatch = + TransferBatch::getMaxCached(getSizeByClassId(ClassId)); return BG; }; @@ -644,7 +625,9 @@ template class SizeClassAllocator32 { u16 UnusedSlots = static_cast(BG->MaxCachedPerBatch - CurBatch->getCount()); if (UnusedSlots == 0) { - CurBatch = reinterpret_cast(C->getBatchClassBlock()); + CurBatch = C->createBatch( + ClassId, + reinterpret_cast(decompactPtr(ClassId, Array[I]))); CurBatch->clear(); Batches.push_front(CurBatch); UnusedSlots = BG->MaxCachedPerBatch; @@ -792,7 +775,7 @@ template class SizeClassAllocator32 { } const uptr Size = getSizeByClassId(ClassId); - const u16 MaxCount = CacheT::getMaxCached(Size); + const u16 MaxCount = TransferBatch::getMaxCached(Size); DCHECK_GT(MaxCount, 0U); // The maximum number of blocks we should carve in the region is dictated // by the maximum number of batches we want to fill, and the amount of diff --git a/compiler-rt/lib/scudo/standalone/primary64.h b/compiler-rt/lib/scudo/standalone/primary64.h index 7d555684e4ec9a..6d160b4c64d75f 100644 --- a/compiler-rt/lib/scudo/standalone/primary64.h +++ b/compiler-rt/lib/scudo/standalone/primary64.h @@ -9,7 +9,6 @@ #ifndef SCUDO_PRIMARY64_H_ #define SCUDO_PRIMARY64_H_ -#include "allocator_common.h" #include "bytemap.h" #include "common.h" #include "list.h" @@ -56,11 +55,8 @@ template class SizeClassAllocator64 { static const uptr GroupScale = GroupSizeLog - CompactPtrScale; typedef SizeClassAllocator64 ThisT; typedef SizeClassAllocatorLocalCache CacheT; - typedef TransferBatch TransferBatch; - typedef BatchGroup BatchGroup; - - static_assert(sizeof(BatchGroup) <= sizeof(TransferBatch), - "BatchGroup uses the same class size as TransferBatch"); + typedef typename CacheT::TransferBatch TransferBatch; + typedef typename CacheT::BatchGroup BatchGroup; static uptr getSizeByClassId(uptr ClassId) { return (ClassId == SizeClassMap::BatchClassId) @@ -207,21 +203,6 @@ template class SizeClassAllocator64 { DCHECK_EQ(BlocksInUse, BatchClassUsedInFreeLists); } - u16 popBlocks(CacheT *C, uptr ClassId, CompactPtrT *ToArray) { - TransferBatch *B = popBatch(C, ClassId); - if (!B) - return 0; - - const u16 Count = B->getCount(); - DCHECK_GT(Count, 0U); - B->moveToArray(ToArray); - - if (ClassId != SizeClassMap::BatchClassId) - C->deallocate(SizeClassMap::BatchClassId, B); - - return Count; - } - TransferBatch *popBatch(CacheT *C, uptr ClassId) { DCHECK_LT(ClassId, NumClasses); RegionInfo *Region = getRegionInfo(ClassId); @@ -649,8 +630,8 @@ template class SizeClassAllocator64 { // from `CreateGroup` in `pushBlocksImpl` BG->PushedBlocks = 1; BG->BytesInBGAtLastCheckpoint = 0; - BG->MaxCachedPerBatch = - CacheT::getMaxCached(getSizeByClassId(SizeClassMap::BatchClassId)); + BG->MaxCachedPerBatch = TransferBatch::getMaxCached( + getSizeByClassId(SizeClassMap::BatchClassId)); Region->FreeListInfo.BlockList.push_front(BG); } @@ -728,17 +709,17 @@ template class SizeClassAllocator64 { DCHECK_GT(Size, 0U); auto CreateGroup = [&](uptr CompactPtrGroupBase) { - BatchGroup *BG = reinterpret_cast(C->getBatchClassBlock()); + BatchGroup *BG = C->createGroup(); BG->Batches.clear(); - TransferBatch *TB = - reinterpret_cast(C->getBatchClassBlock()); + TransferBatch *TB = C->createBatch(ClassId, nullptr); TB->clear(); BG->CompactPtrGroupBase = CompactPtrGroupBase; BG->Batches.push_front(TB); BG->PushedBlocks = 0; BG->BytesInBGAtLastCheckpoint = 0; - BG->MaxCachedPerBatch = CacheT::getMaxCached(getSizeByClassId(ClassId)); + BG->MaxCachedPerBatch = + TransferBatch::getMaxCached(getSizeByClassId(ClassId)); return BG; }; @@ -753,7 +734,9 @@ template class SizeClassAllocator64 { u16 UnusedSlots = static_cast(BG->MaxCachedPerBatch - CurBatch->getCount()); if (UnusedSlots == 0) { - CurBatch = reinterpret_cast(C->getBatchClassBlock()); + CurBatch = C->createBatch( + ClassId, + reinterpret_cast(decompactPtr(ClassId, Array[I]))); CurBatch->clear(); Batches.push_front(CurBatch); UnusedSlots = BG->MaxCachedPerBatch; @@ -884,7 +867,7 @@ template class SizeClassAllocator64 { RegionInfo *Region) REQUIRES(Region->MMLock) EXCLUDES(Region->FLLock) { const uptr Size = getSizeByClassId(ClassId); - const u16 MaxCount = CacheT::getMaxCached(Size); + const u16 MaxCount = TransferBatch::getMaxCached(Size); const uptr RegionBeg = Region->RegionBeg; const uptr MappedUser = Region->MemMapInfo.MappedUser; diff --git a/compiler-rt/lib/scudo/standalone/tests/primary_test.cpp b/compiler-rt/lib/scudo/standalone/tests/primary_test.cpp index e368f521bea71a..074977ff27e65f 100644 --- a/compiler-rt/lib/scudo/standalone/tests/primary_test.cpp +++ b/compiler-rt/lib/scudo/standalone/tests/primary_test.cpp @@ -207,7 +207,7 @@ struct SmallRegionsConfig { // For the 32-bit one, it requires actually exhausting memory, so we skip it. TEST(ScudoPrimaryTest, Primary64OOM) { using Primary = scudo::SizeClassAllocator64; - using TransferBatch = Primary::TransferBatch; + using TransferBatch = Primary::CacheT::TransferBatch; Primary Allocator; Allocator.init(/*ReleaseToOsInterval=*/-1); typename Primary::CacheT Cache; @@ -233,9 +233,8 @@ TEST(ScudoPrimaryTest, Primary64OOM) { while (!Batches.empty()) { TransferBatch *B = Batches.back(); Batches.pop_back(); - const scudo::u16 Count = B->getCount(); - B->moveToArray(Blocks); - Allocator.pushBlocks(&Cache, ClassId, Blocks, Count); + B->copyToArray(Blocks); + Allocator.pushBlocks(&Cache, ClassId, Blocks, B->getCount()); Cache.deallocate(Primary::SizeClassMap::BatchClassId, B); } Cache.destroy(nullptr);