third_party/WebKit/Source/wtf/PartitionAlloc.h

   1 /*
   2  * Copyright (C) 2013 Google Inc. All rights reserved.
   3  *
   4  * Redistribution and use in source and binary forms, with or without
   5  * modification, are permitted provided that the following conditions are
   6  * met:
   7  *
   8  *     * Redistributions of source code must retain the above copyright
   9  * notice, this list of conditions and the following disclaimer.
  10  *     * Redistributions in binary form must reproduce the above
  11  * copyright notice, this list of conditions and the following disclaimer
  12  * in the documentation and/or other materials provided with the
  13  * distribution.
  14  *     * Neither the name of Google Inc. nor the names of its
  15  * contributors may be used to endorse or promote products derived from
  16  * this software without specific prior written permission.
  17  *
  18  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  19  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  20  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  21  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  22  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  23  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  24  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  25  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  26  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  27  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  28  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  29  */
  30
  31 #ifndef WTF_PartitionAlloc_h
  32 #define WTF_PartitionAlloc_h
  33
  34 // DESCRIPTION
  35 // partitionAlloc() / partitionAllocGeneric() and partitionFree() /
  36 // partitionFreeGeneric() are approximately analagous to malloc() and free().
  37 //
  38 // The main difference is that a PartitionRoot / PartitionRootGeneric object
  39 // must be supplied to these functions, representing a specific "heap partition"
  40 // that will be used to satisfy the allocation. Different partitions are
  41 // guaranteed to exist in separate address spaces, including being separate from
  42 // the main system heap. If the contained objects are all freed, physical memory
  43 // is returned to the system but the address space remains reserved.
  44 //
  45 // THE ONLY LEGITIMATE WAY TO OBTAIN A PartitionRoot IS THROUGH THE
  46 // SizeSpecificPartitionAllocator / PartitionAllocatorGeneric classes. To
  47 // minimize the instruction count to the fullest extent possible, the
  48 // PartitionRoot is really just a header adjacent to other data areas provided
  49 // by the allocator class.
  50 //
  51 // The partitionAlloc() variant of the API has the following caveats:
  52 // - Allocations and frees against a single partition must be single threaded.
  53 // - Allocations must not exceed a max size, chosen at compile-time via a
  54 // templated parameter to PartitionAllocator.
  55 // - Allocation sizes must be aligned to the system pointer size.
  56 // - Allocations are bucketed exactly according to size.
  57 //
  58 // And for partitionAllocGeneric():
  59 // - Multi-threaded use against a single partition is ok; locking is handled.
  60 // - Allocations of any arbitrary size can be handled (subject to a limit of
  61 // INT_MAX bytes for security reasons).
  62 // - Bucketing is by approximate size, for example an allocation of 4000 bytes
  63 // might be placed into a 4096-byte bucket. Bucket sizes are chosen to try and
  64 // keep worst-case waste to ~10%.
  65 //
  66 // The allocators are designed to be extremely fast, thanks to the following
  67 // properties and design:
  68 // - Just a single (reasonably predicatable) branch in the hot / fast path for
  69 // both allocating and (significantly) freeing.
  70 // - A minimal number of operations in the hot / fast path, with the slow paths
  71 // in separate functions, leading to the possibility of inlining.
  72 // - Each partition page (which is usually multiple physical pages) has a
  73 // metadata structure which allows fast mapping of free() address to an
  74 // underlying bucket.
  75 // - Supports a lock-free API for fast performance in single-threaded cases.
  76 // - The freelist for a given bucket is split across a number of partition
  77 // pages, enabling various simple tricks to try and minimize fragmentation.
  78 // - Fine-grained bucket sizes leading to less waste and better packing.
  79 //
  80 // The following security properties are provided at this time:
  81 // - Linear overflows cannot corrupt into the partition.
  82 // - Linear overflows cannot corrupt out of the partition.
  83 // - Freed pages will only be re-used within the partition.
  84 //   (exception: large allocations > ~1MB)
  85 // - Freed pages will only hold same-sized objects when re-used.
  86 // - Dereference of freelist pointer should fault.
  87 // - Out-of-line main metadata: linear over or underflow cannot corrupt it.
  88 // - Partial pointer overwrite of freelist pointer should fault.
  89 // - Rudimentary double-free detection.
  90 // - Large allocations (> ~1MB) are guard-paged at the beginning and end.
  91 //
  92 // The following security properties could be investigated in the future:
  93 // - Per-object bucketing (instead of per-size) is mostly available at the API,
  94 // but not used yet.
  95 // - No randomness of freelist entries or bucket position.
  96 // - Better checking for wild pointers in free().
  97 // - Better freelist masking function to guarantee fault on 32-bit.
  98
  99 #include "wtf/Assertions.h"
 100 #include "wtf/BitwiseOperations.h"
 101 #include "wtf/ByteSwap.h"
 102 #include "wtf/CPU.h"
 103 #include "wtf/PageAllocator.h"
 104 #include "wtf/SpinLock.h"
 105
 106 #include <limits.h>
 107
 108 #if defined(MEMORY_TOOL_REPLACES_ALLOCATOR)
 109 #include <stdlib.h>
 110 #endif
 111
 112 #if ENABLE(ASSERT)
 113 #include <string.h>
 114 #endif
 115
 116 namespace WTF {
 117
 118 // Allocation granularity of sizeof(void*) bytes.
 119 static const size_t kAllocationGranularity = sizeof(void*);
 120 static const size_t kAllocationGranularityMask = kAllocationGranularity - 1;
 121 static const size_t kBucketShift = (kAllocationGranularity == 8) ? 3 : 2;
 122
 123 // Underlying partition storage pages are a power-of-two size. It is typical
 124 // for a partition page to be based on multiple system pages. Most references to
 125 // "page" refer to partition pages.
 126 // We also have the concept of "super pages" -- these are the underlying system
 127 // allocations we make. Super pages contain multiple partition pages inside them
 128 // and include space for a small amount of metadata per partition page.
 129 // Inside super pages, we store "slot spans". A slot span is a continguous range
 130 // of one or more partition pages that stores allocations of the same size.
 131 // Slot span sizes are adjusted depending on the allocation size, to make sure
 132 // the packing does not lead to unused (wasted) space at the end of the last
 133 // system page of the span. For our current max slot span size of 64k and other
 134 // constant values, we pack _all_ partitionAllocGeneric() sizes perfectly up
 135 // against the end of a system page.
 136 static const size_t kPartitionPageShift = 14; // 16KB
 137 static const size_t kPartitionPageSize = 1 << kPartitionPageShift;
 138 static const size_t kPartitionPageOffsetMask = kPartitionPageSize - 1;
 139 static const size_t kPartitionPageBaseMask = ~kPartitionPageOffsetMask;
 140 static const size_t kMaxPartitionPagesPerSlotSpan = 4;
 141
 142 // To avoid fragmentation via never-used freelist entries, we hand out partition
 143 // freelist sections gradually, in units of the dominant system page size.
 144 // What we're actually doing is avoiding filling the full partition page (16 KB)
 145 // with freelist pointers right away. Writing freelist pointers will fault and
 146 // dirty a private page, which is very wasteful if we never actually store
 147 // objects there.
 148 static const size_t kNumSystemPagesPerPartitionPage = kPartitionPageSize / kSystemPageSize;
 149 static const size_t kMaxSystemPagesPerSlotSpan = kNumSystemPagesPerPartitionPage * kMaxPartitionPagesPerSlotSpan;
 150
 151 // We reserve virtual address space in 2MB chunks (aligned to 2MB as well).
 152 // These chunks are called "super pages". We do this so that we can store
 153 // metadata in the first few pages of each 2MB aligned section. This leads to
 154 // a very fast free(). We specifically choose 2MB because this virtual address
 155 // block represents a full but single PTE allocation on ARM, ia32 and x64.
 156 //
 157 // The layout of the super page is as follows. The sizes below are the same
 158 // for 32 bit and 64 bit.
 159 //
 160 //   | Guard page (4KB) | Metadata page (4KB) | Guard pages (8KB) | Slot span | Slot span | ... | Slot span | Guard page (4KB) |
 161 //
 162 //   - Each slot span is a contiguous range of one or more PartitionPages.
 163 //   - The metadata page has the following format. Note that the PartitionPage
 164 //     that is not at the head of a slot span is "unused". In other words,
 165 //     the metadata for the slot span is stored only in the first PartitionPage
 166 //     of the slot span. Metadata accesses to other PartitionPages are
 167 //     redirected to the first PartitionPage.
 168 //
 169 //     | SuperPageExtentEntry (32B) | PartitionPage of slot span 1 (32B, used) | PartitionPage of slot span 1 (32B, unused) | PartitionPage of slot span 1 (32B, unused) | PartitionPage of slot span 2 (32B, used) | PartitionPage of slot span 3 (32B, used) | ... | PartitionPage of slot span N (32B, unused) |
 170 //
 171 // A direct mapped page has a similar layout to fake it looking like a super page:
 172 //
 173 //     | Guard page (4KB) | Metadata page (4KB) | Guard pages (8KB) | Direct mapped object | Guard page (4KB) |
 174 //
 175 //    - The metadata page has the following layout:
 176 //
 177 //     | SuperPageExtentEntry (32B) | PartitionPage (32B) | PartitionBucket (32B) | PartitionDirectMapExtent (8B) |
 178 static const size_t kSuperPageShift = 21; // 2MB
 179 static const size_t kSuperPageSize = 1 << kSuperPageShift;
 180 static const size_t kSuperPageOffsetMask = kSuperPageSize - 1;
 181 static const size_t kSuperPageBaseMask = ~kSuperPageOffsetMask;
 182 static const size_t kNumPartitionPagesPerSuperPage = kSuperPageSize / kPartitionPageSize;
 183
 184 static const size_t kPageMetadataShift = 5; // 32 bytes per partition page.
 185 static const size_t kPageMetadataSize = 1 << kPageMetadataShift;
 186
 187 // The following kGeneric* constants apply to the generic variants of the API.
 188 // The "order" of an allocation is closely related to the power-of-two size of
 189 // the allocation. More precisely, the order is the bit index of the
 190 // most-significant-bit in the allocation size, where the bit numbers starts
 191 // at index 1 for the least-significant-bit.
 192 // In terms of allocation sizes, order 0 covers 0, order 1 covers 1, order 2
 193 // covers 2->3, order 3 covers 4->7, order 4 covers 8->15.
 194 static const size_t kGenericMinBucketedOrder = 4; // 8 bytes.
 195 static const size_t kGenericMaxBucketedOrder = 20; // Largest bucketed order is 1<<(20-1) (storing 512KB -> almost 1MB)
 196 static const size_t kGenericNumBucketedOrders = (kGenericMaxBucketedOrder - kGenericMinBucketedOrder) + 1;
 197 static const size_t kGenericNumBucketsPerOrderBits = 3; // Eight buckets per order (for the higher orders), e.g. order 8 is 128, 144, 160, ..., 240
 198 static const size_t kGenericNumBucketsPerOrder = 1 << kGenericNumBucketsPerOrderBits;
 199 static const size_t kGenericNumBuckets = kGenericNumBucketedOrders * kGenericNumBucketsPerOrder;
 200 static const size_t kGenericSmallestBucket = 1 << (kGenericMinBucketedOrder - 1);
 201 static const size_t kGenericMaxBucketSpacing = 1 << ((kGenericMaxBucketedOrder - 1) - kGenericNumBucketsPerOrderBits);
 202 static const size_t kGenericMaxBucketed = (1 << (kGenericMaxBucketedOrder - 1)) + ((kGenericNumBucketsPerOrder - 1) * kGenericMaxBucketSpacing);
 203 static const size_t kGenericMinDirectMappedDownsize = kGenericMaxBucketed + 1; // Limit when downsizing a direct mapping using realloc().
 204 static const size_t kGenericMaxDirectMapped = INT_MAX - kSystemPageSize;
 205 static const size_t kBitsPerSizet = sizeof(void*) * CHAR_BIT;
 206
 207 // Constants for the memory reclaim logic.
 208 static const size_t kMaxFreeableSpans = 16;
 209
 210 // If the total size in bytes of allocated but not committed pages exceeds this
 211 // value (probably it is a "out of virtual address space" crash),
 212 // a special crash stack trace is generated at |partitionOutOfMemory|.
 213 // This is to distinguish "out of virtual address space" from
 214 // "out of physical memory" in crash reports.
 215 static const size_t kReasonableSizeOfUnusedPages = 1024 * 1024 * 1024; // 1GiB
 216
 217 #if ENABLE(ASSERT)
 218 // These two byte values match tcmalloc.
 219 static const unsigned char kUninitializedByte = 0xAB;
 220 static const unsigned char kFreedByte = 0xCD;
 221 static const size_t kCookieSize = 16; // Handles alignment up to XMM instructions on Intel.
 222 static const unsigned char kCookieValue[kCookieSize] = { 0xDE, 0xAD, 0xBE, 0xEF, 0xCA, 0xFE, 0xD0, 0x0D, 0x13, 0x37, 0xF0, 0x05, 0xBA, 0x11, 0xAB, 0x1E };
 223 #endif
 224
 225 struct PartitionBucket;
 226 struct PartitionRootBase;
 227
 228 struct PartitionFreelistEntry {
 229     PartitionFreelistEntry* next;
 230 };
 231
 232 // Some notes on page states. A page can be in one of four major states:
 233 // 1) Active.
 234 // 2) Full.
 235 // 3) Empty.
 236 // 4) Decommitted.
 237 // An active page has available free slots. A full page has no free slots. An
 238 // empty page has no free slots, and a decommitted page is an empty page that
 239 // had its backing memory released back to the system.
 240 // There are two linked lists tracking the pages. The "active page" list is an
 241 // approximation of a list of active pages. It is an approximation because
 242 // full, empty and decommitted pages may briefly be present in the list until
 243 // we next do a scan over it.
 244 // The "empty page" list is an accurate list of pages which are either empty
 245 // or decommitted.
 246 //
 247 // The significant page transitions are:
 248 // - free() will detect when a full page has a slot free()'d and immediately
 249 // return the page to the head of the active list.
 250 // - free() will detect when a page is fully emptied. It _may_ add it to the
 251 // empty list or it _may_ leave it on the active list until a future list scan.
 252 // - malloc() _may_ scan the active page list in order to fulfil the request.
 253 // If it does this, full, empty and decommitted pages encountered will be
 254 // booted out of the active list. If there are no suitable active pages found,
 255 // an empty or decommitted page (if one exists) will be pulled from the empty
 256 // list on to the active list.
 257 struct PartitionPage {
 258     PartitionFreelistEntry* freelistHead;
 259     PartitionPage* nextPage;
 260     PartitionBucket* bucket;
 261     int16_t numAllocatedSlots; // Deliberately signed, 0 for empty or decommitted page, -n for full pages.
 262     uint16_t numUnprovisionedSlots;
 263     uint16_t pageOffset;
 264     int16_t emptyCacheIndex; // -1 if not in the empty cache.
 265 };
 266
 267 struct PartitionBucket {
 268     PartitionPage* activePagesHead; // Accessed most in hot path => goes first.
 269     PartitionPage* emptyPagesHead;
 270     PartitionPage* decommittedPagesHead;
 271     uint32_t slotSize;
 272     uint16_t numSystemPagesPerSlotSpan;
 273     uint16_t numFullPages;
 274 };
 275
 276 // An "extent" is a span of consecutive superpages. We link to the partition's
 277 // next extent (if there is one) at the very start of a superpage's metadata
 278 // area.
 279 struct PartitionSuperPageExtentEntry {
 280     PartitionRootBase* root;
 281     char* superPageBase;
 282     char* superPagesEnd;
 283     PartitionSuperPageExtentEntry* next;
 284 };
 285
 286 struct PartitionDirectMapExtent {
 287     PartitionDirectMapExtent* nextExtent;
 288     PartitionDirectMapExtent* prevExtent;
 289     PartitionBucket* bucket;
 290     size_t mapSize; // Mapped size, not including guard pages and meta-data.
 291 };
 292
 293 struct WTF_EXPORT PartitionRootBase {
 294     size_t totalSizeOfCommittedPages;
 295     size_t totalSizeOfSuperPages;
 296     size_t totalSizeOfDirectMappedPages;
 297     // Invariant: totalSizeOfCommittedPages <= totalSizeOfSuperPages + totalSizeOfDirectMappedPages.
 298     unsigned numBuckets;
 299     unsigned maxAllocation;
 300     bool initialized;
 301     char* nextSuperPage;
 302     char* nextPartitionPage;
 303     char* nextPartitionPageEnd;
 304     PartitionSuperPageExtentEntry* currentExtent;
 305     PartitionSuperPageExtentEntry* firstExtent;
 306     PartitionDirectMapExtent* directMapList;
 307     PartitionPage* globalEmptyPageRing[kMaxFreeableSpans];
 308     int16_t globalEmptyPageRingIndex;
 309     uintptr_t invertedSelf;
 310
 311     static int gInitializedLock;
 312     static bool gInitialized;
 313     // gSeedPage is used as a sentinel to indicate that there is no page
 314     // in the active page list. We can use nullptr, but in that case we need
 315     // to add a null-check branch to the hot allocation path. We want to avoid
 316     // that.
 317     static PartitionPage gSeedPage;
 318     static PartitionBucket gPagedBucket;
 319     // gOomHandlingFunction is invoked when ParitionAlloc hits OutOfMemory.
 320     static void (*gOomHandlingFunction)();
 321 };
 322
 323 // Never instantiate a PartitionRoot directly, instead use PartitionAlloc.
 324 struct PartitionRoot : public PartitionRootBase {
 325     // The PartitionAlloc templated class ensures the following is correct.
 326     ALWAYS_INLINE PartitionBucket* buckets() { return reinterpret_cast<PartitionBucket*>(this + 1); }
 327     ALWAYS_INLINE const PartitionBucket* buckets() const { return reinterpret_cast<const PartitionBucket*>(this + 1); }
 328 };
 329
 330 // Never instantiate a PartitionRootGeneric directly, instead use PartitionAllocatorGeneric.
 331 struct PartitionRootGeneric : public PartitionRootBase {
 332     int lock;
 333     // Some pre-computed constants.
 334     size_t orderIndexShifts[kBitsPerSizet + 1];
 335     size_t orderSubIndexMasks[kBitsPerSizet + 1];
 336     // The bucket lookup table lets us map a size_t to a bucket quickly.
 337     // The trailing +1 caters for the overflow case for very large allocation sizes.
 338     // It is one flat array instead of a 2D array because in the 2D world, we'd
 339     // need to index array[blah][max+1] which risks undefined behavior.
 340     PartitionBucket* bucketLookups[((kBitsPerSizet + 1) * kGenericNumBucketsPerOrder) + 1];
 341     PartitionBucket buckets[kGenericNumBuckets];
 342 };
 343
 344 // Flags for partitionAllocGenericFlags.
 345 enum PartitionAllocFlags {
 346     PartitionAllocReturnNull = 1 << 0,
 347 };
 348
 349 // Struct used to retrieve total memory usage of a partition. Used by
 350 // PartitionStatsDumper implementation.
 351 struct PartitionMemoryStats {
 352     size_t totalMmappedBytes; // Total bytes mmaped from the system.
 353     size_t totalCommittedBytes; // Total size of commmitted pages.
 354     size_t totalResidentBytes; // Total bytes provisioned by the partition.
 355     size_t totalActiveBytes; // Total active bytes in the partition.
 356     size_t totalDecommittableBytes; // Total bytes that could be decommitted.
 357     size_t totalDiscardableBytes; // Total bytes that could be discarded.
 358 };
 359
 360 // Struct used to retrieve memory statistics about a partition bucket. Used by
 361 // PartitionStatsDumper implementation.
 362 struct PartitionBucketMemoryStats {
 363     bool isValid; // Used to check if the stats is valid.
 364     bool isDirectMap; // True if this is a direct mapping; size will not be unique.
 365     uint32_t bucketSlotSize; // The size of the slot in bytes.
 366     uint32_t allocatedPageSize; // Total size the partition page allocated from the system.
 367     uint32_t activeBytes; // Total active bytes used in the bucket.
 368     uint32_t residentBytes; // Total bytes provisioned in the bucket.
 369     uint32_t decommittableBytes; // Total bytes that could be decommitted.
 370     uint32_t discardableBytes; // Total bytes that could be discarded.
 371     uint32_t numFullPages; // Number of pages with all slots allocated.
 372     uint32_t numActivePages; // Number of pages that have at least one provisioned slot.
 373     uint32_t numEmptyPages; // Number of pages that are empty but not decommitted.
 374     uint32_t numDecommittedPages; // Number of pages that are empty and decommitted.
 375 };
 376
 377 // Interface that is passed to partitionDumpStats and
 378 // partitionDumpStatsGeneric for using the memory statistics.
 379 class WTF_EXPORT PartitionStatsDumper {
 380 public:
 381     // Called to dump total memory used by partition, once per partition.
 382     virtual void partitionDumpTotals(const char* partitionName, const PartitionMemoryStats*) = 0;
 383
 384     // Called to dump stats about buckets, for each bucket.
 385     virtual void partitionsDumpBucketStats(const char* partitionName, const PartitionBucketMemoryStats*) = 0;
 386 };
 387
 388 WTF_EXPORT void partitionAllocGlobalInit(void (*oomHandlingFunction)());
 389 WTF_EXPORT void partitionAllocInit(PartitionRoot*, size_t numBuckets, size_t maxAllocation);
 390 WTF_EXPORT bool partitionAllocShutdown(PartitionRoot*);
 391 WTF_EXPORT void partitionAllocGenericInit(PartitionRootGeneric*);
 392 WTF_EXPORT bool partitionAllocGenericShutdown(PartitionRootGeneric*);
 393
 394 enum PartitionPurgeFlags {
 395     // Decommitting the ring list of empty pages is reasonably fast.
 396     PartitionPurgeDecommitEmptyPages = 1 << 0,
 397     // Discarding unused system pages is slower, because it involves walking all
 398     // freelists in all active partition pages of all buckets >= system page
 399     // size. It often frees a similar amount of memory to decommitting the empty
 400     // pages, though.
 401     PartitionPurgeDiscardUnusedSystemPages = 1 << 1,
 402 };
 403
 404 WTF_EXPORT void partitionPurgeMemory(PartitionRoot*, int);
 405 WTF_EXPORT void partitionPurgeMemoryGeneric(PartitionRootGeneric*, int);
 406
 407 WTF_EXPORT NEVER_INLINE void* partitionAllocSlowPath(PartitionRootBase*, int, size_t, PartitionBucket*);
 408 WTF_EXPORT NEVER_INLINE void partitionFreeSlowPath(PartitionPage*);
 409 WTF_EXPORT NEVER_INLINE void* partitionReallocGeneric(PartitionRootGeneric*, void*, size_t);
 410
 411 WTF_EXPORT void partitionDumpStats(PartitionRoot*, const char* partitionName, bool isLightDump, PartitionStatsDumper*);
 412 WTF_EXPORT void partitionDumpStatsGeneric(PartitionRootGeneric*, const char* partitionName, bool isLightDump, PartitionStatsDumper*);
 413
 414 ALWAYS_INLINE PartitionFreelistEntry* partitionFreelistMask(PartitionFreelistEntry* ptr)
 415 {
 416     // We use bswap on little endian as a fast mask for two reasons:
 417     // 1) If an object is freed and its vtable used where the attacker doesn't
 418     // get the chance to run allocations between the free and use, the vtable
 419     // dereference is likely to fault.
 420     // 2) If the attacker has a linear buffer overflow and elects to try and
 421     // corrupt a freelist pointer, partial pointer overwrite attacks are
 422     // thwarted.
 423     // For big endian, similar guarantees are arrived at with a negation.
 424 #if CPU(BIG_ENDIAN)
 425     uintptr_t masked = ~reinterpret_cast<uintptr_t>(ptr);
 426 #else
 427     uintptr_t masked = bswapuintptrt(reinterpret_cast<uintptr_t>(ptr));
 428 #endif
 429     return reinterpret_cast<PartitionFreelistEntry*>(masked);
 430 }
 431
 432 ALWAYS_INLINE size_t partitionCookieSizeAdjustAdd(size_t size)
 433 {
 434 #if ENABLE(ASSERT)
 435     // Add space for cookies, checking for integer overflow.
 436     ASSERT(size + (2 * kCookieSize) > size);
 437     size += 2 * kCookieSize;
 438 #endif
 439     return size;
 440 }
 441
 442 ALWAYS_INLINE size_t partitionCookieSizeAdjustSubtract(size_t size)
 443 {
 444 #if ENABLE(ASSERT)
 445     // Remove space for cookies.
 446     ASSERT(size >= 2 * kCookieSize);
 447     size -= 2 * kCookieSize;
 448 #endif
 449     return size;
 450 }
 451
 452 ALWAYS_INLINE void* partitionCookieFreePointerAdjust(void* ptr)
 453 {
 454 #if ENABLE(ASSERT)
 455     // The value given to the application is actually just after the cookie.
 456     ptr = static_cast<char*>(ptr) - kCookieSize;
 457 #endif
 458     return ptr;
 459 }
 460
 461 ALWAYS_INLINE void partitionCookieWriteValue(void* ptr)
 462 {
 463 #if ENABLE(ASSERT)
 464     unsigned char* cookiePtr = reinterpret_cast<unsigned char*>(ptr);
 465     for (size_t i = 0; i < kCookieSize; ++i, ++cookiePtr)
 466         *cookiePtr = kCookieValue[i];
 467 #endif
 468 }
 469
 470 ALWAYS_INLINE void partitionCookieCheckValue(void* ptr)
 471 {
 472 #if ENABLE(ASSERT)
 473     unsigned char* cookiePtr = reinterpret_cast<unsigned char*>(ptr);
 474     for (size_t i = 0; i < kCookieSize; ++i, ++cookiePtr)
 475         ASSERT(*cookiePtr == kCookieValue[i]);
 476 #endif
 477 }
 478
 479 ALWAYS_INLINE char* partitionSuperPageToMetadataArea(char* ptr)
 480 {
 481     uintptr_t pointerAsUint = reinterpret_cast<uintptr_t>(ptr);
 482     ASSERT(!(pointerAsUint & kSuperPageOffsetMask));
 483     // The metadata area is exactly one system page (the guard page) into the
 484     // super page.
 485     return reinterpret_cast<char*>(pointerAsUint + kSystemPageSize);
 486 }
 487
 488 ALWAYS_INLINE PartitionPage* partitionPointerToPageNoAlignmentCheck(void* ptr)
 489 {
 490     uintptr_t pointerAsUint = reinterpret_cast<uintptr_t>(ptr);
 491     char* superPagePtr = reinterpret_cast<char*>(pointerAsUint & kSuperPageBaseMask);
 492     uintptr_t partitionPageIndex = (pointerAsUint & kSuperPageOffsetMask) >> kPartitionPageShift;
 493     // Index 0 is invalid because it is the metadata and guard area and
 494     // the last index is invalid because it is a guard page.
 495     ASSERT(partitionPageIndex);
 496     ASSERT(partitionPageIndex < kNumPartitionPagesPerSuperPage - 1);
 497     PartitionPage* page = reinterpret_cast<PartitionPage*>(partitionSuperPageToMetadataArea(superPagePtr) + (partitionPageIndex << kPageMetadataShift));
 498     // Partition pages in the same slot span can share the same page object. Adjust for that.
 499     size_t delta = page->pageOffset << kPageMetadataShift;
 500     page = reinterpret_cast<PartitionPage*>(reinterpret_cast<char*>(page) - delta);
 501     return page;
 502 }
 503
 504 ALWAYS_INLINE void* partitionPageToPointer(const PartitionPage* page)
 505 {
 506     uintptr_t pointerAsUint = reinterpret_cast<uintptr_t>(page);
 507     uintptr_t superPageOffset = (pointerAsUint & kSuperPageOffsetMask);
 508     ASSERT(superPageOffset > kSystemPageSize);
 509     ASSERT(superPageOffset < kSystemPageSize + (kNumPartitionPagesPerSuperPage * kPageMetadataSize));
 510     uintptr_t partitionPageIndex = (superPageOffset - kSystemPageSize) >> kPageMetadataShift;
 511     // Index 0 is invalid because it is the metadata area and the last index is invalid because it is a guard page.
 512     ASSERT(partitionPageIndex);
 513     ASSERT(partitionPageIndex < kNumPartitionPagesPerSuperPage - 1);
 514     uintptr_t superPageBase = (pointerAsUint & kSuperPageBaseMask);
 515     void* ret = reinterpret_cast<void*>(superPageBase + (partitionPageIndex << kPartitionPageShift));
 516     return ret;
 517 }
 518
 519 ALWAYS_INLINE PartitionPage* partitionPointerToPage(void* ptr)
 520 {
 521     PartitionPage* page = partitionPointerToPageNoAlignmentCheck(ptr);
 522     // Checks that the pointer is a multiple of bucket size.
 523     ASSERT(!((reinterpret_cast<uintptr_t>(ptr) - reinterpret_cast<uintptr_t>(partitionPageToPointer(page))) % page->bucket->slotSize));
 524     return page;
 525 }
 526
 527 ALWAYS_INLINE bool partitionBucketIsDirectMapped(const PartitionBucket* bucket)
 528 {
 529     return !bucket->numSystemPagesPerSlotSpan;
 530 }
 531
 532 ALWAYS_INLINE size_t partitionBucketBytes(const PartitionBucket* bucket)
 533 {
 534     return bucket->numSystemPagesPerSlotSpan * kSystemPageSize;
 535 }
 536
 537 ALWAYS_INLINE uint16_t partitionBucketSlots(const PartitionBucket* bucket)
 538 {
 539     return static_cast<uint16_t>(partitionBucketBytes(bucket) / bucket->slotSize);
 540 }
 541
 542 ALWAYS_INLINE size_t* partitionPageGetRawSizePtr(PartitionPage* page)
 543 {
 544     // For single-slot buckets which span more than one partition page, we
 545     // have some spare metadata space to store the raw allocation size. We
 546     // can use this to report better statistics.
 547     PartitionBucket* bucket = page->bucket;
 548     if (bucket->slotSize <= kMaxSystemPagesPerSlotSpan * kSystemPageSize)
 549         return nullptr;
 550
 551     ASSERT((bucket->slotSize % kSystemPageSize) == 0);
 552     ASSERT(partitionBucketIsDirectMapped(bucket) || partitionBucketSlots(bucket) == 1);
 553     page++;
 554     return reinterpret_cast<size_t*>(&page->freelistHead);
 555 }
 556
 557 ALWAYS_INLINE size_t partitionPageGetRawSize(PartitionPage* page)
 558 {
 559     size_t* rawSizePtr = partitionPageGetRawSizePtr(page);
 560     if (UNLIKELY(rawSizePtr != nullptr))
 561         return *rawSizePtr;
 562     return 0;
 563 }
 564
 565 ALWAYS_INLINE PartitionRootBase* partitionPageToRoot(PartitionPage* page)
 566 {
 567     PartitionSuperPageExtentEntry* extentEntry = reinterpret_cast<PartitionSuperPageExtentEntry*>(reinterpret_cast<uintptr_t>(page) & kSystemPageBaseMask);
 568     return extentEntry->root;
 569 }
 570
 571 ALWAYS_INLINE bool partitionPointerIsValid(void* ptr)
 572 {
 573     PartitionPage* page = partitionPointerToPage(ptr);
 574     PartitionRootBase* root = partitionPageToRoot(page);
 575     return root->invertedSelf == ~reinterpret_cast<uintptr_t>(root);
 576 }
 577
 578 ALWAYS_INLINE void* partitionBucketAlloc(PartitionRootBase* root, int flags, size_t size, PartitionBucket* bucket)
 579 {
 580     PartitionPage* page = bucket->activePagesHead;
 581     // Check that this page is neither full nor freed.
 582     ASSERT(page->numAllocatedSlots >= 0);
 583     void* ret = page->freelistHead;
 584     if (LIKELY(ret != 0)) {
 585         // If these asserts fire, you probably corrupted memory.
 586         ASSERT(partitionPointerIsValid(ret));
 587         // All large allocations must go through the slow path to correctly
 588         // update the size metadata.
 589         ASSERT(partitionPageGetRawSize(page) == 0);
 590         PartitionFreelistEntry* newHead = partitionFreelistMask(static_cast<PartitionFreelistEntry*>(ret)->next);
 591         page->freelistHead = newHead;
 592         page->numAllocatedSlots++;
 593     } else {
 594         ret = partitionAllocSlowPath(root, flags, size, bucket);
 595         ASSERT(!ret || partitionPointerIsValid(ret));
 596     }
 597 #if ENABLE(ASSERT)
 598     if (!ret)
 599         return 0;
 600     // Fill the uninitialized pattern, and write the cookies.
 601     page = partitionPointerToPage(ret);
 602     size_t slotSize = page->bucket->slotSize;
 603     size_t rawSize = partitionPageGetRawSize(page);
 604     if (rawSize) {
 605         ASSERT(rawSize == size);
 606         slotSize = rawSize;
 607     }
 608     size_t noCookieSize = partitionCookieSizeAdjustSubtract(slotSize);
 609     char* charRet = static_cast<char*>(ret);
 610     // The value given to the application is actually just after the cookie.
 611     ret = charRet + kCookieSize;
 612     memset(ret, kUninitializedByte, noCookieSize);
 613     partitionCookieWriteValue(charRet);
 614     partitionCookieWriteValue(charRet + kCookieSize + noCookieSize);
 615 #endif
 616     return ret;
 617 }
 618
 619 ALWAYS_INLINE void* partitionAlloc(PartitionRoot* root, size_t size)
 620 {
 621 #if defined(MEMORY_TOOL_REPLACES_ALLOCATOR)
 622     void* result = malloc(size);
 623     RELEASE_ASSERT(result);
 624     return result;
 625 #else
 626     size = partitionCookieSizeAdjustAdd(size);
 627     ASSERT(root->initialized);
 628     size_t index = size >> kBucketShift;
 629     ASSERT(index < root->numBuckets);
 630     ASSERT(size == index << kBucketShift);
 631     PartitionBucket* bucket = &root->buckets()[index];
 632     return partitionBucketAlloc(root, 0, size, bucket);
 633 #endif // defined(MEMORY_TOOL_REPLACES_ALLOCATOR)
 634 }
 635
 636 ALWAYS_INLINE void partitionFreeWithPage(void* ptr, PartitionPage* page)
 637 {
 638     // If these asserts fire, you probably corrupted memory.
 639 #if ENABLE(ASSERT)
 640     size_t slotSize = page->bucket->slotSize;
 641     size_t rawSize = partitionPageGetRawSize(page);
 642     if (rawSize)
 643         slotSize = rawSize;
 644     partitionCookieCheckValue(ptr);
 645     partitionCookieCheckValue(reinterpret_cast<char*>(ptr) + slotSize - kCookieSize);
 646     memset(ptr, kFreedByte, slotSize);
 647 #endif
 648     ASSERT(page->numAllocatedSlots);
 649     PartitionFreelistEntry* freelistHead = page->freelistHead;
 650     ASSERT(!freelistHead || partitionPointerIsValid(freelistHead));
 651     RELEASE_ASSERT_WITH_SECURITY_IMPLICATION(ptr != freelistHead); // Catches an immediate double free.
 652     ASSERT_WITH_SECURITY_IMPLICATION(!freelistHead || ptr != partitionFreelistMask(freelistHead->next)); // Look for double free one level deeper in debug.
 653     PartitionFreelistEntry* entry = static_cast<PartitionFreelistEntry*>(ptr);
 654     entry->next = partitionFreelistMask(freelistHead);
 655     page->freelistHead = entry;
 656     --page->numAllocatedSlots;
 657     if (UNLIKELY(page->numAllocatedSlots <= 0)) {
 658         partitionFreeSlowPath(page);
 659     } else {
 660         // All single-slot allocations must go through the slow path to
 661         // correctly update the size metadata.
 662         ASSERT(partitionPageGetRawSize(page) == 0);
 663     }
 664 }
 665
 666 ALWAYS_INLINE void partitionFree(void* ptr)
 667 {
 668 #if defined(MEMORY_TOOL_REPLACES_ALLOCATOR)
 669     free(ptr);
 670 #else
 671     ptr = partitionCookieFreePointerAdjust(ptr);
 672     ASSERT(partitionPointerIsValid(ptr));
 673     PartitionPage* page = partitionPointerToPage(ptr);
 674     partitionFreeWithPage(ptr, page);
 675 #endif
 676 }
 677
 678 ALWAYS_INLINE PartitionBucket* partitionGenericSizeToBucket(PartitionRootGeneric* root, size_t size)
 679 {
 680     size_t order = kBitsPerSizet - countLeadingZerosSizet(size);
 681     // The order index is simply the next few bits after the most significant bit.
 682     size_t orderIndex = (size >> root->orderIndexShifts[order]) & (kGenericNumBucketsPerOrder - 1);
 683     // And if the remaining bits are non-zero we must bump the bucket up.
 684     size_t subOrderIndex = size & root->orderSubIndexMasks[order];
 685     PartitionBucket* bucket = root->bucketLookups[(order << kGenericNumBucketsPerOrderBits) + orderIndex + !!subOrderIndex];
 686     ASSERT(!bucket->slotSize || bucket->slotSize >= size);
 687     ASSERT(!(bucket->slotSize % kGenericSmallestBucket));
 688     return bucket;
 689 }
 690
 691 ALWAYS_INLINE void* partitionAllocGenericFlags(PartitionRootGeneric* root, int flags, size_t size)
 692 {
 693 #if defined(MEMORY_TOOL_REPLACES_ALLOCATOR)
 694     void* result = malloc(size);
 695     RELEASE_ASSERT(result);
 696     return result;
 697 #else
 698     ASSERT(root->initialized);
 699     size = partitionCookieSizeAdjustAdd(size);
 700     PartitionBucket* bucket = partitionGenericSizeToBucket(root, size);
 701     spinLockLock(&root->lock);
 702     void* ret = partitionBucketAlloc(root, flags, size, bucket);
 703     spinLockUnlock(&root->lock);
 704     return ret;
 705 #endif
 706 }
 707
 708 ALWAYS_INLINE void* partitionAllocGeneric(PartitionRootGeneric* root, size_t size)
 709 {
 710     return partitionAllocGenericFlags(root, 0, size);
 711 }
 712
 713 ALWAYS_INLINE void partitionFreeGeneric(PartitionRootGeneric* root, void* ptr)
 714 {
 715 #if defined(MEMORY_TOOL_REPLACES_ALLOCATOR)
 716     free(ptr);
 717 #else
 718     ASSERT(root->initialized);
 719
 720     if (UNLIKELY(!ptr))
 721         return;
 722
 723     ptr = partitionCookieFreePointerAdjust(ptr);
 724     ASSERT(partitionPointerIsValid(ptr));
 725     PartitionPage* page = partitionPointerToPage(ptr);
 726     spinLockLock(&root->lock);
 727     partitionFreeWithPage(ptr, page);
 728     spinLockUnlock(&root->lock);
 729 #endif
 730 }
 731
 732 ALWAYS_INLINE size_t partitionDirectMapSize(size_t size)
 733 {
 734     // Caller must check that the size is not above the kGenericMaxDirectMapped
 735     // limit before calling. This also guards against integer overflow in the
 736     // calculation here.
 737     ASSERT(size <= kGenericMaxDirectMapped);
 738     return (size + kSystemPageOffsetMask) & kSystemPageBaseMask;
 739 }
 740
 741 ALWAYS_INLINE size_t partitionAllocActualSize(PartitionRootGeneric* root, size_t size)
 742 {
 743 #if defined(MEMORY_TOOL_REPLACES_ALLOCATOR)
 744     return size;
 745 #else
 746     ASSERT(root->initialized);
 747     size = partitionCookieSizeAdjustAdd(size);
 748     PartitionBucket* bucket = partitionGenericSizeToBucket(root, size);
 749     if (LIKELY(!partitionBucketIsDirectMapped(bucket))) {
 750         size = bucket->slotSize;
 751     } else if (size > kGenericMaxDirectMapped) {
 752         // Too large to allocate => return the size unchanged.
 753     } else {
 754         ASSERT(bucket == &PartitionRootBase::gPagedBucket);
 755         size = partitionDirectMapSize(size);
 756     }
 757     return partitionCookieSizeAdjustSubtract(size);
 758 #endif
 759 }
 760
 761 ALWAYS_INLINE bool partitionAllocSupportsGetSize()
 762 {
 763 #if defined(MEMORY_TOOL_REPLACES_ALLOCATOR)
 764     return false;
 765 #else
 766     return true;
 767 #endif
 768 }
 769
 770 ALWAYS_INLINE size_t partitionAllocGetSize(void* ptr)
 771 {
 772     // No need to lock here. Only 'ptr' being freed by another thread could
 773     // cause trouble, and the caller is responsible for that not happening.
 774     ASSERT(partitionAllocSupportsGetSize());
 775     ptr = partitionCookieFreePointerAdjust(ptr);
 776     ASSERT(partitionPointerIsValid(ptr));
 777     PartitionPage* page = partitionPointerToPage(ptr);
 778     size_t size = page->bucket->slotSize;
 779     return partitionCookieSizeAdjustSubtract(size);
 780 }
 781
 782 // N (or more accurately, N - sizeof(void*)) represents the largest size in
 783 // bytes that will be handled by a SizeSpecificPartitionAllocator.
 784 // Attempts to partitionAlloc() more than this amount will fail.
 785 template <size_t N>
 786 class SizeSpecificPartitionAllocator {
 787 public:
 788     static const size_t kMaxAllocation = N - kAllocationGranularity;
 789     static const size_t kNumBuckets = N / kAllocationGranularity;
 790     void init() { partitionAllocInit(&m_partitionRoot, kNumBuckets, kMaxAllocation); }
 791     bool shutdown() { return partitionAllocShutdown(&m_partitionRoot); }
 792     ALWAYS_INLINE PartitionRoot* root() { return &m_partitionRoot; }
 793 private:
 794     PartitionRoot m_partitionRoot;
 795     PartitionBucket m_actualBuckets[kNumBuckets];
 796 };
 797
 798 class PartitionAllocatorGeneric {
 799 public:
 800     void init() { partitionAllocGenericInit(&m_partitionRoot); }
 801     bool shutdown() { return partitionAllocGenericShutdown(&m_partitionRoot); }
 802     ALWAYS_INLINE PartitionRootGeneric* root() { return &m_partitionRoot; }
 803 private:
 804     PartitionRootGeneric m_partitionRoot;
 805 };
 806
 807 } // namespace WTF
 808
 809 using WTF::SizeSpecificPartitionAllocator;
 810 using WTF::PartitionAllocatorGeneric;
 811 using WTF::PartitionRoot;
 812 using WTF::partitionAllocInit;
 813 using WTF::partitionAllocShutdown;
 814 using WTF::partitionAlloc;
 815 using WTF::partitionFree;
 816 using WTF::partitionAllocGeneric;
 817 using WTF::partitionFreeGeneric;
 818 using WTF::partitionReallocGeneric;
 819 using WTF::partitionAllocActualSize;
 820 using WTF::partitionAllocSupportsGetSize;
 821 using WTF::partitionAllocGetSize;
 822
 823 #endif // WTF_PartitionAlloc_h