memory/replace/phc/PHC.cpp

   1 /* -*- Mode: C++; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
   2 /* vim: set ts=8 sts=2 et sw=2 tw=80: */
   3 /* This Source Code Form is subject to the terms of the Mozilla Public
   4  * License, v. 2.0. If a copy of the MPL was not distributed with this
   5  * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
   6
   7 // PHC is a probabilistic heap checker. A tiny fraction of randomly chosen heap
   8 // allocations are subject to some expensive checking via the use of OS page
   9 // access protection. A failed check triggers a crash, whereupon useful
  10 // information about the failure is put into the crash report. The cost and
  11 // coverage for each user is minimal, but spread over the entire user base the
  12 // coverage becomes significant.
  13 //
  14 // The idea comes from Chromium, where it is called GWP-ASAN. (Firefox uses PHC
  15 // as the name because GWP-ASAN is long, awkward, and doesn't have any
  16 // particular meaning.)
  17 //
  18 // In the current implementation up to 64 allocations per process can become
  19 // PHC allocations. These allocations must be page-sized or smaller. Each PHC
  20 // allocation gets its own page, and when the allocation is freed its page is
  21 // marked inaccessible until the page is reused for another allocation. This
  22 // means that a use-after-free defect (which includes double-frees) will be
  23 // caught if the use occurs before the page is reused for another allocation.
  24 // The crash report will contain stack traces for the allocation site, the free
  25 // site, and the use-after-free site, which is often enough to diagnose the
  26 // defect.
  27 //
  28 // Also, each PHC allocation is followed by a guard page. The PHC allocation is
  29 // positioned so that its end abuts the guard page (or as close as possible,
  30 // given alignment constraints). This means that a bounds violation at the end
  31 // of the allocation (overflow) will be caught. The crash report will contain
  32 // stack traces for the allocation site and the bounds violation use site,
  33 // which is often enough to diagnose the defect.
  34 //
  35 // (A bounds violation at the start of the allocation (underflow) will not be
  36 // caught, unless it is sufficiently large to hit the preceding allocation's
  37 // guard page, which is not that likely. It would be possible to look more
  38 // assiduously for underflow by randomly placing some allocations at the end of
  39 // the page and some at the start of the page, and GWP-ASAN does this. PHC does
  40 // not, however, because overflow is likely to be much more common than
  41 // underflow in practice.)
  42 //
  43 // We use a simple heuristic to categorize a guard page access as overflow or
  44 // underflow: if the address falls in the lower half of the guard page, we
  45 // assume it is overflow, otherwise we assume it is underflow. More
  46 // sophisticated heuristics are possible, but this one is very simple, and it is
  47 // likely that most overflows/underflows in practice are very close to the page
  48 // boundary.
  49 //
  50 // The design space for the randomization strategy is large. The current
  51 // implementation has a large random delay before it starts operating, and a
  52 // small random delay between each PHC allocation attempt. Each freed PHC
  53 // allocation is quarantined for a medium random delay before being reused, in
  54 // order to increase the chance of catching UAFs.
  55 //
  56 // The basic cost of PHC's operation is as follows.
  57 //
  58 // - The physical memory cost is 64 pages plus some metadata (including stack
  59 //   traces) for each page. This amounts to 256 KiB per process on
  60 //   architectures with 4 KiB pages and 1024 KiB on macOS/AArch64 which uses
  61 //   16 KiB pages.
  62 //
  63 // - The virtual memory cost is the physical memory cost plus the guard pages:
  64 //   another 64 pages. This amounts to another 256 KiB per process on
  65 //   architectures with 4 KiB pages and 1024 KiB on macOS/AArch64 which uses
  66 //   16 KiB pages. PHC is currently only enabled on 64-bit platforms so the
  67 //   impact of the virtual memory usage is negligible.
  68 //
  69 // - Every allocation requires a size check and a decrement-and-check of an
  70 //   atomic counter. When the counter reaches zero a PHC allocation can occur,
  71 //   which involves marking a page as accessible and getting a stack trace for
  72 //   the allocation site. Otherwise, mozjemalloc performs the allocation.
  73 //
  74 // - Every deallocation requires a range check on the pointer to see if it
  75 //   involves a PHC allocation. (The choice to only do PHC allocations that are
  76 //   a page or smaller enables this range check, because the 64 pages are
  77 //   contiguous. Allowing larger allocations would make this more complicated,
  78 //   and we definitely don't want something as slow as a hash table lookup on
  79 //   every deallocation.) PHC deallocations involve marking a page as
  80 //   inaccessible and getting a stack trace for the deallocation site.
  81 //
  82 // Note that calls to realloc(), free(), and malloc_usable_size() will
  83 // immediately crash if the given pointer falls within a page allocation's
  84 // page, but does not point to the start of the allocation itself.
  85 //
  86 //   void* p = malloc(64);
  87 //   free(p + 1);     // p+1 doesn't point to the allocation start; crash
  88 //
  89 // Such crashes will not have the PHC fields in the crash report.
  90 //
  91 // PHC-specific tests can be run with the following commands:
  92 // - gtests: `./mach gtest '*PHC*'`
  93 // - xpcshell-tests: `./mach test toolkit/crashreporter/test/unit`
  94 //   - This runs some non-PHC tests as well.
  95
  96 #include "PHC.h"
  97
  98 #include <stdlib.h>
  99 #include <time.h>
 100
 101 #include <algorithm>
 102
 103 #ifdef XP_WIN
 104 #  include <process.h>
 105 #else
 106 #  include <sys/mman.h>
 107 #  include <sys/types.h>
 108 #  include <pthread.h>
 109 #  include <unistd.h>
 110 #endif
 111
 112 #include "replace_malloc.h"
 113 #include "FdPrintf.h"
 114 #include "Mutex.h"
 115 #include "mozilla/Assertions.h"
 116 #include "mozilla/Atomics.h"
 117 #include "mozilla/Attributes.h"
 118 #include "mozilla/CheckedInt.h"
 119 #include "mozilla/Maybe.h"
 120 #include "mozilla/StackWalk.h"
 121 #include "mozilla/ThreadLocal.h"
 122 #include "mozilla/XorShift128PlusRNG.h"
 123
 124 using namespace mozilla;
 125
 126 //---------------------------------------------------------------------------
 127 // Utilities
 128 //---------------------------------------------------------------------------
 129
 130 #ifdef ANDROID
 131 // Android doesn't have pthread_atfork defined in pthread.h.
 132 extern "C" MOZ_EXPORT int pthread_atfork(void (*)(void), void (*)(void),
 133                                          void (*)(void));
 134 #endif
 135
 136 #ifndef DISALLOW_COPY_AND_ASSIGN
 137 #  define DISALLOW_COPY_AND_ASSIGN(T) \
 138     T(const T&);                      \
 139     void operator=(const T&)
 140 #endif
 141
 142 static malloc_table_t sMallocTable;
 143
 144 // This class provides infallible operations for the small number of heap
 145 // allocations that PHC does for itself. It would be nice if we could use the
 146 // InfallibleAllocPolicy from mozalloc, but PHC cannot use mozalloc.
 147 class InfallibleAllocPolicy {
 148  public:
 149   static void AbortOnFailure(const void* aP) {
 150     if (!aP) {
 151       MOZ_CRASH("PHC failed to allocate");
 152     }
 153   }
 154
 155   template <class T>
 156   static T* new_() {
 157     void* p = sMallocTable.malloc(sizeof(T));
 158     AbortOnFailure(p);
 159     return new (p) T;
 160   }
 161 };
 162
 163 //---------------------------------------------------------------------------
 164 // Stack traces
 165 //---------------------------------------------------------------------------
 166
 167 // This code is similar to the equivalent code within DMD.
 168
 169 class StackTrace : public phc::StackTrace {
 170  public:
 171   StackTrace() : phc::StackTrace() {}
 172
 173   void Clear() { mLength = 0; }
 174
 175   void Fill();
 176
 177  private:
 178   static void StackWalkCallback(uint32_t aFrameNumber, void* aPc, void* aSp,
 179                                 void* aClosure) {
 180     StackTrace* st = (StackTrace*)aClosure;
 181     MOZ_ASSERT(st->mLength < kMaxFrames);
 182     st->mPcs[st->mLength] = aPc;
 183     st->mLength++;
 184     MOZ_ASSERT(st->mLength == aFrameNumber);
 185   }
 186 };
 187
 188 // WARNING WARNING WARNING: this function must only be called when GMut::sMutex
 189 // is *not* locked, otherwise we might get deadlocks.
 190 //
 191 // How? On Windows, MozStackWalk() can lock a mutex, M, from the shared library
 192 // loader. Another thread might call malloc() while holding M locked (when
 193 // loading a shared library) and try to lock GMut::sMutex, causing a deadlock.
 194 // So GMut::sMutex can't be locked during the call to MozStackWalk(). (For
 195 // details, see https://bugzilla.mozilla.org/show_bug.cgi?id=374829#c8. On
 196 // Linux, something similar can happen; see bug 824340. So we just disallow it
 197 // on all platforms.)
 198 //
 199 // In DMD, to avoid this problem we temporarily unlock the equivalent mutex for
 200 // the MozStackWalk() call. But that's grotty, and things are a bit different
 201 // here, so we just require that stack traces be obtained before locking
 202 // GMut::sMutex.
 203 //
 204 // Unfortunately, there is no reliable way at compile-time or run-time to ensure
 205 // this pre-condition. Hence this large comment.
 206 //
 207 void StackTrace::Fill() {
 208   mLength = 0;
 209
 210 #if defined(XP_WIN) && defined(_M_IX86)
 211   // This avoids MozStackWalk(), which causes unusably slow startup on Win32
 212   // when it is called during static initialization (see bug 1241684).
 213   //
 214   // This code is cribbed from the Gecko Profiler, which also uses
 215   // FramePointerStackWalk() on Win32: Registers::SyncPopulate() for the
 216   // frame pointer, and GetStackTop() for the stack end.
 217   CONTEXT context;
 218   RtlCaptureContext(&context);
 219   void** fp = reinterpret_cast<void**>(context.Ebp);
 220
 221   PNT_TIB pTib = reinterpret_cast<PNT_TIB>(NtCurrentTeb());
 222   void* stackEnd = static_cast<void*>(pTib->StackBase);
 223   FramePointerStackWalk(StackWalkCallback, kMaxFrames, this, fp, stackEnd);
 224 #elif defined(XP_MACOSX)
 225   // This avoids MozStackWalk(), which has become unusably slow on Mac due to
 226   // changes in libunwind.
 227   //
 228   // This code is cribbed from the Gecko Profiler, which also uses
 229   // FramePointerStackWalk() on Mac: Registers::SyncPopulate() for the frame
 230   // pointer, and GetStackTop() for the stack end.
 231 #  pragma GCC diagnostic push
 232 #  pragma GCC diagnostic ignored "-Wframe-address"
 233   void** fp = reinterpret_cast<void**>(__builtin_frame_address(1));
 234 #  pragma GCC diagnostic pop
 235   void* stackEnd = pthread_get_stackaddr_np(pthread_self());
 236   FramePointerStackWalk(StackWalkCallback, kMaxFrames, this, fp, stackEnd);
 237 #else
 238   MozStackWalk(StackWalkCallback, nullptr, kMaxFrames, this);
 239 #endif
 240 }
 241
 242 //---------------------------------------------------------------------------
 243 // Logging
 244 //---------------------------------------------------------------------------
 245
 246 // Change this to 1 to enable some PHC logging. Useful for debugging.
 247 #define PHC_LOGGING 0
 248
 249 #if PHC_LOGGING
 250
 251 static size_t GetPid() { return size_t(getpid()); }
 252
 253 static size_t GetTid() {
 254 #  if defined(XP_WIN)
 255   return size_t(GetCurrentThreadId());
 256 #  else
 257   return size_t(pthread_self());
 258 #  endif
 259 }
 260
 261 #  if defined(XP_WIN)
 262 #    define LOG_STDERR \
 263       reinterpret_cast<intptr_t>(GetStdHandle(STD_ERROR_HANDLE))
 264 #  else
 265 #    define LOG_STDERR 2
 266 #  endif
 267 #  define LOG(fmt, ...)                                                \
 268     FdPrintf(LOG_STDERR, "PHC[%zu,%zu,~%zu] " fmt, GetPid(), GetTid(), \
 269              size_t(GAtomic::Now()), __VA_ARGS__)
 270
 271 #else
 272
 273 #  define LOG(fmt, ...)
 274
 275 #endif  // PHC_LOGGING
 276
 277 //---------------------------------------------------------------------------
 278 // Global state
 279 //---------------------------------------------------------------------------
 280
 281 // Throughout this entire file time is measured as the number of sub-page
 282 // allocations performed (by PHC and mozjemalloc combined). `Time` is 64-bit
 283 // because we could have more than 2**32 allocations in a long-running session.
 284 // `Delay` is 32-bit because the delays used within PHC are always much smaller
 285 // than 2**32.
 286 using Time = uint64_t;   // A moment in time.
 287 using Delay = uint32_t;  // A time duration.
 288
 289 // PHC only runs if the page size is 4 KiB; anything more is uncommon and would
 290 // use too much memory. So we hardwire this size for all platforms but macOS
 291 // on ARM processors. For the latter we make an exception because the minimum
 292 // page size supported is 16KiB so there's no way to go below that.
 293 static const size_t kPageSize =
 294 #if defined(XP_MACOSX) && defined(__aarch64__)
 295     16384
 296 #else
 297     4096
 298 #endif
 299     ;
 300
 301 // There are two kinds of page.
 302 // - Allocation pages, from which allocations are made.
 303 // - Guard pages, which are never touched by PHC.
 304 //
 305 // These page kinds are interleaved; each allocation page has a guard page on
 306 // either side.
 307 static const size_t kNumAllocPages = kPageSize == 4096 ? 4096 : 1024;
 308 static const size_t kNumAllPages = kNumAllocPages * 2 + 1;
 309
 310 // The total size of the allocation pages and guard pages.
 311 static const size_t kAllPagesSize = kNumAllPages * kPageSize;
 312
 313 // The junk value used to fill new allocation in debug builds. It's same value
 314 // as the one used by mozjemalloc. PHC applies it unconditionally in debug
 315 // builds. Unlike mozjemalloc, PHC doesn't consult the MALLOC_OPTIONS
 316 // environment variable to possibly change that behaviour.
 317 //
 318 // Also note that, unlike mozjemalloc, PHC doesn't have a poison value for freed
 319 // allocations because freed allocations are protected by OS page protection.
 320 #ifdef DEBUG
 321 const uint8_t kAllocJunk = 0xe4;
 322 #endif
 323
 324 // The maximum time.
 325 static const Time kMaxTime = ~(Time(0));
 326
 327 // The average delay before doing any page allocations at the start of a
 328 // process. Note that roughly 1 million allocations occur in the main process
 329 // while starting the browser. The delay range is 1..kAvgFirstAllocDelay*2.
 330 static const Delay kAvgFirstAllocDelay = 64 * 1024;
 331
 332 // The average delay until the next attempted page allocation, once we get past
 333 // the first delay. The delay range is 1..kAvgAllocDelay*2.
 334 static const Delay kAvgAllocDelay = 16 * 1024;
 335
 336 // The average delay before reusing a freed page. Should be significantly larger
 337 // than kAvgAllocDelay, otherwise there's not much point in having it. The delay
 338 // range is (kAvgAllocDelay / 2)..(kAvgAllocDelay / 2 * 3). This is different to
 339 // the other delay ranges in not having a minimum of 1, because that's such a
 340 // short delay that there is a high likelihood of bad stacks in any crash
 341 // report.
 342 static const Delay kAvgPageReuseDelay = 256 * 1024;
 343
 344 // Truncate aRnd to the range (1 .. AvgDelay*2). If aRnd is random, this
 345 // results in an average value of aAvgDelay + 0.5, which is close enough to
 346 // aAvgDelay. aAvgDelay must be a power-of-two (otherwise it will crash) for
 347 // speed.
 348 template <Delay AvgDelay>
 349 constexpr Delay Rnd64ToDelay(uint64_t aRnd) {
 350   static_assert(IsPowerOfTwo(AvgDelay), "must be a power of two");
 351
 352   return aRnd % (AvgDelay * 2) + 1;
 353 }
 354
 355 // Maps a pointer to a PHC-specific structure:
 356 // - Nothing
 357 // - A guard page (it is unspecified which one)
 358 // - An allocation page (with an index < kNumAllocPages)
 359 //
 360 // The standard way of handling a PtrKind is to check IsNothing(), and if that
 361 // fails, to check IsGuardPage(), and if that fails, to call AllocPage().
 362 class PtrKind {
 363  private:
 364   enum class Tag : uint8_t {
 365     Nothing,
 366     GuardPage,
 367     AllocPage,
 368   };
 369
 370   Tag mTag;
 371   uintptr_t mIndex;  // Only used if mTag == Tag::AllocPage.
 372
 373  public:
 374   // Detect what a pointer points to. This constructor must be fast because it
 375   // is called for every call to free(), realloc(), malloc_usable_size(), and
 376   // jemalloc_ptr_info().
 377   PtrKind(const void* aPtr, const uint8_t* aPagesStart,
 378           const uint8_t* aPagesLimit) {
 379     if (!(aPagesStart <= aPtr && aPtr < aPagesLimit)) {
 380       mTag = Tag::Nothing;
 381     } else {
 382       uintptr_t offset = static_cast<const uint8_t*>(aPtr) - aPagesStart;
 383       uintptr_t allPageIndex = offset / kPageSize;
 384       MOZ_ASSERT(allPageIndex < kNumAllPages);
 385       if (allPageIndex & 1) {
 386         // Odd-indexed pages are allocation pages.
 387         uintptr_t allocPageIndex = allPageIndex / 2;
 388         MOZ_ASSERT(allocPageIndex < kNumAllocPages);
 389         mTag = Tag::AllocPage;
 390         mIndex = allocPageIndex;
 391       } else {
 392         // Even-numbered pages are guard pages.
 393         mTag = Tag::GuardPage;
 394       }
 395     }
 396   }
 397
 398   bool IsNothing() const { return mTag == Tag::Nothing; }
 399   bool IsGuardPage() const { return mTag == Tag::GuardPage; }
 400
 401   // This should only be called after IsNothing() and IsGuardPage() have been
 402   // checked and failed.
 403   uintptr_t AllocPageIndex() const {
 404     MOZ_RELEASE_ASSERT(mTag == Tag::AllocPage);
 405     return mIndex;
 406   }
 407 };
 408
 409 // Shared, atomic, mutable global state.
 410 class GAtomic {
 411  public:
 412   static void Init(Delay aFirstDelay) {
 413     sAllocDelay = aFirstDelay;
 414
 415     LOG("Initial sAllocDelay <- %zu\n", size_t(aFirstDelay));
 416   }
 417
 418   static Time Now() { return sNow; }
 419
 420   static void IncrementNow() { sNow++; }
 421
 422   // Decrements the delay and returns the decremented value.
 423   static int32_t DecrementDelay() { return --sAllocDelay; }
 424
 425   static void SetAllocDelay(Delay aAllocDelay) { sAllocDelay = aAllocDelay; }
 426
 427  private:
 428   // The current time. Relaxed semantics because it's primarily used for
 429   // determining if an allocation can be recycled yet and therefore it doesn't
 430   // need to be exact.
 431   static Atomic<Time, Relaxed> sNow;
 432
 433   // Delay until the next attempt at a page allocation. See the comment in
 434   // MaybePageAlloc() for an explanation of why it is a signed integer, and why
 435   // it uses ReleaseAcquire semantics.
 436   static Atomic<Delay, ReleaseAcquire> sAllocDelay;
 437 };
 438
 439 Atomic<Time, Relaxed> GAtomic::sNow;
 440 Atomic<Delay, ReleaseAcquire> GAtomic::sAllocDelay;
 441
 442 // Shared, immutable global state. Initialized by replace_init() and never
 443 // changed after that. replace_init() runs early enough that no synchronization
 444 // is needed.
 445 class GConst {
 446  private:
 447   // The bounds of the allocated pages.
 448   uint8_t* const mPagesStart;
 449   uint8_t* const mPagesLimit;
 450
 451   // Allocates the allocation pages and the guard pages, contiguously.
 452   uint8_t* AllocAllPages() {
 453     // Allocate the pages so that they are inaccessible. They are never freed,
 454     // because it would happen at process termination when it would be of little
 455     // use.
 456     void* pages =
 457 #ifdef XP_WIN
 458         VirtualAlloc(nullptr, kAllPagesSize, MEM_RESERVE, PAGE_NOACCESS);
 459 #else
 460         mmap(nullptr, kAllPagesSize, PROT_NONE, MAP_ANONYMOUS | MAP_PRIVATE, -1,
 461              0);
 462 #endif
 463     if (!pages) {
 464       MOZ_CRASH();
 465     }
 466
 467     return static_cast<uint8_t*>(pages);
 468   }
 469
 470  public:
 471   GConst()
 472       : mPagesStart(AllocAllPages()), mPagesLimit(mPagesStart + kAllPagesSize) {
 473     LOG("AllocAllPages at %p..%p\n", mPagesStart, mPagesLimit);
 474   }
 475
 476   class PtrKind PtrKind(const void* aPtr) {
 477     class PtrKind pk(aPtr, mPagesStart, mPagesLimit);
 478     return pk;
 479   }
 480
 481   bool IsInFirstGuardPage(const void* aPtr) {
 482     return mPagesStart <= aPtr && aPtr < mPagesStart + kPageSize;
 483   }
 484
 485   // Get the address of the allocation page referred to via an index. Used when
 486   // marking the page as accessible/inaccessible.
 487   uint8_t* AllocPagePtr(uintptr_t aIndex) {
 488     MOZ_ASSERT(aIndex < kNumAllocPages);
 489     // Multiply by two and add one to account for allocation pages *and* guard
 490     // pages.
 491     return mPagesStart + (2 * aIndex + 1) * kPageSize;
 492   }
 493 };
 494
 495 static GConst* gConst;
 496
 497 // On MacOS, the first __thread/thread_local access calls malloc, which leads
 498 // to an infinite loop. So we use pthread-based TLS instead, which somehow
 499 // doesn't have this problem.
 500 #if !defined(XP_DARWIN)
 501 #  define PHC_THREAD_LOCAL(T) MOZ_THREAD_LOCAL(T)
 502 #else
 503 #  define PHC_THREAD_LOCAL(T) \
 504     detail::ThreadLocal<T, detail::ThreadLocalKeyStorage>
 505 #endif
 506
 507 // Thread-local state.
 508 class GTls {
 509   GTls(const GTls&) = delete;
 510
 511   const GTls& operator=(const GTls&) = delete;
 512
 513   // When true, PHC does as little as possible.
 514   //
 515   // (a) It does not allocate any new page allocations.
 516   //
 517   // (b) It avoids doing any operations that might call malloc/free/etc., which
 518   //     would cause re-entry into PHC. (In practice, MozStackWalk() is the
 519   //     only such operation.) Note that calls to the functions in sMallocTable
 520   //     are ok.
 521   //
 522   // For example, replace_malloc() will just fall back to mozjemalloc. However,
 523   // operations involving existing allocations are more complex, because those
 524   // existing allocations may be page allocations. For example, if
 525   // replace_free() is passed a page allocation on a PHC-disabled thread, it
 526   // will free the page allocation in the usual way, but it will get a dummy
 527   // freeStack in order to avoid calling MozStackWalk(), as per (b) above.
 528   //
 529   // This single disabling mechanism has two distinct uses.
 530   //
 531   // - It's used to prevent re-entry into PHC, which can cause correctness
 532   //   problems. For example, consider this sequence.
 533   //
 534   //   1. enter replace_free()
 535   //   2. which calls PageFree()
 536   //   3. which calls MozStackWalk()
 537   //   4. which locks a mutex M, and then calls malloc
 538   //   5. enter replace_malloc()
 539   //   6. which calls MaybePageAlloc()
 540   //   7. which calls MozStackWalk()
 541   //   8. which (re)locks a mutex M --> deadlock
 542   //
 543   //   We avoid this sequence by "disabling" the thread in PageFree() (at step
 544   //   2), which causes MaybePageAlloc() to fail, avoiding the call to
 545   //   MozStackWalk() (at step 7).
 546   //
 547   //   In practice, realloc or free of a PHC allocation is unlikely on a thread
 548   //   that is disabled because of this use: MozStackWalk() will probably only
 549   //   realloc/free allocations that it allocated itself, but those won't be
 550   //   page allocations because PHC is disabled before calling MozStackWalk().
 551   //
 552   //   (Note that MaybePageAlloc() could safely do a page allocation so long as
 553   //   it avoided calling MozStackWalk() by getting a dummy allocStack. But it
 554   //   wouldn't be useful, and it would prevent the second use below.)
 555   //
 556   // - It's used to prevent PHC allocations in some tests that rely on
 557   //   mozjemalloc's exact allocation behaviour, which PHC does not replicate
 558   //   exactly. (Note that (b) isn't necessary for this use -- MozStackWalk()
 559   //   could be safely called -- but it is necessary for the first use above.)
 560   //
 561   static PHC_THREAD_LOCAL(bool) tlsIsDisabled;
 562
 563  public:
 564   static void Init() {
 565     if (!tlsIsDisabled.init()) {
 566       MOZ_CRASH();
 567     }
 568   }
 569
 570   static void DisableOnCurrentThread() {
 571     MOZ_ASSERT(!GTls::tlsIsDisabled.get());
 572     tlsIsDisabled.set(true);
 573   }
 574
 575   static void EnableOnCurrentThread() {
 576     MOZ_ASSERT(GTls::tlsIsDisabled.get());
 577     tlsIsDisabled.set(false);
 578   }
 579
 580   static bool IsDisabledOnCurrentThread() { return tlsIsDisabled.get(); }
 581 };
 582
 583 PHC_THREAD_LOCAL(bool) GTls::tlsIsDisabled;
 584
 585 class AutoDisableOnCurrentThread {
 586   AutoDisableOnCurrentThread(const AutoDisableOnCurrentThread&) = delete;
 587
 588   const AutoDisableOnCurrentThread& operator=(
 589       const AutoDisableOnCurrentThread&) = delete;
 590
 591  public:
 592   explicit AutoDisableOnCurrentThread() { GTls::DisableOnCurrentThread(); }
 593   ~AutoDisableOnCurrentThread() { GTls::EnableOnCurrentThread(); }
 594 };
 595
 596 // This type is used as a proof-of-lock token, to make it clear which functions
 597 // require sMutex to be locked.
 598 using GMutLock = const MutexAutoLock&;
 599
 600 // Shared, mutable global state. Protected by sMutex; all accessing functions
 601 // take a GMutLock as proof that sMutex is held.
 602 class GMut {
 603   enum class AllocPageState {
 604     NeverAllocated = 0,
 605     InUse = 1,
 606     Freed = 2,
 607   };
 608
 609   // Metadata for each allocation page.
 610   class AllocPageInfo {
 611    public:
 612     AllocPageInfo()
 613         : mState(AllocPageState::NeverAllocated),
 614           mArenaId(),
 615           mBaseAddr(nullptr),
 616           mAllocStack(),
 617           mFreeStack(),
 618           mReuseTime(0) {}
 619
 620     // The current allocation page state.
 621     AllocPageState mState;
 622
 623     // The arena that the allocation is nominally from. This isn't meaningful
 624     // within PHC, which has no arenas. But it is necessary for reallocation of
 625     // page allocations as normal allocations, such as in this code:
 626     //
 627     //   p = moz_arena_malloc(arenaId, 4096);
 628     //   realloc(p, 8192);
 629     //
 630     // The realloc is more than one page, and thus too large for PHC to handle.
 631     // Therefore, if PHC handles the first allocation, it must ask mozjemalloc
 632     // to allocate the 8192 bytes in the correct arena, and to do that, it must
 633     // call sMallocTable.moz_arena_malloc with the correct arenaId under the
 634     // covers. Therefore it must record that arenaId.
 635     //
 636     // This field is also needed for jemalloc_ptr_info() to work, because it
 637     // also returns the arena ID (but only in debug builds).
 638     //
 639     // - NeverAllocated: must be 0.
 640     // - InUse | Freed: can be any valid arena ID value.
 641     Maybe<arena_id_t> mArenaId;
 642
 643     // The starting address of the allocation. Will not be the same as the page
 644     // address unless the allocation is a full page.
 645     // - NeverAllocated: must be 0.
 646     // - InUse | Freed: must be within the allocation page.
 647     uint8_t* mBaseAddr;
 648
 649     // Usable size is computed as the number of bytes between the pointer and
 650     // the end of the allocation page. This might be bigger than the requested
 651     // size, especially if an outsized alignment is requested.
 652     size_t UsableSize() const {
 653       return mState == AllocPageState::NeverAllocated
 654                  ? 0
 655                  : kPageSize - (reinterpret_cast<uintptr_t>(mBaseAddr) &
 656                                 (kPageSize - 1));
 657     }
 658
 659     // The internal fragmentation for this allocation.
 660     size_t FragmentationBytes() const {
 661       MOZ_ASSERT(kPageSize >= UsableSize());
 662       return mState == AllocPageState::InUse ? kPageSize - UsableSize() : 0;
 663     }
 664
 665     // The allocation stack.
 666     // - NeverAllocated: Nothing.
 667     // - InUse | Freed: Some.
 668     Maybe<StackTrace> mAllocStack;
 669
 670     // The free stack.
 671     // - NeverAllocated | InUse: Nothing.
 672     // - Freed: Some.
 673     Maybe<StackTrace> mFreeStack;
 674
 675     // The time at which the page is available for reuse, as measured against
 676     // GAtomic::sNow. When the page is in use this value will be kMaxTime.
 677     // - NeverAllocated: must be 0.
 678     // - InUse: must be kMaxTime.
 679     // - Freed: must be > 0 and < kMaxTime.
 680     Time mReuseTime;
 681   };
 682
 683  public:
 684   // The mutex that protects the other members.
 685   static Mutex sMutex MOZ_UNANNOTATED;
 686
 687   GMut() : mRNG(RandomSeed<0>(), RandomSeed<1>()), mAllocPages() {
 688     sMutex.Init();
 689   }
 690
 691   uint64_t Random64(GMutLock) { return mRNG.next(); }
 692
 693   bool IsPageInUse(GMutLock, uintptr_t aIndex) {
 694     return mAllocPages[aIndex].mState == AllocPageState::InUse;
 695   }
 696
 697   // Is the page free? And if so, has enough time passed that we can use it?
 698   bool IsPageAllocatable(GMutLock, uintptr_t aIndex, Time aNow) {
 699     const AllocPageInfo& page = mAllocPages[aIndex];
 700     return page.mState != AllocPageState::InUse && aNow >= page.mReuseTime;
 701   }
 702
 703   // Get the address of the allocation page referred to via an index. Used
 704   // when checking pointers against page boundaries.
 705   uint8_t* AllocPageBaseAddr(GMutLock, uintptr_t aIndex) {
 706     return mAllocPages[aIndex].mBaseAddr;
 707   }
 708
 709   Maybe<arena_id_t> PageArena(GMutLock aLock, uintptr_t aIndex) {
 710     const AllocPageInfo& page = mAllocPages[aIndex];
 711     AssertAllocPageInUse(aLock, page);
 712
 713     return page.mArenaId;
 714   }
 715
 716   size_t PageUsableSize(GMutLock aLock, uintptr_t aIndex) {
 717     const AllocPageInfo& page = mAllocPages[aIndex];
 718     AssertAllocPageInUse(aLock, page);
 719
 720     return page.UsableSize();
 721   }
 722
 723   // The total fragmentation in PHC
 724   size_t FragmentationBytes() const {
 725     size_t sum = 0;
 726     for (const auto& page : mAllocPages) {
 727       sum += page.FragmentationBytes();
 728     }
 729     return sum;
 730   }
 731
 732   void SetPageInUse(GMutLock aLock, uintptr_t aIndex,
 733                     const Maybe<arena_id_t>& aArenaId, uint8_t* aBaseAddr,
 734                     const StackTrace& aAllocStack) {
 735     AllocPageInfo& page = mAllocPages[aIndex];
 736     AssertAllocPageNotInUse(aLock, page);
 737
 738     page.mState = AllocPageState::InUse;
 739     page.mArenaId = aArenaId;
 740     page.mBaseAddr = aBaseAddr;
 741     page.mAllocStack = Some(aAllocStack);
 742     page.mFreeStack = Nothing();
 743     page.mReuseTime = kMaxTime;
 744   }
 745
 746 #if PHC_LOGGING
 747   Time GetFreeTime(uintptr_t aIndex) const { return mFreeTime[aIndex]; }
 748 #endif
 749
 750   void ResizePageInUse(GMutLock aLock, uintptr_t aIndex,
 751                        const Maybe<arena_id_t>& aArenaId, uint8_t* aNewBaseAddr,
 752                        const StackTrace& aAllocStack) {
 753     AllocPageInfo& page = mAllocPages[aIndex];
 754     AssertAllocPageInUse(aLock, page);
 755
 756     // page.mState is not changed.
 757     if (aArenaId.isSome()) {
 758       // Crash if the arenas don't match.
 759       MOZ_RELEASE_ASSERT(page.mArenaId == aArenaId);
 760     }
 761     page.mBaseAddr = aNewBaseAddr;
 762     // We could just keep the original alloc stack, but the realloc stack is
 763     // more recent and therefore seems more useful.
 764     page.mAllocStack = Some(aAllocStack);
 765     // page.mFreeStack is not changed.
 766     // page.mReuseTime is not changed.
 767   };
 768
 769   void SetPageFreed(GMutLock aLock, uintptr_t aIndex,
 770                     const Maybe<arena_id_t>& aArenaId,
 771                     const StackTrace& aFreeStack, Delay aReuseDelay) {
 772     AllocPageInfo& page = mAllocPages[aIndex];
 773     AssertAllocPageInUse(aLock, page);
 774
 775     page.mState = AllocPageState::Freed;
 776
 777     // page.mArenaId is left unchanged, for jemalloc_ptr_info() calls that
 778     // occur after freeing (e.g. in the PtrInfo test in TestJemalloc.cpp).
 779     if (aArenaId.isSome()) {
 780       // Crash if the arenas don't match.
 781       MOZ_RELEASE_ASSERT(page.mArenaId == aArenaId);
 782     }
 783
 784     // page.musableSize is left unchanged, for reporting on UAF, and for
 785     // jemalloc_ptr_info() calls that occur after freeing (e.g. in the PtrInfo
 786     // test in TestJemalloc.cpp).
 787
 788     // page.mAllocStack is left unchanged, for reporting on UAF.
 789
 790     page.mFreeStack = Some(aFreeStack);
 791     Time now = GAtomic::Now();
 792 #if PHC_LOGGING
 793     mFreeTime[aIndex] = now;
 794 #endif
 795     page.mReuseTime = now + aReuseDelay;
 796   }
 797
 798   static void CrashOnGuardPage(void* aPtr) {
 799     // An operation on a guard page? This is a bounds violation. Deliberately
 800     // touch the page in question, to cause a crash that triggers the usual PHC
 801     // machinery.
 802     LOG("CrashOnGuardPage(%p), bounds violation\n", aPtr);
 803     *static_cast<uint8_t*>(aPtr) = 0;
 804     MOZ_CRASH("unreachable");
 805   }
 806
 807   void EnsureValidAndInUse(GMutLock, void* aPtr, uintptr_t aIndex)
 808       MOZ_REQUIRES(sMutex) {
 809     const AllocPageInfo& page = mAllocPages[aIndex];
 810
 811     // The pointer must point to the start of the allocation.
 812     MOZ_RELEASE_ASSERT(page.mBaseAddr == aPtr);
 813
 814     if (page.mState == AllocPageState::Freed) {
 815       LOG("EnsureValidAndInUse(%p), use-after-free\n", aPtr);
 816       // An operation on a freed page? This is a particular kind of
 817       // use-after-free. Deliberately touch the page in question, in order to
 818       // cause a crash that triggers the usual PHC machinery. But unlock sMutex
 819       // first, because that self-same PHC machinery needs to re-lock it, and
 820       // the crash causes non-local control flow so sMutex won't be unlocked
 821       // the normal way in the caller.
 822       sMutex.Unlock();
 823       *static_cast<uint8_t*>(aPtr) = 0;
 824       MOZ_CRASH("unreachable");
 825     }
 826   }
 827
 828   void FillAddrInfo(GMutLock, uintptr_t aIndex, const void* aBaseAddr,
 829                     bool isGuardPage, phc::AddrInfo& aOut) {
 830     const AllocPageInfo& page = mAllocPages[aIndex];
 831     if (isGuardPage) {
 832       aOut.mKind = phc::AddrInfo::Kind::GuardPage;
 833     } else {
 834       switch (page.mState) {
 835         case AllocPageState::NeverAllocated:
 836           aOut.mKind = phc::AddrInfo::Kind::NeverAllocatedPage;
 837           break;
 838
 839         case AllocPageState::InUse:
 840           aOut.mKind = phc::AddrInfo::Kind::InUsePage;
 841           break;
 842
 843         case AllocPageState::Freed:
 844           aOut.mKind = phc::AddrInfo::Kind::FreedPage;
 845           break;
 846
 847         default:
 848           MOZ_CRASH();
 849       }
 850     }
 851     aOut.mBaseAddr = page.mBaseAddr;
 852     aOut.mUsableSize = page.UsableSize();
 853     aOut.mAllocStack = page.mAllocStack;
 854     aOut.mFreeStack = page.mFreeStack;
 855   }
 856
 857   void FillJemallocPtrInfo(GMutLock, const void* aPtr, uintptr_t aIndex,
 858                            jemalloc_ptr_info_t* aInfo) {
 859     const AllocPageInfo& page = mAllocPages[aIndex];
 860     switch (page.mState) {
 861       case AllocPageState::NeverAllocated:
 862         break;
 863
 864       case AllocPageState::InUse: {
 865         // Only return TagLiveAlloc if the pointer is within the bounds of the
 866         // allocation's usable size.
 867         uint8_t* base = page.mBaseAddr;
 868         uint8_t* limit = base + page.UsableSize();
 869         if (base <= aPtr && aPtr < limit) {
 870           *aInfo = {TagLiveAlloc, page.mBaseAddr, page.UsableSize(),
 871                     page.mArenaId.valueOr(0)};
 872           return;
 873         }
 874         break;
 875       }
 876
 877       case AllocPageState::Freed: {
 878         // Only return TagFreedAlloc if the pointer is within the bounds of the
 879         // former allocation's usable size.
 880         uint8_t* base = page.mBaseAddr;
 881         uint8_t* limit = base + page.UsableSize();
 882         if (base <= aPtr && aPtr < limit) {
 883           *aInfo = {TagFreedAlloc, page.mBaseAddr, page.UsableSize(),
 884                     page.mArenaId.valueOr(0)};
 885           return;
 886         }
 887         break;
 888       }
 889
 890       default:
 891         MOZ_CRASH();
 892     }
 893
 894     // Pointers into guard pages will end up here, as will pointers into
 895     // allocation pages that aren't within the allocation's bounds.
 896     *aInfo = {TagUnknown, nullptr, 0, 0};
 897   }
 898
 899 #ifndef XP_WIN
 900   static void prefork() MOZ_NO_THREAD_SAFETY_ANALYSIS { sMutex.Lock(); }
 901   static void postfork_parent() MOZ_NO_THREAD_SAFETY_ANALYSIS {
 902     sMutex.Unlock();
 903   }
 904   static void postfork_child() { sMutex.Init(); }
 905 #endif
 906
 907 #if PHC_LOGGING
 908   void IncPageAllocHits(GMutLock) { mPageAllocHits++; }
 909   void IncPageAllocMisses(GMutLock) { mPageAllocMisses++; }
 910 #else
 911   void IncPageAllocHits(GMutLock) {}
 912   void IncPageAllocMisses(GMutLock) {}
 913 #endif
 914
 915 #if PHC_LOGGING
 916   struct PageStats {
 917     size_t mNumAlloced = 0;
 918     size_t mNumFreed = 0;
 919   };
 920
 921   PageStats GetPageStats(GMutLock) {
 922     PageStats stats;
 923
 924     for (const auto& page : mAllocPages) {
 925       stats.mNumAlloced += page.mState == AllocPageState::InUse ? 1 : 0;
 926       stats.mNumFreed += page.mState == AllocPageState::Freed ? 1 : 0;
 927     }
 928
 929     return stats;
 930   }
 931
 932   size_t PageAllocHits(GMutLock) { return mPageAllocHits; }
 933   size_t PageAllocAttempts(GMutLock) {
 934     return mPageAllocHits + mPageAllocMisses;
 935   }
 936
 937   // This is an integer because FdPrintf only supports integer printing.
 938   size_t PageAllocHitRate(GMutLock) {
 939     return mPageAllocHits * 100 / (mPageAllocHits + mPageAllocMisses);
 940   }
 941 #endif
 942
 943  private:
 944   template <int N>
 945   uint64_t RandomSeed() {
 946     // An older version of this code used RandomUint64() here, but on Mac that
 947     // function uses arc4random(), which can allocate, which would cause
 948     // re-entry, which would be bad. So we just use time() and a local variable
 949     // address. These are mediocre sources of entropy, but good enough for PHC.
 950     static_assert(N == 0 || N == 1, "must be 0 or 1");
 951     uint64_t seed;
 952     if (N == 0) {
 953       time_t t = time(nullptr);
 954       seed = t ^ (t << 32);
 955     } else {
 956       seed = uintptr_t(&seed) ^ (uintptr_t(&seed) << 32);
 957     }
 958     return seed;
 959   }
 960
 961   void AssertAllocPageInUse(GMutLock, const AllocPageInfo& aPage) {
 962     MOZ_ASSERT(aPage.mState == AllocPageState::InUse);
 963     // There is nothing to assert about aPage.mArenaId.
 964     MOZ_ASSERT(aPage.mBaseAddr);
 965     MOZ_ASSERT(aPage.UsableSize() > 0);
 966     MOZ_ASSERT(aPage.mAllocStack.isSome());
 967     MOZ_ASSERT(aPage.mFreeStack.isNothing());
 968     MOZ_ASSERT(aPage.mReuseTime == kMaxTime);
 969   }
 970
 971   void AssertAllocPageNotInUse(GMutLock, const AllocPageInfo& aPage) {
 972     // We can assert a lot about `NeverAllocated` pages, but not much about
 973     // `Freed` pages.
 974 #ifdef DEBUG
 975     bool isFresh = aPage.mState == AllocPageState::NeverAllocated;
 976     MOZ_ASSERT(isFresh || aPage.mState == AllocPageState::Freed);
 977     MOZ_ASSERT_IF(isFresh, aPage.mArenaId == Nothing());
 978     MOZ_ASSERT(isFresh == (aPage.mBaseAddr == nullptr));
 979     MOZ_ASSERT(isFresh == (aPage.mAllocStack.isNothing()));
 980     MOZ_ASSERT(isFresh == (aPage.mFreeStack.isNothing()));
 981     MOZ_ASSERT(aPage.mReuseTime != kMaxTime);
 982 #endif
 983   }
 984
 985   // RNG for deciding which allocations to treat specially. It doesn't need to
 986   // be high quality.
 987   //
 988   // This is a raw pointer for the reason explained in the comment above
 989   // GMut's constructor. Don't change it to UniquePtr or anything like that.
 990   non_crypto::XorShift128PlusRNG mRNG;
 991
 992   AllocPageInfo mAllocPages[kNumAllocPages];
 993 #if PHC_LOGGING
 994   Time mFreeTime[kNumAllocPages];
 995
 996   // How many allocations that could have been page allocs actually were? As
 997   // constrained kNumAllocPages. If the hit ratio isn't close to 100% it's
 998   // likely that the global constants are poorly chosen.
 999   size_t mPageAllocHits = 0;
1000   size_t mPageAllocMisses = 0;
1001 #endif
1002 };
1003
1004 Mutex GMut::sMutex;
1005
1006 static GMut* gMut;
1007
1008 //---------------------------------------------------------------------------
1009 // Page allocation operations
1010 //---------------------------------------------------------------------------
1011
1012 // Attempt a page allocation if the time and the size are right. Allocated
1013 // memory is zeroed if aZero is true. On failure, the caller should attempt a
1014 // normal allocation via sMallocTable. Can be called in a context where
1015 // GMut::sMutex is locked.
1016 static void* MaybePageAlloc(const Maybe<arena_id_t>& aArenaId, size_t aReqSize,
1017                             size_t aAlignment, bool aZero) {
1018   MOZ_ASSERT(IsPowerOfTwo(aAlignment));
1019
1020   if (aReqSize > kPageSize) {
1021     return nullptr;
1022   }
1023
1024   GAtomic::IncrementNow();
1025
1026   // Decrement the delay. If it's zero, we do a page allocation and reset the
1027   // delay to a random number. Because the assignment to the random number isn't
1028   // atomic w.r.t. the decrement, we might have a sequence like this:
1029   //
1030   //     Thread 1                      Thread 2           Thread 3
1031   //     --------                      --------           --------
1032   // (a) newDelay = --sAllocDelay (-> 0)
1033   // (b)                               --sAllocDelay (-> -1)
1034   // (c) (newDelay != 0) fails
1035   // (d)                                                  --sAllocDelay (-> -2)
1036   // (e) sAllocDelay = new_random_number()
1037   //
1038   // It's critical that sAllocDelay has ReleaseAcquire semantics, because that
1039   // guarantees that exactly one thread will see sAllocDelay have the value 0.
1040   // (Relaxed semantics wouldn't guarantee that.)
1041   //
1042   // It's also nice that sAllocDelay is signed, given that we can decrement to
1043   // below zero. (Strictly speaking, an unsigned integer would also work due
1044   // to wrapping, but a signed integer is conceptually cleaner.)
1045   //
1046   // Finally, note that the decrements that occur between (a) and (e) above are
1047   // effectively ignored, because (e) clobbers them. This shouldn't be a
1048   // problem; it effectively just adds a little more randomness to
1049   // new_random_number(). An early version of this code tried to account for
1050   // these decrements by doing `sAllocDelay += new_random_number()`. However, if
1051   // new_random_value() is small, the number of decrements between (a) and (e)
1052   // can easily exceed it, whereupon sAllocDelay ends up negative after
1053   // `sAllocDelay += new_random_number()`, and the zero-check never succeeds
1054   // again. (At least, not until sAllocDelay wraps around on overflow, which
1055   // would take a very long time indeed.)
1056   //
1057   int32_t newDelay = GAtomic::DecrementDelay();
1058   if (newDelay != 0) {
1059     return nullptr;
1060   }
1061
1062   if (GTls::IsDisabledOnCurrentThread()) {
1063     return nullptr;
1064   }
1065
1066   // Disable on this thread *before* getting the stack trace.
1067   AutoDisableOnCurrentThread disable;
1068
1069   // Get the stack trace *before* locking the mutex. If we return nullptr then
1070   // it was a waste, but it's not so frequent, and doing a stack walk while
1071   // the mutex is locked is problematic (see the big comment on
1072   // StackTrace::Fill() for details).
1073   StackTrace allocStack;
1074   allocStack.Fill();
1075
1076   MutexAutoLock lock(GMut::sMutex);
1077
1078   Time now = GAtomic::Now();
1079   Delay newAllocDelay = Rnd64ToDelay<kAvgAllocDelay>(gMut->Random64(lock));
1080
1081   // We start at a random page alloc and wrap around, to ensure pages get even
1082   // amounts of use.
1083   uint8_t* ptr = nullptr;
1084   uint8_t* pagePtr = nullptr;
1085   for (uintptr_t n = 0, i = size_t(gMut->Random64(lock)) % kNumAllocPages;
1086        n < kNumAllocPages; n++, i = (i + 1) % kNumAllocPages) {
1087     if (!gMut->IsPageAllocatable(lock, i, now)) {
1088       continue;
1089     }
1090
1091 #if PHC_LOGGING
1092     Time lifetime = 0;
1093 #endif
1094     pagePtr = gConst->AllocPagePtr(i);
1095     MOZ_ASSERT(pagePtr);
1096     bool ok =
1097 #ifdef XP_WIN
1098         !!VirtualAlloc(pagePtr, kPageSize, MEM_COMMIT, PAGE_READWRITE);
1099 #else
1100         mprotect(pagePtr, kPageSize, PROT_READ | PROT_WRITE) == 0;
1101 #endif
1102
1103     if (!ok) {
1104       pagePtr = nullptr;
1105       continue;
1106     }
1107
1108     size_t usableSize = sMallocTable.malloc_good_size(aReqSize);
1109     MOZ_ASSERT(usableSize > 0);
1110
1111     // Put the allocation as close to the end of the page as possible,
1112     // allowing for alignment requirements.
1113     ptr = pagePtr + kPageSize - usableSize;
1114     if (aAlignment != 1) {
1115       ptr = reinterpret_cast<uint8_t*>(
1116           (reinterpret_cast<uintptr_t>(ptr) & ~(aAlignment - 1)));
1117     }
1118
1119 #if PHC_LOGGING
1120     Time then = gMut->GetFreeTime(i);
1121     lifetime = then != 0 ? now - then : 0;
1122 #endif
1123
1124     gMut->SetPageInUse(lock, i, aArenaId, ptr, allocStack);
1125
1126     if (aZero) {
1127       memset(ptr, 0, usableSize);
1128     } else {
1129 #ifdef DEBUG
1130       memset(ptr, kAllocJunk, usableSize);
1131 #endif
1132     }
1133
1134     gMut->IncPageAllocHits(lock);
1135 #if PHC_LOGGING
1136     GMut::PageStats stats = gMut->GetPageStats(lock);
1137 #endif
1138     LOG("PageAlloc(%zu, %zu) -> %p[%zu]/%p (%zu) (z%zu), sAllocDelay <- %zu, "
1139         "fullness %zu/%zu/%zu, hits %zu/%zu (%zu%%), lifetime %zu\n",
1140         aReqSize, aAlignment, pagePtr, i, ptr, usableSize, size_t(aZero),
1141         size_t(newAllocDelay), stats.mNumAlloced, stats.mNumFreed,
1142         kNumAllocPages, gMut->PageAllocHits(lock),
1143         gMut->PageAllocAttempts(lock), gMut->PageAllocHitRate(lock), lifetime);
1144     break;
1145   }
1146
1147   if (!pagePtr) {
1148     // No pages are available, or VirtualAlloc/mprotect failed.
1149     gMut->IncPageAllocMisses(lock);
1150 #if PHC_LOGGING
1151     GMut::PageStats stats = gMut->GetPageStats(lock);
1152 #endif
1153     LOG("No PageAlloc(%zu, %zu), sAllocDelay <- %zu, fullness %zu/%zu/%zu, "
1154         "hits %zu/%zu (%zu%%)\n",
1155         aReqSize, aAlignment, size_t(newAllocDelay), stats.mNumAlloced,
1156         stats.mNumFreed, kNumAllocPages, gMut->PageAllocHits(lock),
1157         gMut->PageAllocAttempts(lock), gMut->PageAllocHitRate(lock));
1158   }
1159
1160   // Set the new alloc delay.
1161   GAtomic::SetAllocDelay(newAllocDelay);
1162
1163   return ptr;
1164 }
1165
1166 static void FreePage(GMutLock aLock, uintptr_t aIndex,
1167                      const Maybe<arena_id_t>& aArenaId,
1168                      const StackTrace& aFreeStack, Delay aReuseDelay) {
1169   void* pagePtr = gConst->AllocPagePtr(aIndex);
1170
1171 #ifdef XP_WIN
1172   if (!VirtualFree(pagePtr, kPageSize, MEM_DECOMMIT)) {
1173     MOZ_CRASH("VirtualFree failed");
1174   }
1175 #else
1176   if (mmap(pagePtr, kPageSize, PROT_NONE, MAP_FIXED | MAP_PRIVATE | MAP_ANON,
1177            -1, 0) == MAP_FAILED) {
1178     MOZ_CRASH("mmap failed");
1179   }
1180 #endif
1181
1182   gMut->SetPageFreed(aLock, aIndex, aArenaId, aFreeStack, aReuseDelay);
1183 }
1184
1185 //---------------------------------------------------------------------------
1186 // replace-malloc machinery
1187 //---------------------------------------------------------------------------
1188
1189 // This handles malloc, moz_arena_malloc, and realloc-with-a-nullptr.
1190 MOZ_ALWAYS_INLINE static void* PageMalloc(const Maybe<arena_id_t>& aArenaId,
1191                                           size_t aReqSize) {
1192   void* ptr = MaybePageAlloc(aArenaId, aReqSize, /* aAlignment */ 1,
1193                              /* aZero */ false);
1194   return ptr ? ptr
1195              : (aArenaId.isSome()
1196                     ? sMallocTable.moz_arena_malloc(*aArenaId, aReqSize)
1197                     : sMallocTable.malloc(aReqSize));
1198 }
1199
1200 static void* replace_malloc(size_t aReqSize) {
1201   return PageMalloc(Nothing(), aReqSize);
1202 }
1203
1204 static Delay ReuseDelay(GMutLock aLock) {
1205   return (kAvgPageReuseDelay / 2) +
1206          Rnd64ToDelay<kAvgPageReuseDelay / 2>(gMut->Random64(aLock));
1207 }
1208
1209 // This handles both calloc and moz_arena_calloc.
1210 MOZ_ALWAYS_INLINE static void* PageCalloc(const Maybe<arena_id_t>& aArenaId,
1211                                           size_t aNum, size_t aReqSize) {
1212   CheckedInt<size_t> checkedSize = CheckedInt<size_t>(aNum) * aReqSize;
1213   if (!checkedSize.isValid()) {
1214     return nullptr;
1215   }
1216
1217   void* ptr = MaybePageAlloc(aArenaId, checkedSize.value(), /* aAlignment */ 1,
1218                              /* aZero */ true);
1219   return ptr ? ptr
1220              : (aArenaId.isSome()
1221                     ? sMallocTable.moz_arena_calloc(*aArenaId, aNum, aReqSize)
1222                     : sMallocTable.calloc(aNum, aReqSize));
1223 }
1224
1225 static void* replace_calloc(size_t aNum, size_t aReqSize) {
1226   return PageCalloc(Nothing(), aNum, aReqSize);
1227 }
1228
1229 // This function handles both realloc and moz_arena_realloc.
1230 //
1231 // As always, realloc is complicated, and doubly so when there are two
1232 // different kinds of allocations in play. Here are the possible transitions,
1233 // and what we do in practice.
1234 //
1235 // - normal-to-normal: This is straightforward and obviously necessary.
1236 //
1237 // - normal-to-page: This is disallowed because it would require getting the
1238 //   arenaId of the normal allocation, which isn't possible in non-DEBUG builds
1239 //   for security reasons.
1240 //
1241 // - page-to-page: This is done whenever possible, i.e. whenever the new size
1242 //   is less than or equal to 4 KiB. This choice counterbalances the
1243 //   disallowing of normal-to-page allocations, in order to avoid biasing
1244 //   towards or away from page allocations. It always occurs in-place.
1245 //
1246 // - page-to-normal: this is done only when necessary, i.e. only when the new
1247 //   size is greater than 4 KiB. This choice naturally flows from the
1248 //   prior choice on page-to-page transitions.
1249 //
1250 // In summary: realloc doesn't change the allocation kind unless it must.
1251 //
1252 MOZ_ALWAYS_INLINE static void* PageRealloc(const Maybe<arena_id_t>& aArenaId,
1253                                            void* aOldPtr, size_t aNewSize) {
1254   if (!aOldPtr) {
1255     // Null pointer. Treat like malloc(aNewSize).
1256     return PageMalloc(aArenaId, aNewSize);
1257   }
1258
1259   PtrKind pk = gConst->PtrKind(aOldPtr);
1260   if (pk.IsNothing()) {
1261     // A normal-to-normal transition.
1262     return aArenaId.isSome()
1263                ? sMallocTable.moz_arena_realloc(*aArenaId, aOldPtr, aNewSize)
1264                : sMallocTable.realloc(aOldPtr, aNewSize);
1265   }
1266
1267   if (pk.IsGuardPage()) {
1268     GMut::CrashOnGuardPage(aOldPtr);
1269   }
1270
1271   // At this point we know we have an allocation page.
1272   uintptr_t index = pk.AllocPageIndex();
1273
1274   // A page-to-something transition.
1275
1276   // Note that `disable` has no effect unless it is emplaced below.
1277   Maybe<AutoDisableOnCurrentThread> disable;
1278   // Get the stack trace *before* locking the mutex.
1279   StackTrace stack;
1280   if (GTls::IsDisabledOnCurrentThread()) {
1281     // PHC is disabled on this thread. Leave the stack empty.
1282   } else {
1283     // Disable on this thread *before* getting the stack trace.
1284     disable.emplace();
1285     stack.Fill();
1286   }
1287
1288   MutexAutoLock lock(GMut::sMutex);
1289
1290   // Check for realloc() of a freed block.
1291   gMut->EnsureValidAndInUse(lock, aOldPtr, index);
1292
1293   if (aNewSize <= kPageSize) {
1294     // A page-to-page transition. Just keep using the page allocation. We do
1295     // this even if the thread is disabled, because it doesn't create a new
1296     // page allocation. Note that ResizePageInUse() checks aArenaId.
1297     //
1298     // Move the bytes with memmove(), because the old allocation and the new
1299     // allocation overlap. Move the usable size rather than the requested size,
1300     // because the user might have used malloc_usable_size() and filled up the
1301     // usable size.
1302     size_t oldUsableSize = gMut->PageUsableSize(lock, index);
1303     size_t newUsableSize = sMallocTable.malloc_good_size(aNewSize);
1304     uint8_t* pagePtr = gConst->AllocPagePtr(index);
1305     uint8_t* newPtr = pagePtr + kPageSize - newUsableSize;
1306     memmove(newPtr, aOldPtr, std::min(oldUsableSize, aNewSize));
1307     gMut->ResizePageInUse(lock, index, aArenaId, newPtr, stack);
1308     LOG("PageRealloc-Reuse(%p, %zu) -> %p\n", aOldPtr, aNewSize, newPtr);
1309     return newPtr;
1310   }
1311
1312   // A page-to-normal transition (with the new size greater than page-sized).
1313   // (Note that aArenaId is checked below.)
1314   void* newPtr;
1315   if (aArenaId.isSome()) {
1316     newPtr = sMallocTable.moz_arena_malloc(*aArenaId, aNewSize);
1317   } else {
1318     Maybe<arena_id_t> oldArenaId = gMut->PageArena(lock, index);
1319     newPtr = (oldArenaId.isSome()
1320                   ? sMallocTable.moz_arena_malloc(*oldArenaId, aNewSize)
1321                   : sMallocTable.malloc(aNewSize));
1322   }
1323   if (!newPtr) {
1324     return nullptr;
1325   }
1326
1327   MOZ_ASSERT(aNewSize > kPageSize);
1328
1329   Delay reuseDelay = ReuseDelay(lock);
1330
1331   // Copy the usable size rather than the requested size, because the user
1332   // might have used malloc_usable_size() and filled up the usable size. Note
1333   // that FreePage() checks aArenaId (via SetPageFreed()).
1334   size_t oldUsableSize = gMut->PageUsableSize(lock, index);
1335   memcpy(newPtr, aOldPtr, std::min(oldUsableSize, aNewSize));
1336   FreePage(lock, index, aArenaId, stack, reuseDelay);
1337   LOG("PageRealloc-Free(%p[%zu], %zu) -> %p, %zu delay, reuse at ~%zu\n",
1338       aOldPtr, index, aNewSize, newPtr, size_t(reuseDelay),
1339       size_t(GAtomic::Now()) + reuseDelay);
1340
1341   return newPtr;
1342 }
1343
1344 static void* replace_realloc(void* aOldPtr, size_t aNewSize) {
1345   return PageRealloc(Nothing(), aOldPtr, aNewSize);
1346 }
1347
1348 // This handles both free and moz_arena_free.
1349 MOZ_ALWAYS_INLINE static void PageFree(const Maybe<arena_id_t>& aArenaId,
1350                                        void* aPtr) {
1351   PtrKind pk = gConst->PtrKind(aPtr);
1352   if (pk.IsNothing()) {
1353     // Not a page allocation.
1354     return aArenaId.isSome() ? sMallocTable.moz_arena_free(*aArenaId, aPtr)
1355                              : sMallocTable.free(aPtr);
1356   }
1357
1358   if (pk.IsGuardPage()) {
1359     GMut::CrashOnGuardPage(aPtr);
1360   }
1361
1362   // At this point we know we have an allocation page.
1363   uintptr_t index = pk.AllocPageIndex();
1364
1365   // Note that `disable` has no effect unless it is emplaced below.
1366   Maybe<AutoDisableOnCurrentThread> disable;
1367   // Get the stack trace *before* locking the mutex.
1368   StackTrace freeStack;
1369   if (GTls::IsDisabledOnCurrentThread()) {
1370     // PHC is disabled on this thread. Leave the stack empty.
1371   } else {
1372     // Disable on this thread *before* getting the stack trace.
1373     disable.emplace();
1374     freeStack.Fill();
1375   }
1376
1377   MutexAutoLock lock(GMut::sMutex);
1378
1379   // Check for a double-free.
1380   gMut->EnsureValidAndInUse(lock, aPtr, index);
1381
1382   // Note that FreePage() checks aArenaId (via SetPageFreed()).
1383   Delay reuseDelay = ReuseDelay(lock);
1384   FreePage(lock, index, aArenaId, freeStack, reuseDelay);
1385
1386 #if PHC_LOGGING
1387   GMut::PageStats stats = gMut->GetPageStats(lock);
1388 #endif
1389   LOG("PageFree(%p[%zu]), %zu delay, reuse at ~%zu, fullness %zu/%zu/%zu\n",
1390       aPtr, index, size_t(reuseDelay), size_t(GAtomic::Now()) + reuseDelay,
1391       stats.mNumAlloced, stats.mNumFreed, kNumAllocPages);
1392 }
1393
1394 static void replace_free(void* aPtr) { return PageFree(Nothing(), aPtr); }
1395
1396 // This handles memalign and moz_arena_memalign.
1397 MOZ_ALWAYS_INLINE static void* PageMemalign(const Maybe<arena_id_t>& aArenaId,
1398                                             size_t aAlignment,
1399                                             size_t aReqSize) {
1400   MOZ_RELEASE_ASSERT(IsPowerOfTwo(aAlignment));
1401
1402   // PHC can't satisfy an alignment greater than a page size, so fall back to
1403   // mozjemalloc in that case.
1404   void* ptr = nullptr;
1405   if (aAlignment <= kPageSize) {
1406     ptr = MaybePageAlloc(aArenaId, aReqSize, aAlignment, /* aZero */ false);
1407   }
1408   return ptr ? ptr
1409              : (aArenaId.isSome()
1410                     ? sMallocTable.moz_arena_memalign(*aArenaId, aAlignment,
1411                                                       aReqSize)
1412                     : sMallocTable.memalign(aAlignment, aReqSize));
1413 }
1414
1415 static void* replace_memalign(size_t aAlignment, size_t aReqSize) {
1416   return PageMemalign(Nothing(), aAlignment, aReqSize);
1417 }
1418
1419 static size_t replace_malloc_usable_size(usable_ptr_t aPtr) {
1420   PtrKind pk = gConst->PtrKind(aPtr);
1421   if (pk.IsNothing()) {
1422     // Not a page allocation. Measure it normally.
1423     return sMallocTable.malloc_usable_size(aPtr);
1424   }
1425
1426   if (pk.IsGuardPage()) {
1427     GMut::CrashOnGuardPage(const_cast<void*>(aPtr));
1428   }
1429
1430   // At this point we know aPtr lands within an allocation page, due to the
1431   // math done in the PtrKind constructor. But if aPtr points to memory
1432   // before the base address of the allocation, we return 0.
1433   uintptr_t index = pk.AllocPageIndex();
1434
1435   MutexAutoLock lock(GMut::sMutex);
1436
1437   void* pageBaseAddr = gMut->AllocPageBaseAddr(lock, index);
1438
1439   if (MOZ_UNLIKELY(aPtr < pageBaseAddr)) {
1440     return 0;
1441   }
1442
1443   return gMut->PageUsableSize(lock, index);
1444 }
1445
1446 static size_t metadata_size() {
1447   return sMallocTable.malloc_usable_size(gConst) +
1448          sMallocTable.malloc_usable_size(gMut);
1449 }
1450
1451 void replace_jemalloc_stats(jemalloc_stats_t* aStats,
1452                             jemalloc_bin_stats_t* aBinStats) {
1453   sMallocTable.jemalloc_stats_internal(aStats, aBinStats);
1454
1455   // Add all the pages to `mapped`.
1456   size_t mapped = kAllPagesSize;
1457   aStats->mapped += mapped;
1458
1459   size_t allocated = 0;
1460   {
1461     MutexAutoLock lock(GMut::sMutex);
1462
1463     // Add usable space of in-use allocations to `allocated`.
1464     for (size_t i = 0; i < kNumAllocPages; i++) {
1465       if (gMut->IsPageInUse(lock, i)) {
1466         allocated += gMut->PageUsableSize(lock, i);
1467       }
1468     }
1469   }
1470   aStats->allocated += allocated;
1471
1472   // guards is the gap between `allocated` and `mapped`. In some ways this
1473   // almost fits into aStats->wasted since it feels like wasted memory. However
1474   // wasted should only include committed memory and these guard pages are
1475   // uncommitted. Therefore we don't include it anywhere.
1476   // size_t guards = mapped - allocated;
1477
1478   // aStats.page_cache and aStats.bin_unused are left unchanged because PHC
1479   // doesn't have anything corresponding to those.
1480
1481   // The metadata is stored in normal heap allocations, so they're measured by
1482   // mozjemalloc as `allocated`. Move them into `bookkeeping`.
1483   // They're also reported under explicit/heap-overhead/phc/fragmentation in
1484   // about:memory.
1485   size_t bookkeeping = metadata_size();
1486   aStats->allocated -= bookkeeping;
1487   aStats->bookkeeping += bookkeeping;
1488 }
1489
1490 void replace_jemalloc_ptr_info(const void* aPtr, jemalloc_ptr_info_t* aInfo) {
1491   // We need to implement this properly, because various code locations do
1492   // things like checking that allocations are in the expected arena.
1493   PtrKind pk = gConst->PtrKind(aPtr);
1494   if (pk.IsNothing()) {
1495     // Not a page allocation.
1496     return sMallocTable.jemalloc_ptr_info(aPtr, aInfo);
1497   }
1498
1499   if (pk.IsGuardPage()) {
1500     // Treat a guard page as unknown because there's no better alternative.
1501     *aInfo = {TagUnknown, nullptr, 0, 0};
1502     return;
1503   }
1504
1505   // At this point we know we have an allocation page.
1506   uintptr_t index = pk.AllocPageIndex();
1507
1508   MutexAutoLock lock(GMut::sMutex);
1509
1510   gMut->FillJemallocPtrInfo(lock, aPtr, index, aInfo);
1511 #if DEBUG
1512   LOG("JemallocPtrInfo(%p[%zu]) -> {%zu, %p, %zu, %zu}\n", aPtr, index,
1513       size_t(aInfo->tag), aInfo->addr, aInfo->size, aInfo->arenaId);
1514 #else
1515   LOG("JemallocPtrInfo(%p[%zu]) -> {%zu, %p, %zu}\n", aPtr, index,
1516       size_t(aInfo->tag), aInfo->addr, aInfo->size);
1517 #endif
1518 }
1519
1520 arena_id_t replace_moz_create_arena_with_params(arena_params_t* aParams) {
1521   // No need to do anything special here.
1522   return sMallocTable.moz_create_arena_with_params(aParams);
1523 }
1524
1525 void replace_moz_dispose_arena(arena_id_t aArenaId) {
1526   // No need to do anything special here.
1527   return sMallocTable.moz_dispose_arena(aArenaId);
1528 }
1529
1530 void replace_moz_set_max_dirty_page_modifier(int32_t aModifier) {
1531   // No need to do anything special here.
1532   return sMallocTable.moz_set_max_dirty_page_modifier(aModifier);
1533 }
1534
1535 void* replace_moz_arena_malloc(arena_id_t aArenaId, size_t aReqSize) {
1536   return PageMalloc(Some(aArenaId), aReqSize);
1537 }
1538
1539 void* replace_moz_arena_calloc(arena_id_t aArenaId, size_t aNum,
1540                                size_t aReqSize) {
1541   return PageCalloc(Some(aArenaId), aNum, aReqSize);
1542 }
1543
1544 void* replace_moz_arena_realloc(arena_id_t aArenaId, void* aOldPtr,
1545                                 size_t aNewSize) {
1546   return PageRealloc(Some(aArenaId), aOldPtr, aNewSize);
1547 }
1548
1549 void replace_moz_arena_free(arena_id_t aArenaId, void* aPtr) {
1550   return PageFree(Some(aArenaId), aPtr);
1551 }
1552
1553 void* replace_moz_arena_memalign(arena_id_t aArenaId, size_t aAlignment,
1554                                  size_t aReqSize) {
1555   return PageMemalign(Some(aArenaId), aAlignment, aReqSize);
1556 }
1557
1558 class PHCBridge : public ReplaceMallocBridge {
1559   virtual bool IsPHCAllocation(const void* aPtr, phc::AddrInfo* aOut) override {
1560     PtrKind pk = gConst->PtrKind(aPtr);
1561     if (pk.IsNothing()) {
1562       return false;
1563     }
1564
1565     bool isGuardPage = false;
1566     if (pk.IsGuardPage()) {
1567       if ((uintptr_t(aPtr) % kPageSize) < (kPageSize / 2)) {
1568         // The address is in the lower half of a guard page, so it's probably an
1569         // overflow. But first check that it is not on the very first guard
1570         // page, in which case it cannot be an overflow, and we ignore it.
1571         if (gConst->IsInFirstGuardPage(aPtr)) {
1572           return false;
1573         }
1574
1575         // Get the allocation page preceding this guard page.
1576         pk = gConst->PtrKind(static_cast<const uint8_t*>(aPtr) - kPageSize);
1577
1578       } else {
1579         // The address is in the upper half of a guard page, so it's probably an
1580         // underflow. Get the allocation page following this guard page.
1581         pk = gConst->PtrKind(static_cast<const uint8_t*>(aPtr) + kPageSize);
1582       }
1583
1584       // Make a note of the fact that we hit a guard page.
1585       isGuardPage = true;
1586     }
1587
1588     // At this point we know we have an allocation page.
1589     uintptr_t index = pk.AllocPageIndex();
1590
1591     if (aOut) {
1592       MutexAutoLock lock(GMut::sMutex);
1593       gMut->FillAddrInfo(lock, index, aPtr, isGuardPage, *aOut);
1594       LOG("IsPHCAllocation: %zu, %p, %zu, %zu, %zu\n", size_t(aOut->mKind),
1595           aOut->mBaseAddr, aOut->mUsableSize,
1596           aOut->mAllocStack.isSome() ? aOut->mAllocStack->mLength : 0,
1597           aOut->mFreeStack.isSome() ? aOut->mFreeStack->mLength : 0);
1598     }
1599     return true;
1600   }
1601
1602   virtual void DisablePHCOnCurrentThread() override {
1603     GTls::DisableOnCurrentThread();
1604     LOG("DisablePHCOnCurrentThread: %zu\n", 0ul);
1605   }
1606
1607   virtual void ReenablePHCOnCurrentThread() override {
1608     GTls::EnableOnCurrentThread();
1609     LOG("ReenablePHCOnCurrentThread: %zu\n", 0ul);
1610   }
1611
1612   virtual bool IsPHCEnabledOnCurrentThread() override {
1613     bool enabled = !GTls::IsDisabledOnCurrentThread();
1614     LOG("IsPHCEnabledOnCurrentThread: %zu\n", size_t(enabled));
1615     return enabled;
1616   }
1617
1618   virtual void PHCMemoryUsage(
1619       mozilla::phc::MemoryUsage& aMemoryUsage) override {
1620     aMemoryUsage.mMetadataBytes = metadata_size();
1621     if (gMut) {
1622       MutexAutoLock lock(GMut::sMutex);
1623       aMemoryUsage.mFragmentationBytes = gMut->FragmentationBytes();
1624     } else {
1625       aMemoryUsage.mFragmentationBytes = 0;
1626     }
1627   }
1628 };
1629
1630 // WARNING: this function runs *very* early -- before all static initializers
1631 // have run. For this reason, non-scalar globals (gConst, gMut) are allocated
1632 // dynamically (so we can guarantee their construction in this function) rather
1633 // than statically. GAtomic and GTls contain simple static data that doesn't
1634 // involve static initializers so they don't need to be allocated dynamically.
1635 void replace_init(malloc_table_t* aMallocTable, ReplaceMallocBridge** aBridge) {
1636   // Don't run PHC if the page size isn't 4 KiB.
1637   jemalloc_stats_t stats;
1638   aMallocTable->jemalloc_stats_internal(&stats, nullptr);
1639   if (stats.page_size != kPageSize) {
1640     return;
1641   }
1642
1643   sMallocTable = *aMallocTable;
1644
1645   // The choices of which functions to replace are complex enough that we set
1646   // them individually instead of using MALLOC_FUNCS/malloc_decls.h.
1647
1648   aMallocTable->malloc = replace_malloc;
1649   aMallocTable->calloc = replace_calloc;
1650   aMallocTable->realloc = replace_realloc;
1651   aMallocTable->free = replace_free;
1652   aMallocTable->memalign = replace_memalign;
1653
1654   // posix_memalign, aligned_alloc & valloc: unset, which means they fall back
1655   // to replace_memalign.
1656   aMallocTable->malloc_usable_size = replace_malloc_usable_size;
1657   // default malloc_good_size: the default suffices.
1658
1659   aMallocTable->jemalloc_stats_internal = replace_jemalloc_stats;
1660   // jemalloc_purge_freed_pages: the default suffices.
1661   // jemalloc_free_dirty_pages: the default suffices.
1662   // jemalloc_thread_local_arena: the default suffices.
1663   aMallocTable->jemalloc_ptr_info = replace_jemalloc_ptr_info;
1664
1665   aMallocTable->moz_create_arena_with_params =
1666       replace_moz_create_arena_with_params;
1667   aMallocTable->moz_dispose_arena = replace_moz_dispose_arena;
1668   aMallocTable->moz_arena_malloc = replace_moz_arena_malloc;
1669   aMallocTable->moz_arena_calloc = replace_moz_arena_calloc;
1670   aMallocTable->moz_arena_realloc = replace_moz_arena_realloc;
1671   aMallocTable->moz_arena_free = replace_moz_arena_free;
1672   aMallocTable->moz_arena_memalign = replace_moz_arena_memalign;
1673
1674   static PHCBridge bridge;
1675   *aBridge = &bridge;
1676
1677 #ifndef XP_WIN
1678   // Avoid deadlocks when forking by acquiring our state lock prior to forking
1679   // and releasing it after forking. See |LogAlloc|'s |replace_init| for
1680   // in-depth details.
1681   //
1682   // Note: This must run after attempting an allocation so as to give the
1683   // system malloc a chance to insert its own atfork handler.
1684   sMallocTable.malloc(-1);
1685   pthread_atfork(GMut::prefork, GMut::postfork_parent, GMut::postfork_child);
1686 #endif
1687
1688   // gConst and gMut are never freed. They live for the life of the process.
1689   gConst = InfallibleAllocPolicy::new_<GConst>();
1690   GTls::Init();
1691   gMut = InfallibleAllocPolicy::new_<GMut>();
1692   {
1693     MutexAutoLock lock(GMut::sMutex);
1694     Delay firstAllocDelay =
1695         Rnd64ToDelay<kAvgFirstAllocDelay>(gMut->Random64(lock));
1696     GAtomic::Init(firstAllocDelay);
1697   }
1698 }