1 /* -*- Mode: C++; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*-
2 * vim: set ts=8 sts=2 et sw=2 tw=80:
3 * This Source Code Form is subject to the terms of the Mozilla Public
4 * License, v. 2.0. If a copy of the MPL was not distributed with this
5 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
7 ///////////////////////////////////////////////////////////////////////////////
8 // //
9 // Documentation. Code starts about 670 lines down from here. //
10 // //
11 ///////////////////////////////////////////////////////////////////////////////
13 // [SMDOC] An overview of Ion's register allocator
15 // The intent of this documentation is to give maintainers a map with which to
16 // navigate the allocator. As further understanding is obtained, it should be
17 // added to this overview.
19 // Where possible, invariants are stated and are marked "(INVAR)". Many
20 // details are omitted because their workings are currently unknown. In
21 // particular, this overview doesn't explain how Intel-style "modify" (tied)
22 // operands are handled. Facts or invariants that are speculative -- believed
23 // to be true, but not verified at the time of writing -- are marked "(SPEC)".
25 // The various concepts are interdependent, so a single forwards reading of the
26 // following won't make much sense. Many concepts are explained only after
27 // they are mentioned.
29 // Where possible examples are shown. Without those the description is
30 // excessively abstract.
32 // Names of the form ::name mean BacktrackingAllocator::name.
34 // The description falls into two sections:
36 // * Section 1: A tour of the data structures
37 // * Section 2: The core allocation loop, and bundle splitting
39 // The allocator sometimes produces poor allocations, with excessive spilling
 40 // and register-to-register moves (bugs 1752520, 1714280 and 1746596).
41 // Work in bug 1752582 shows we can get better quality allocations from this
42 // framework without having to make any large (conceptual) changes, by having
43 // better splitting heuristics.
45 // At https://bugzilla.mozilla.org/show_bug.cgi?id=1758274#c17
46 // (https://bugzilla.mozilla.org/attachment.cgi?id=9288467) is a document
47 // written at the same time as these comments. It describes some improvements
48 // we could make to our splitting heuristics, particularly in the presence of
49 // loops and calls, and shows why the current implementation sometimes produces
50 // excessive spilling. It builds on the commentary in this SMDOC.
53 // Top level pipeline
54 // ~~~~~~~~~~~~~~~~~~
55 // There are three major phases in allocation. They run sequentially, at a
56 // per-function granularity.
58 // (1) Liveness analysis and bundle formation
59 // (2) Bundle allocation and last-chance allocation
60 // (3) Rewriting the function to create MoveGroups and to "install"
61 // the allocation
63 // The input language (LIR) is in SSA form, and phases (1) and (3) depend on
64 // that SSAness. Without it the allocator wouldn't work.
66 // The top level function is ::go. The phases are divided into functions as
67 // follows:
69 // (1) ::buildLivenessInfo, ::mergeAndQueueRegisters
70 // (2) ::processBundle, ::tryAllocatingRegistersForSpillBundles,
71 // ::pickStackSlots
72 // (3) ::createMoveGroupsFromLiveRangeTransitions, ::installAllocationsInLIR,
73 // ::populateSafepoints, ::annotateMoveGroups
75 // The code in this file is structured as much as possible in the same sequence
76 // as flow through the pipeline. Hence, top level function ::go is right at
77 // the end. Where a function depends on helper function(s), the helpers appear
78 // first.
81 // ========================================================================
82 // ==== ====
83 // ==== Section 1: A tour of the data structures ====
84 // ==== ====
85 // ========================================================================
87 // Here are the key data structures necessary for understanding what follows.
89 // Some basic data structures
90 // ~~~~~~~~~~~~~~~~~~~~~~~~~~
92 // CodePosition
93 // ------------
94 // A CodePosition is an unsigned 32-bit int that indicates an instruction index
95 // in the incoming LIR. Each LIR actually has two code positions, one to
96 // denote the "input" point (where, one might imagine, the operands are read,
97 // at least useAtStart ones) and the "output" point, where operands are
98 // written. Eg:
100 // Block 0 [successor 2] [successor 1]
101 // 2-3 WasmParameter [def v1<g>:r14]
102 // 4-5 WasmCall [use v1:F:r14]
103 // 6-7 WasmLoadTls [def v2<o>] [use v1:R]
104 // 8-9 WasmNullConstant [def v3<o>]
105 // 10-11 Compare [def v4<i>] [use v2:R] [use v3:A]
106 // 12-13 TestIAndBranch [use v4:R]
108 // So for example the WasmLoadTls insn has its input CodePosition as 6 and
109 // output point as 7. Input points are even numbered, output points are odd
110 // numbered. CodePositions 0 and 1 never appear, because LIR instruction IDs
111 // start at 1. Indeed, CodePosition 0 is assumed to be invalid and hence is
112 // used as a marker for "unusual conditions" in various places.
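//
// As a rough sketch (assuming the numbering scheme illustrated above, where
// LIR instruction IDs start at 1; the real encoding may differ in detail):
//
//   inputOf(ins)  ~= CodePosition(2 * ins->id())        // even
//   outputOf(ins) ~= CodePosition(2 * ins->id() + 1)    // odd
//
// so WasmLoadTls above, with ID 3, gets the pair 6-7.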
114 // Phi nodes exist in the instruction stream too. They always appear at the
115 // start of blocks (of course) (SPEC), but their start and end points are
116 // printed for the group as a whole. This is to emphasise that they are really
117 // parallel assignments and that printing them sequentially would misleadingly
118 // imply that they are executed sequentially. Example:
120 // Block 6 [successor 7] [successor 8]
121 // 56-59 Phi [def v19<o>] [use v2:A] [use v5:A] [use v13:A]
122 // 56-59 Phi [def v20<o>] [use v7:A] [use v14:A] [use v12:A]
123 // 60-61 WasmLoadSlot [def v21<o>] [use v1:R]
124 // 62-63 Compare [def v22<i>] [use v20:R] [use v21:A]
125 // 64-65 TestIAndBranch [use v22:R]
127 // See that both Phis are printed with limits 56-59, even though they are
128 // stored in the LIR array like regular LIRs and so have code points 56-57 and
129 // 58-59 in reality.
131 // The process of allocation adds MoveGroup LIRs to the function. Each
132 // incoming LIR has its own private list of MoveGroups (actually, 3 lists; two
133 // for moves that conceptually take place before the instruction, and one for
134 // moves after it). Hence the CodePositions for LIRs (the "62-63", etc, above)
135 // do not change as a result of allocation.
137 // Virtual registers (vregs) in LIR
138 // --------------------------------
139 // The MIR from which the LIR is derived, is standard SSA. That SSAness is
140 // carried through into the LIR (SPEC). In the examples here, LIR SSA names
141 // (virtual registers, a.k.a. vregs) are printed as "v<number>". v0 never
142 // appears and is presumed to be a special value, perhaps "invalid" (SPEC).
144 // The allocator core has a type VirtualRegister, but this is private to the
145 // allocator and not part of the LIR. It carries far more information than
146 // merely the name of the vreg. The allocator creates one VirtualRegister
147 // structure for each vreg in the LIR.
149 // LDefinition and LUse
150 // --------------------
151 // These are part of the incoming LIR. Each LIR instruction defines zero or
152 // more values, and contains one LDefinition for each defined value (SPEC).
153 // Each instruction has zero or more input operands, each of which has its own
154 // LUse (SPEC).
156 // Both LDefinition and LUse hold both a virtual register name and, in general,
157 // a real (physical) register identity. The incoming LIR has the real register
158 // fields unset, except in places where the incoming LIR has fixed register
159 // constraints (SPEC). Phase 3 of allocation will visit all of the
160 // LDefinitions and LUses so as to write into the real register fields the
161 // decisions made by the allocator. For LUses, this is done by overwriting the
162 // complete LUse with a different LAllocation, for example LStackSlot. That's
163 // possible because LUse is a child class of LAllocation.
165 // This action of reading and then later updating LDefinition/LUses is the core
166 // of the allocator's interface to the outside world.
168 // To make visiting of LDefinitions/LUses possible, the allocator doesn't work
169 // with LDefinition and LUse directly. Rather it has pointers to them
170 // (VirtualRegister::def_, UsePosition::use_). Hence Phase 3 can modify the
171 // LIR in-place.
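//
// A hedged sketch of what the Phase 3 rewrite amounts to for a single use
// (member and helper names here are illustrative, not necessarily the real
// ones):
//
//   LAllocation chosen = bundleFor(usePosition)->allocation();
//   *static_cast<LAllocation*>(usePosition->use_) = chosen;  // overwrite LUse
//
// The overwrite is legal precisely because LUse is a subclass of LAllocation.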
173 // (INVARs, all SPEC):
175 // - The collective VirtualRegister::def_ values should be unique, and there
176 // should be a 1:1 mapping between the VirtualRegister::def_ values and the
177 // LDefinitions in the LIR. (So that the LIR LDefinition has exactly one
178 // VirtualRegister::def_ to track it). But only for the valid LDefinitions.
179 // If isBogusTemp() is true, the definition is invalid and doesn't have a
180 // vreg.
182 // - The same for uses: there must be a 1:1 correspondence between the
 183 //   UsePosition::use_ values and the LIR LUses.
185 // - The allocation process must preserve these 1:1 mappings. That implies
186 // (weaker) that the number of VirtualRegisters and of UsePositions must
187 // remain constant through allocation. (Eg: losing them would mean that some
188 // LIR def or use would necessarily not get annotated with its final
189 // allocation decision. Duplicating them would lead to the possibility of
190 // conflicting allocation decisions.)
192 // Other comments regarding LIR
193 // ----------------------------
194 // The incoming LIR is structured into basic blocks and a CFG, as one would
195 // expect. These (insns, block boundaries, block edges etc) are available
196 // through the BacktrackingAllocator object. They are important for Phases 1
197 // and 3 but not for Phase 2.
199 // Phase 3 "rewrites" the input LIR so as to "install" the final allocation.
200 // It has to insert MoveGroup instructions, but that isn't done by pushing them
201 // into the instruction array. Rather, each LIR has 3 auxiliary sets of
202 // MoveGroups (SPEC): two that "happen" conceptually before the LIR, and one
203 // that happens after it. The rewriter inserts MoveGroups into one of these 3
204 // sets, and later code generation phases presumably insert the sets (suitably
205 // translated) into the final machine code (SPEC).
208 // Key data structures: LiveRange, VirtualRegister and LiveBundle
209 // ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
211 // These three have central roles in allocation. Of them, LiveRange is the
212 // most central. VirtualRegister is conceptually important throughout, but
213 // appears less frequently in the allocator code. LiveBundle is important only
214 // in Phase 2 (where it is central) and at the end of Phase 1, but plays no
215 // role in Phase 3.
217 // It's important to understand that LiveRange and VirtualRegister correspond
218 // to concepts visible in the incoming LIR, which is in SSA form. LiveBundle
219 // by comparison is related to neither the structure of LIR nor its SSA
 220 // properties.  Instead, LiveBundle is an essentially administrative structure
221 // used to accelerate allocation and to implement a crude form of
222 // move-coalescing.
224 // VirtualRegisters and LiveRanges are (almost) static throughout the process,
225 // because they reflect aspects of the incoming LIR, which does not change.
226 // LiveBundles by contrast come and go; they are created, but may be split up
227 // into new bundles, and old ones abandoned.
229 // Each LiveRange is a member of two different linked lists, chained through
230 // fields registerLink and bundleLink.
232 // A VirtualRegister (described in detail below) has a list of LiveRanges that
233 // it "owns". These are chained through LiveRange::registerLink.
235 // A LiveBundle (also described below) also has a list LiveRanges that it
236 // "owns", chained through LiveRange::bundleLink.
238 // Hence each LiveRange is "owned" by one VirtualRegister and one LiveBundle.
239 // LiveRanges may have their owning LiveBundle changed as a result of
240 // splitting. By contrast a LiveRange stays with its "owning" VirtualRegister
241 // for ever.
243 // A few LiveRanges have no VirtualRegister. This is used to implement
244 // register spilling for calls. Each physical register that's not preserved
245 // across a call has a small range that covers the call. It is
246 // ::buildLivenessInfo that adds these small ranges.
248 // Iterating over every VirtualRegister in the system is a common operation and
249 // is straightforward because (somewhat redundantly?) the LIRGraph knows the
250 // number of vregs, and more importantly because BacktrackingAllocator::vregs
251 // is a vector of all VirtualRegisters. By contrast iterating over every
252 // LiveBundle in the system is more complex because there is no top-level
253 // registry of them. It is still possible though. See ::dumpLiveRangesByVReg
254 // and ::dumpLiveRangesByBundle for example code.
256 // LiveRange
257 // ---------
258 // Fundamentally, a LiveRange (often written just "range") is a request for
259 // storage of a LIR vreg for some contiguous sequence of LIRs. A LiveRange
260 // generally covers only a fraction of a vreg's overall lifetime, so multiple
261 // LiveRanges are generally needed to cover the whole lifetime.
263 // A LiveRange contains (amongst other things):
 265 // * the vreg it is for, as a VirtualRegister*
 267 // * the range of CodePositions it covers, as a LiveRange::Range
269 // * auxiliary information:
271 // - a boolean that indicates whether this LiveRange defines a value for the
272 // vreg. If so, that definition is regarded as taking place at the first
 273 //   CodePosition of the range.
275 // - a linked list of uses of the vreg within this range. Each use is a pair
276 // of a CodePosition and an LUse*. (INVAR): the uses are maintained in
277 // increasing order of CodePosition. Multiple uses at the same
278 // CodePosition are permitted, since that is necessary to represent an LIR
279 // that uses the same vreg in more than one of its operand slots.
281 // Some important facts about LiveRanges are best illustrated with examples:
283 // v25 75-82 { 75_def:R 78_v25:A 82_v25:A }
285 // This LiveRange is for vreg v25. The value is defined at CodePosition 75,
286 // with the LIR requiring that it be in a register. It is used twice at
287 // positions 78 and 82, both with no constraints (A meaning "any"). The range
288 // runs from position 75 to 82 inclusive. Note however that LiveRange::Range
289 // uses non-inclusive range ends; hence its .to field would be 83, not 82.
291 // v26 84-85 { 85_v26:R }
293 // This LiveRange is for vreg v26. Here, there's only a single use of it at
294 // position 85. Presumably it is defined in some other LiveRange.
296 // v19 74-79 { }
298 // This LiveRange is for vreg v19. There is no def and no uses, so at first
299 // glance this seems redundant. But it isn't: it still expresses a request for
300 // storage for v19 across 74-79, because Phase 1 regards v19 as being live in
301 // this range (meaning: having a value that, if changed in this range, would
302 // cause the program to fail).
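//
// Given the non-inclusive (half-open) representation noted above, the
// membership test is simply (a sketch; exact member names may differ):
//
//   bool LiveRange::covers(CodePosition pos) const {
//     return from_ <= pos && pos < to_;   // "75-82" is stored as [75, 83)
//   }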
304 // Other points:
306 // * (INVAR) Each vreg/VirtualRegister has at least one LiveRange.
308 // * (INVAR) Exactly one LiveRange of a vreg gives a definition for the value.
309 // All other LiveRanges must consist only of uses (including zero uses, for a
 310 //   "flow-through" range as mentioned above).  This requirement follows from
311 // the fact that LIR is in SSA form.
313 // * It follows from this, that the LiveRanges for a VirtualRegister must form
314 // a tree, where the parent-child relationship is "control flows directly
315 // from a parent LiveRange (anywhere in the LiveRange) to a child LiveRange
316 // (start)". The entire tree carries only one value. This is a use of
317 // SSAness in the allocator which is fundamental: without SSA input, this
318 // design would not work.
320 // The root node (LiveRange) in the tree must be one that defines the value,
321 // and all other nodes must only use or be flow-throughs for the value. It's
322 // OK for LiveRanges in the tree to overlap, providing that there is a unique
323 // root node -- otherwise it would be unclear which LiveRange provides the
324 // value.
326 // The function ::createMoveGroupsFromLiveRangeTransitions runs after all
327 // LiveBundles have been allocated. It visits each VirtualRegister tree in
328 // turn. For every parent->child edge in a tree, it creates a MoveGroup that
329 // copies the value from the parent into the child -- this is how the
330 // allocator decides where to put MoveGroups. There are various other
 331 //   details not described here.  (See the sketch after this list of points.)
333 // * It's important to understand that a LiveRange carries no meaning about
334 // control flow beyond that implied by the SSA (hence, dominance)
335 // relationship between a def and its uses. In particular, there's no
336 // implication that execution "flowing into" the start of the range implies
337 // that it will "flow out" of the end. Or that any particular use will or
338 // will not be executed.
340 // * (very SPEC) Indeed, even if a range has a def, there's no implication that
341 // a use later in the range will have been immediately preceded by execution
342 // of the def. It could be that the def is executed, flow jumps somewhere
343 // else, and later jumps back into the middle of the range, where there are
344 // then some uses.
346 // * Uses of a vreg by a phi node are not mentioned in the use list of a
347 // LiveRange. The reasons for this are unknown, but it is speculated that
348 // this is because we don't need to know about phi uses where we use the list
349 // of positions. See comments on VirtualRegister::usedByPhi_.
351 // * Similarly, a definition of a vreg by a phi node is not regarded as being a
 352 //   definition point (why not?), at least from the point of view of
353 // LiveRange::hasDefinition_.
355 // * LiveRanges that nevertheless include a phi-defined value have their first
 356 //   point set to the first position of the block of phis, even if the var
 357 //   isn't defined by that specific phi.  Eg:
359 // Block 6 [successor 7] [successor 8]
360 // 56-59 Phi [def v19<o>] [use v2:A] [use v5:A] [use v13:A]
361 // 56-59 Phi [def v20<o>] [use v7:A] [use v14:A] [use v12:A]
362 // 60-61 WasmLoadSlot [def v21<o>] [use v1:R]
363 // 62-63 Compare [def v22<i>] [use v20:R] [use v21:A]
365 // The relevant live range for v20 is
367 // v20 56-65 { 63_v20:R }
369 // Observe that it starts at 56, not 58.
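//
// For the parent->child edge walk performed by
// ::createMoveGroupsFromLiveRangeTransitions (mentioned in the points above),
// here is a rough sketch -- much simplified; the real routine handles many
// more cases:
//
//   for each VirtualRegister vreg:
//     for each pair (parent, child) of vreg's LiveRanges where control flows
//         directly from somewhere in parent to the start of child:
//       emit a move from parent.bundle()->allocation()
//                     to child.bundle()->allocation()
//       at the CodePosition where child begins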
371 // VirtualRegister
372 // ---------------
373 // Each VirtualRegister is associated with an SSA value created by the LIR.
374 // Fundamentally it is a container to hold all of the LiveRanges that together
375 // indicate where the value must be kept live. This is a linked list beginning
376 // at VirtualRegister::ranges_, and which, as described above, is chained
377 // through LiveRange::registerLink. The set of LiveRanges must logically form
378 // a tree, rooted at the LiveRange which defines the value.
 380 // For administrative convenience, the linked list must contain the LiveRanges
381 // in order of increasing start point.
383 // There are various auxiliary fields, most importantly the LIR node and the
384 // associated LDefinition that define the value.
386 // It is OK, and quite common, for LiveRanges of a VirtualRegister to overlap.
387 // The effect will be that, in an overlapped area, there are two storage
388 // locations holding the value. This is OK -- although wasteful of storage
389 // resources -- because the SSAness means the value must be the same in both
 390 // locations.  Hence there are no questions like "which LiveRange holds the most
391 // up-to-date value?", since it's all just one value anyway.
393 // Note by contrast, it is *not* OK for the LiveRanges of a LiveBundle to
394 // overlap.
396 // LiveBundle
397 // ----------
398 // Similar to VirtualRegister, a LiveBundle is also, fundamentally, a container
399 // for a set of LiveRanges. The set is stored as a linked list, rooted at
400 // LiveBundle::ranges_ and chained through LiveRange::bundleLink.
402 // However, the similarity ends there:
404 // * The LiveRanges in a LiveBundle absolutely must not overlap. They must
405 // indicate disjoint sets of CodePositions, and must be stored in the list in
406 // order of increasing CodePosition. Because of the no-overlap requirement,
407 // these ranges form a total ordering regardless of whether one uses the
408 // LiveRange::Range::from_ or ::to_ fields for comparison.
410 // * The LiveRanges in a LiveBundle can otherwise be entirely arbitrary and
411 // unrelated. They can be from different VirtualRegisters and can have no
412 // particular mutual significance w.r.t. the SSAness or structure of the
413 // input LIR.
415 // LiveBundles are the fundamental unit of allocation. The allocator attempts
416 // to find a single storage location that will work for all LiveRanges in the
417 // bundle. That's why the ranges must not overlap. If no such location can be
418 // found, the allocator may decide to split the bundle into multiple smaller
419 // bundles. Each of those may be allocated independently.
421 // The other really important field is LiveBundle::alloc_, indicating the
422 // chosen storage location.
424 // Here's an example, for a LiveBundle before it has been allocated:
426 // LB2(parent=none v3 8-21 { 16_v3:A } ## v3 24-25 { 25_v3:F:xmm0 })
428 // LB merely indicates "LiveBundle", and the 2 is the debugId_ value (see
 429 // below).  This bundle has two LiveRanges:
431 // v3 8-21 { 16_v3:A }
432 // v3 24-25 { 25_v3:F:xmm0 }
 434 // both of which (coincidentally) are for the same VirtualRegister, v3.  The
435 // second LiveRange has a fixed use in `xmm0`, whilst the first one doesn't
436 // care (A meaning "any location") so the allocator *could* choose `xmm0` for
437 // the bundle as a whole.
439 // One might ask: why bother with LiveBundle at all? After all, it would be
440 // possible to get correct allocations by allocating each LiveRange
441 // individually, then leaving ::createMoveGroupsFromLiveRangeTransitions to add
442 // MoveGroups to join up LiveRanges that form each SSA value tree (that is,
443 // LiveRanges belonging to each VirtualRegister).
445 // There are two reasons:
447 // (1) By putting multiple LiveRanges into each LiveBundle, we can end up with
448 // many fewer LiveBundles than LiveRanges. Since the cost of allocating a
449 // LiveBundle is substantially less than the cost of allocating each of its
450 // LiveRanges individually, the allocator will run faster.
452 // (2) It provides a crude form of move-coalescing. There are situations where
453 // it would be beneficial, although not mandatory, to have two LiveRanges
454 // assigned to the same storage unit. Most importantly: (a) LiveRanges
455 // that form all of the inputs, and the output, of a phi node. (b)
456 // LiveRanges for the output and first-operand values in the case where we
 457 //     are targeting Intel-style instructions.
459 // In such cases, if the bundle can be allocated as-is, then no extra moves
460 // are necessary. If not (and the bundle is split), then
461 // ::createMoveGroupsFromLiveRangeTransitions will later fix things up by
462 // inserting MoveGroups in the right places.
464 // Merging of LiveRanges into LiveBundles is done in Phase 1, by
465 // ::mergeAndQueueRegisters, after liveness analysis (which generates only
466 // LiveRanges).
468 // For the bundle mentioned above, viz
470 // LB2(parent=none v3 8-21 { 16_v3:A } ## v3 24-25 { 25_v3:F:xmm0 })
472 // the allocator did not in the end choose to allocate it to `xmm0`. Instead
473 // it was split into two bundles, LB6 (a "spill parent", or root node in the
474 // trees described above), and LB9, a leaf node, that points to its parent LB6:
476 // LB6(parent=none v3 8-21 %xmm1.s { 16_v3:A } ## v3 24-25 %xmm1.s { })
 477 //   LB9(parent=LB6 v3 24-25 %xmm0.s { 25_v3:F:xmm0 })
479 // Note that both bundles now have an allocation, and that is printed,
480 // redundantly, for each LiveRange in the bundle -- hence the repeated
481 // `%xmm1.s` in the lines above. Since all LiveRanges in a LiveBundle must be
482 // allocated to the same storage location, we never expect to see output like
483 // this
485 // LB6(parent=none v3 8-21 %xmm1.s { 16_v3:A } ## v3 24-25 %xmm2.s { })
487 // and that is in any case impossible, since a LiveRange doesn't have an
488 // LAllocation field. Instead it has a pointer to its LiveBundle, and the
489 // LAllocation lives in the LiveBundle.
491 // For the resulting allocation (LB6 and LB9), all the LiveRanges are use-only
492 // or flow-through. There are no definitions. But they are all for the same
493 // VirtualReg, v3, so they all have the same value. An important question is
494 // where they "get their value from". The answer is that
495 // ::createMoveGroupsFromLiveRangeTransitions will have to insert suitable
496 // MoveGroups so that each LiveRange for v3 can "acquire" the value from a
497 // previously-executed LiveRange, except for the range that defines it. The
498 // defining LiveRange is not visible here; either it is in some other
499 // LiveBundle, not shown, or (more likely) the value is defined by a phi-node,
500 // in which case, as mentioned previously, it is not shown as having an
501 // explicit definition in any LiveRange.
503 // LiveBundles also have a `SpillSet* spill_` field (see below) and a
504 // `LiveBundle* spillParent_`. The latter is used to ensure that all bundles
505 // originating from an "original" bundle share the same spill slot. The
 506 // `spillParent_` pointers can be thought of as creating a 1-level tree, where
507 // each node points at its parent. Since the tree can be only 1-level, the
508 // following invariant (INVAR) must be maintained:
510 // * if a LiveBundle has a non-null spillParent_ field, then it is a leaf node,
511 // and no other LiveBundle can point at this one.
513 // * else (it has a null spillParent_ field) it is a root node, and so other
514 // LiveBundles may point at it.
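//
// Expressed as a (hypothetical, not actually present) assertion, the 1-level
// property is:
//
//   if (bundle->spillParent_ != nullptr) {
//     MOZ_ASSERT(bundle->spillParent_->spillParent_ == nullptr);
//   }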
516 // When compiled with JS_JITSPEW, LiveBundle has a 32-bit `debugId_` field.
517 // This is used only for debug printing, and makes it easier to see
518 // parent-child relationships induced by the `spillParent_` pointers.
520 // The "life cycle" of LiveBundles is described in Section 2 below.
523 // Secondary data structures: SpillSet, Requirement
524 // ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
526 // SpillSet
527 // --------
528 // A SpillSet is a container for a set of LiveBundles that have been spilled,
529 // all of which are assigned the same spill slot. The set is represented as a
 530 // vector of pointers to LiveBundles.  SpillSet also contains the identity of
531 // spill slot (its LAllocation).
533 // A LiveBundle, if it is to be spilled, has a pointer to the relevant
534 // SpillSet, and the SpillSet in turn has a pointer back to the LiveBundle in
535 // its vector thereof. So LiveBundles (that are to be spilled) and SpillSets
536 // point at each other.
538 // (SPEC) LiveBundles that are not to be spilled (or for which the decision has
 539 // yet to be made) have their SpillSet pointers set to null.  (/SPEC)
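//
// Schematically (a sketch only; field names are illustrative):
//
//   LiveBundle::spill_ ----------------> SpillSet
//   SpillSet::list_[i] ----------------> LiveBundle   (back-pointers)
//
// so assigning the spill slot once, on the SpillSet, propagates it to every
// bundle in the set -- see SpillSet::setAllocation further down in this file.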
541 // Requirement
542 // -----------
 543 // A Requirement is used transiently during the main allocation loop.  It
544 // summarises the set of constraints on storage location (must be any register,
545 // must be this specific register, must be stack, etc) for a LiveBundle. This
546 // is so that the main allocation loop knows what kind of storage location it
547 // must choose in order to satisfy all of the defs and uses within the bundle.
549 // What Requirement provides is (a) a partially ordered set of locations, and
550 // (b) a constraint-merging method `merge`.
552 // Requirement needs a rewrite (and, in fact, that has already happened in
553 // un-landed code in bug 1758274) for the following reasons:
555 // * it's potentially buggy (bug 1761654), although that doesn't currently
556 // affect us, for reasons which are unclear.
558 // * the partially ordered set has a top point, meaning "no constraint", but it
559 // doesn't have a corresponding bottom point, meaning "impossible
560 // constraints". (So it's a partially ordered set, but not a lattice). This
561 // leads to awkward coding in some places, which would be simplified if there
562 // were an explicit way to indicate "impossible constraint".
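//
// As a rough sketch of the intended semantics of `merge` (ignoring the
// missing-bottom-point problem just described; the constraint kinds shown
// here are illustrative):
//
//   merge(ANY,      X       ) = X
//   merge(REGISTER, REGISTER) = REGISTER
//   merge(FIXED r,  FIXED r ) = FIXED r
//   merge(FIXED r,  FIXED s ) = failure, if r != s  (the "impossible" case)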
565 // Some ASCII art
566 // ~~~~~~~~~~~~~~
568 // Here's some not-very-good ASCII art that tries to summarise the data
569 // structures that persist for the entire allocation of a function:
571 // BacktrackingAllocator
572 // |
573 // (vregs)
574 // |
575 // v
576 // |
577 // VirtualRegister -->--(ins)--> LNode
578 // | | `->--(def)--> LDefinition
579 // v ^
580 // | |
581 // (ranges) |
582 // | (vreg)
583 // `--v->--. | ,-->--v-->-------------->--v-->--. ,--NULL
584 // \ | / \ /
585 // LiveRange LiveRange LiveRange
586 // / | \ / \.
587 // ,--b->--' / `-->--b-->--' `--NULL
588 // | (bundle)
589 // ^ /
590 // | v
591 // (ranges) /
592 // | /
593 // LiveBundle --s-->- LiveBundle
594 // | \ / |
595 // | \ / |
596 // (spill) ^ ^ (spill)
597 // | \ / |
598 // v \ / ^
599 // | (list) |
600 // \ | /
601 // `--->---> SpillSet <--'
603 // --b-- LiveRange::bundleLink: links in the list of LiveRanges that belong to
604 // a LiveBundle
606 // --v-- LiveRange::registerLink: links in the list of LiveRanges that belong
607 // to a VirtualRegister
609 // --s-- LiveBundle::spillParent: a possible link to my "spill parent bundle"
612 // * LiveRange is in the center. Each LiveRange is a member of two different
613 // linked lists, the --b-- list and the --v-- list.
615 // * VirtualRegister has a pointer `ranges` that points to the start of its
616 // --v-- list of LiveRanges.
618 // * LiveBundle has a pointer `ranges` that points to the start of its --b--
619 // list of LiveRanges.
621 // * LiveRange points back at both its owning VirtualRegister (`vreg`) and its
622 // owning LiveBundle (`bundle`).
624 // * LiveBundle has a pointer --s-- `spillParent`, which may be null, to its
625 // conceptual "spill parent bundle", as discussed in detail above.
627 // * LiveBundle has a pointer `spill` to its SpillSet.
629 // * SpillSet has a vector `list` of pointers back to the LiveBundles that
630 // point at it.
632 // * VirtualRegister has pointers `ins` to the LNode that defines the value and
633 // `def` to the LDefinition within that LNode.
635 // * BacktrackingAllocator has a vector `vregs` of pointers to all the
636 // VirtualRegisters for the function. There is no equivalent top-level table
637 // of all the LiveBundles for the function.
639 // Note that none of these pointers are "owning" in the C++-storage-management
 640 // sense.  Rather, everything is stored in a single arena which is freed when
641 // compilation of the function is complete. For this reason,
642 // BacktrackingAllocator.{h,cpp} is almost completely free of the usual C++
643 // storage-management artefacts one would normally expect to see.
646 // ========================================================================
647 // ==== ====
648 // ==== Section 2: The core allocation loop, and bundle splitting ====
649 // ==== ====
650 // ========================================================================
652 // Phase 1 of the allocator (described at the start of this SMDOC) computes
653 // live ranges, merges them into bundles, and places the bundles in a priority
654 // queue ::allocationQueue, ordered by what ::computePriority computes.
657 // The allocation loops
658 // ~~~~~~~~~~~~~~~~~~~~
659 // The core of the allocation machinery consists of two loops followed by a
660 // call to ::pickStackSlots. The latter is uninteresting. The two loops live
661 // in ::go and are documented in detail there.
664 // Bundle splitting
665 // ~~~~~~~~~~~~~~~~
666 // If the first of the two abovementioned loops cannot find a register for a
667 // bundle, either directly or as a result of evicting conflicting bundles, then
668 // it will have to either split or spill the bundle. The entry point to the
669 // split/spill subsystem is ::chooseBundleSplit. See comments there.
671 ///////////////////////////////////////////////////////////////////////////////
672 // //
673 // End of documentation //
674 // //
675 ///////////////////////////////////////////////////////////////////////////////
677 #include "jit/BacktrackingAllocator.h"
679 #include <algorithm>
681 #include "jit/BitSet.h"
682 #include "jit/CompileInfo.h"
683 #include "js/Printf.h"
685 using namespace js;
686 using namespace js::jit;
688 using mozilla::DebugOnly;
690 // This is a big, complex file. Code is grouped into various sections, each
691 // preceded by a box comment. Sections not marked as "Misc helpers" are
692 // pretty much the top level flow, and are presented roughly in the same order
693 // in which the allocation pipeline operates. BacktrackingAllocator::go,
694 // right at the end of the file, is a good starting point.
696 ///////////////////////////////////////////////////////////////////////////////
697 // //
698 // Misc helpers: linked-list management //
699 // //
700 ///////////////////////////////////////////////////////////////////////////////
702 static inline bool SortBefore(UsePosition* a, UsePosition* b) {
703 return a->pos <= b->pos;
706 static inline bool SortBefore(LiveRange::BundleLink* a,
707 LiveRange::BundleLink* b) {
708 LiveRange* rangea = LiveRange::get(a);
709 LiveRange* rangeb = LiveRange::get(b);
710 MOZ_ASSERT(!rangea->intersects(rangeb));
711 return rangea->from() < rangeb->from();
714 static inline bool SortBefore(LiveRange::RegisterLink* a,
715 LiveRange::RegisterLink* b) {
716 return LiveRange::get(a)->from() <= LiveRange::get(b)->from();
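// Note on the three SortBefore overloads above: the UsePosition and
// RegisterLink orderings are non-strict (<=), accommodating equal keys -- for
// example several uses at the same CodePosition -- whereas the BundleLink
// ordering can be strict (<) because ranges within a single bundle never
// overlap (as the assertion above checks) and so never share a start position.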
719 template <typename T>
720 static inline void InsertSortedList(InlineForwardList<T>& list, T* value) {
721 if (list.empty()) {
722 list.pushFront(value);
723 return;
726 if (SortBefore(list.back(), value)) {
727 list.pushBack(value);
728 return;
731 T* prev = nullptr;
732 for (InlineForwardListIterator<T> iter = list.begin(); iter; iter++) {
733 if (SortBefore(value, *iter)) {
734 break;
736 prev = *iter;
739 if (prev) {
740 list.insertAfter(prev, value);
741 } else {
742 list.pushFront(value);
746 ///////////////////////////////////////////////////////////////////////////////
747 // //
748 // Misc helpers: methods for class SpillSet //
749 // //
750 ///////////////////////////////////////////////////////////////////////////////
752 void SpillSet::setAllocation(LAllocation alloc) {
753 for (size_t i = 0; i < numSpilledBundles(); i++) {
754 spilledBundle(i)->setAllocation(alloc);
758 ///////////////////////////////////////////////////////////////////////////////
759 // //
760 // Misc helpers: methods for class LiveRange //
761 // //
762 ///////////////////////////////////////////////////////////////////////////////
764 static size_t SpillWeightFromUsePolicy(LUse::Policy policy) {
765 switch (policy) {
766 case LUse::ANY:
767 return 1000;
769 case LUse::REGISTER:
770 case LUse::FIXED:
771 return 2000;
773 default:
774 return 0;
778 inline void LiveRange::noteAddedUse(UsePosition* use) {
779 LUse::Policy policy = use->usePolicy();
780 usesSpillWeight_ += SpillWeightFromUsePolicy(policy);
781 if (policy == LUse::FIXED) {
782 ++numFixedUses_;
786 inline void LiveRange::noteRemovedUse(UsePosition* use) {
787 LUse::Policy policy = use->usePolicy();
788 usesSpillWeight_ -= SpillWeightFromUsePolicy(policy);
789 if (policy == LUse::FIXED) {
790 --numFixedUses_;
792 MOZ_ASSERT_IF(!hasUses(), !usesSpillWeight_ && !numFixedUses_);
795 void LiveRange::addUse(UsePosition* use) {
796 MOZ_ASSERT(covers(use->pos));
797 InsertSortedList(uses_, use);
798 noteAddedUse(use);
801 UsePosition* LiveRange::popUse() {
802 UsePosition* ret = uses_.popFront();
803 noteRemovedUse(ret);
804 return ret;
807 void LiveRange::tryToMoveDefAndUsesInto(LiveRange* other) {
808 MOZ_ASSERT(&other->vreg() == &vreg());
809 MOZ_ASSERT(this != other);
811 // Move over all uses which fit in |other|'s boundaries.
812 for (UsePositionIterator iter = usesBegin(); iter;) {
813 UsePosition* use = *iter;
814 if (other->covers(use->pos)) {
815 uses_.removeAndIncrement(iter);
816 noteRemovedUse(use);
817 other->addUse(use);
818 } else {
819 iter++;
823 // Distribute the definition to |other| as well, if possible.
824 if (hasDefinition() && from() == other->from()) {
825 other->setHasDefinition();
829 bool LiveRange::contains(LiveRange* other) const {
830 return from() <= other->from() && to() >= other->to();
833 void LiveRange::intersect(LiveRange* other, Range* pre, Range* inside,
834 Range* post) const {
835 MOZ_ASSERT(pre->empty() && inside->empty() && post->empty());
837 CodePosition innerFrom = from();
838 if (from() < other->from()) {
839 if (to() < other->from()) {
840 *pre = range_;
841 return;
843 *pre = Range(from(), other->from());
844 innerFrom = other->from();
847 CodePosition innerTo = to();
848 if (to() > other->to()) {
849 if (from() >= other->to()) {
850 *post = range_;
851 return;
853 *post = Range(other->to(), to());
854 innerTo = other->to();
857 if (innerFrom != innerTo) {
858 *inside = Range(innerFrom, innerTo);
862 bool LiveRange::intersects(LiveRange* other) const {
863 Range pre, inside, post;
864 intersect(other, &pre, &inside, &post);
865 return !inside.empty();
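// Example (illustrative): intersecting the range [10,30) with [20,40) gives
//
//   pre    = [10,20)   (the part of |this| before |other|)
//   inside = [20,30)   (the overlap)
//   post   = empty     (|this| does not extend past |other|)
//
// and intersects() simply reports whether |inside| is non-empty.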
868 ///////////////////////////////////////////////////////////////////////////////
869 // //
870 // Misc helpers: methods for class LiveBundle //
871 // //
872 ///////////////////////////////////////////////////////////////////////////////
874 #ifdef DEBUG
875 size_t LiveBundle::numRanges() const {
876 size_t count = 0;
877 for (LiveRange::BundleLinkIterator iter = rangesBegin(); iter; iter++) {
878 count++;
880 return count;
882 #endif
884 LiveRange* LiveBundle::rangeFor(CodePosition pos) const {
885 for (LiveRange::BundleLinkIterator iter = rangesBegin(); iter; iter++) {
886 LiveRange* range = LiveRange::get(*iter);
887 if (range->covers(pos)) {
888 return range;
891 return nullptr;
894 void LiveBundle::addRange(LiveRange* range) {
895 MOZ_ASSERT(!range->bundle());
896 range->setBundle(this);
897 InsertSortedList(ranges_, &range->bundleLink);
900 bool LiveBundle::addRange(TempAllocator& alloc, VirtualRegister* vreg,
901 CodePosition from, CodePosition to) {
902 LiveRange* range = LiveRange::FallibleNew(alloc, vreg, from, to);
903 if (!range) {
904 return false;
906 addRange(range);
907 return true;
910 bool LiveBundle::addRangeAndDistributeUses(TempAllocator& alloc,
911 LiveRange* oldRange,
912 CodePosition from, CodePosition to) {
913 LiveRange* range = LiveRange::FallibleNew(alloc, &oldRange->vreg(), from, to);
914 if (!range) {
915 return false;
917 addRange(range);
918 oldRange->tryToMoveDefAndUsesInto(range);
919 return true;
922 LiveRange* LiveBundle::popFirstRange() {
923 LiveRange::BundleLinkIterator iter = rangesBegin();
924 if (!iter) {
925 return nullptr;
928 LiveRange* range = LiveRange::get(*iter);
929 ranges_.removeAt(iter);
931 range->setBundle(nullptr);
932 return range;
935 void LiveBundle::removeRange(LiveRange* range) {
936 for (LiveRange::BundleLinkIterator iter = rangesBegin(); iter; iter++) {
937 LiveRange* existing = LiveRange::get(*iter);
938 if (existing == range) {
939 ranges_.removeAt(iter);
940 return;
943 MOZ_CRASH();
946 ///////////////////////////////////////////////////////////////////////////////
947 // //
948 // Misc helpers: methods for class VirtualRegister //
949 // //
950 ///////////////////////////////////////////////////////////////////////////////
952 bool VirtualRegister::addInitialRange(TempAllocator& alloc, CodePosition from,
953 CodePosition to, size_t* numRanges) {
954 MOZ_ASSERT(from < to);
956 // Mark [from,to) as a live range for this register during the initial
957 // liveness analysis, coalescing with any existing overlapping ranges.
959 // On some pathological graphs there might be a huge number of different
 960   // live ranges.  Allow non-overlapping live ranges to be merged if the
961 // number of ranges exceeds the cap below.
962 static const size_t CoalesceLimit = 100000;
964 LiveRange* prev = nullptr;
965 LiveRange* merged = nullptr;
966 for (LiveRange::RegisterLinkIterator iter(rangesBegin()); iter;) {
967 LiveRange* existing = LiveRange::get(*iter);
969 if (from > existing->to() && *numRanges < CoalesceLimit) {
970 // The new range should go after this one.
971 prev = existing;
972 iter++;
973 continue;
976 if (to.next() < existing->from()) {
977 // The new range should go before this one.
978 break;
981 if (!merged) {
982 // This is the first old range we've found that overlaps the new
983 // range. Extend this one to cover its union with the new range.
984 merged = existing;
986 if (from < existing->from()) {
987 existing->setFrom(from);
989 if (to > existing->to()) {
990 existing->setTo(to);
993 // Continue searching to see if any other old ranges can be
994 // coalesced with the new merged range.
995 iter++;
996 continue;
999 // Coalesce this range into the previous range we merged into.
1000 MOZ_ASSERT(existing->from() >= merged->from());
1001 if (existing->to() > merged->to()) {
1002 merged->setTo(existing->to());
1005 MOZ_ASSERT(!existing->hasDefinition());
1006 existing->tryToMoveDefAndUsesInto(merged);
1007 MOZ_ASSERT(!existing->hasUses());
1009 ranges_.removeAndIncrement(iter);
1012 if (!merged) {
1013 // The new range does not overlap any existing range for the vreg.
1014 LiveRange* range = LiveRange::FallibleNew(alloc, this, from, to);
1015 if (!range) {
1016 return false;
1019 if (prev) {
1020 ranges_.insertAfter(&prev->registerLink, &range->registerLink);
1021 } else {
1022 ranges_.pushFront(&range->registerLink);
1025 (*numRanges)++;
1028 return true;
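// Example (illustrative): if this vreg already has the ranges [4,8) and
// [12,20), then addInitialRange(alloc, 6, 14, &n) first extends [4,8) to
// [4,14) and then coalesces [12,20) into it, leaving the single range [4,20)
// (any uses of the removed range are moved into the merged one).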
1031 void VirtualRegister::addInitialUse(UsePosition* use) {
1032 LiveRange::get(*rangesBegin())->addUse(use);
1035 void VirtualRegister::setInitialDefinition(CodePosition from) {
1036 LiveRange* first = LiveRange::get(*rangesBegin());
1037 MOZ_ASSERT(from >= first->from());
1038 first->setFrom(from);
1039 first->setHasDefinition();
1042 LiveRange* VirtualRegister::rangeFor(CodePosition pos,
1043 bool preferRegister /* = false */) const {
1044 LiveRange* found = nullptr;
1045 for (LiveRange::RegisterLinkIterator iter = rangesBegin(); iter; iter++) {
1046 LiveRange* range = LiveRange::get(*iter);
1047 if (range->covers(pos)) {
1048 if (!preferRegister || range->bundle()->allocation().isRegister()) {
1049 return range;
1051 if (!found) {
1052 found = range;
1056 return found;
1059 void VirtualRegister::addRange(LiveRange* range) {
1060 InsertSortedList(ranges_, &range->registerLink);
1063 void VirtualRegister::removeRange(LiveRange* range) {
1064 for (LiveRange::RegisterLinkIterator iter = rangesBegin(); iter; iter++) {
1065 LiveRange* existing = LiveRange::get(*iter);
1066 if (existing == range) {
1067 ranges_.removeAt(iter);
1068 return;
1071 MOZ_CRASH();
1074 ///////////////////////////////////////////////////////////////////////////////
1075 // //
1076 // Misc helpers: queries about uses //
1077 // //
1078 ///////////////////////////////////////////////////////////////////////////////
1080 static inline LDefinition* FindReusingDefOrTemp(LNode* node,
1081 LAllocation* alloc) {
1082 if (node->isPhi()) {
1083 MOZ_ASSERT(node->toPhi()->numDefs() == 1);
1084 MOZ_ASSERT(node->toPhi()->getDef(0)->policy() !=
1085 LDefinition::MUST_REUSE_INPUT);
1086 return nullptr;
1089 LInstruction* ins = node->toInstruction();
1091 for (size_t i = 0; i < ins->numDefs(); i++) {
1092 LDefinition* def = ins->getDef(i);
1093 if (def->policy() == LDefinition::MUST_REUSE_INPUT &&
1094 ins->getOperand(def->getReusedInput()) == alloc) {
1095 return def;
1098 for (size_t i = 0; i < ins->numTemps(); i++) {
1099 LDefinition* def = ins->getTemp(i);
1100 if (def->policy() == LDefinition::MUST_REUSE_INPUT &&
1101 ins->getOperand(def->getReusedInput()) == alloc) {
1102 return def;
1105 return nullptr;
1108 bool BacktrackingAllocator::isReusedInput(LUse* use, LNode* ins,
1109 bool considerCopy) {
1110 if (LDefinition* def = FindReusingDefOrTemp(ins, use)) {
1111 return considerCopy || !vregs[def->virtualRegister()].mustCopyInput();
1113 return false;
1116 bool BacktrackingAllocator::isRegisterUse(UsePosition* use, LNode* ins,
1117 bool considerCopy) {
1118 switch (use->usePolicy()) {
1119 case LUse::ANY:
1120 return isReusedInput(use->use(), ins, considerCopy);
1122 case LUse::REGISTER:
1123 case LUse::FIXED:
1124 return true;
1126 default:
1127 return false;
1131 bool BacktrackingAllocator::isRegisterDefinition(LiveRange* range) {
1132 if (!range->hasDefinition()) {
1133 return false;
1136 VirtualRegister& reg = range->vreg();
1137 if (reg.ins()->isPhi()) {
1138 return false;
1141 if (reg.def()->policy() == LDefinition::FIXED &&
1142 !reg.def()->output()->isRegister()) {
1143 return false;
1146 return true;
1149 ///////////////////////////////////////////////////////////////////////////////
1150 // //
1151 // Misc helpers: atomic LIR groups //
1152 // //
1153 ///////////////////////////////////////////////////////////////////////////////
1155 // The following groupings contain implicit (invisible to ::buildLivenessInfo)
1156 // value flows, and therefore no split points may be requested inside them.
1157 // This is an otherwise unstated part of the contract between LIR generation
1158 // and the allocator.
1160 // (1) (any insn) ; OsiPoint
1162 // [Further group definitions and supporting code to come, pending rework
1163 // of the wasm atomic-group situation.]
1165 CodePosition RegisterAllocator::minimalDefEnd(LNode* ins) const {
1166 // Compute the shortest interval that captures vregs defined by ins.
1167 // Watch for instructions that are followed by an OSI point.
1168 // If moves are introduced between the instruction and the OSI point then
1169 // safepoint information for the instruction may be incorrect.
1170 while (true) {
1171 LNode* next = insData[ins->id() + 1];
1172 if (!next->isOsiPoint()) {
1173 break;
1175 ins = next;
1178 return outputOf(ins);
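// Example (illustrative): if the instruction at positions 12-13 is followed
// immediately by an OsiPoint at 14-15, minimalDefEnd returns 15, so a
// "minimal" def range ends after the OsiPoint rather than at 13, keeping the
// instruction's safepoint information consistent.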
1181 ///////////////////////////////////////////////////////////////////////////////
1182 // //
1183 // Misc helpers: computation of bundle priorities and spill weights //
1184 // //
1185 ///////////////////////////////////////////////////////////////////////////////
1187 size_t BacktrackingAllocator::computePriority(LiveBundle* bundle) {
1188 // The priority of a bundle is its total length, so that longer lived
1189 // bundles will be processed before shorter ones (even if the longer ones
1190 // have a low spill weight). See processBundle().
1191 size_t lifetimeTotal = 0;
1193 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
1194 iter++) {
1195 LiveRange* range = LiveRange::get(*iter);
1196 lifetimeTotal += range->to() - range->from();
1199 return lifetimeTotal;
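// Example (illustrative): a bundle whose ranges cover [8,22) and [24,26) has
// priority (22 - 8) + (26 - 24) = 16, so it is dequeued before a bundle that
// covers, say, only 4 positions in total.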
1202 bool BacktrackingAllocator::minimalDef(LiveRange* range, LNode* ins) {
1203 // Whether this is a minimal range capturing a definition at ins.
1204 return (range->to() <= minimalDefEnd(ins).next()) &&
1205 ((!ins->isPhi() && range->from() == inputOf(ins)) ||
1206 range->from() == outputOf(ins));
1209 bool BacktrackingAllocator::minimalUse(LiveRange* range, UsePosition* use) {
1210 // Whether this is a minimal range capturing |use|.
1211 LNode* ins = insData[use->pos];
1212 return (range->from() == inputOf(ins)) &&
1213 (range->to() ==
1214 (use->use()->usedAtStart() ? outputOf(ins) : outputOf(ins).next()));
1217 bool BacktrackingAllocator::minimalBundle(LiveBundle* bundle, bool* pfixed) {
1218 LiveRange::BundleLinkIterator iter = bundle->rangesBegin();
1219 LiveRange* range = LiveRange::get(*iter);
1221 if (!range->hasVreg()) {
1222 *pfixed = true;
1223 return true;
1226 // If a bundle contains multiple ranges, splitAtAllRegisterUses will split
1227 // each range into a separate bundle.
1228 if (++iter) {
1229 return false;
1232 if (range->hasDefinition()) {
1233 VirtualRegister& reg = range->vreg();
1234 if (pfixed) {
1235 *pfixed = reg.def()->policy() == LDefinition::FIXED &&
1236 reg.def()->output()->isRegister();
1238 return minimalDef(range, reg.ins());
1241 bool fixed = false, minimal = false, multiple = false;
1243 for (UsePositionIterator iter = range->usesBegin(); iter; iter++) {
1244 if (iter != range->usesBegin()) {
1245 multiple = true;
1248 switch (iter->usePolicy()) {
1249 case LUse::FIXED:
1250 if (fixed) {
1251 return false;
1253 fixed = true;
1254 if (minimalUse(range, *iter)) {
1255 minimal = true;
1257 break;
1259 case LUse::REGISTER:
1260 if (minimalUse(range, *iter)) {
1261 minimal = true;
1263 break;
1265 default:
1266 break;
1270 // If a range contains a fixed use and at least one other use,
1271 // splitAtAllRegisterUses will split each use into a different bundle.
1272 if (multiple && fixed) {
1273 minimal = false;
1276 if (pfixed) {
1277 *pfixed = fixed;
1279 return minimal;
1282 size_t BacktrackingAllocator::computeSpillWeight(LiveBundle* bundle) {
1283 // Minimal bundles have an extremely high spill weight, to ensure they
1284 // can evict any other bundles and be allocated to a register.
1285 bool fixed;
1286 if (minimalBundle(bundle, &fixed)) {
1287 return fixed ? 2000000 : 1000000;
1290 size_t usesTotal = 0;
1291 fixed = false;
1293 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
1294 iter++) {
1295 LiveRange* range = LiveRange::get(*iter);
1297 if (range->hasDefinition()) {
1298 VirtualRegister& reg = range->vreg();
1299 if (reg.def()->policy() == LDefinition::FIXED &&
1300 reg.def()->output()->isRegister()) {
1301 usesTotal += 2000;
1302 fixed = true;
1303 } else if (!reg.ins()->isPhi()) {
1304 usesTotal += 2000;
1308 usesTotal += range->usesSpillWeight();
1309 if (range->numFixedUses() > 0) {
1310 fixed = true;
1314 // Bundles with fixed uses are given a higher spill weight, since they must
1315 // be allocated to a specific register.
1316 if (testbed && fixed) {
1317 usesTotal *= 2;
1320 // Compute spill weight as a use density, lowering the weight for long
1321 // lived bundles with relatively few uses.
1322 size_t lifetimeTotal = computePriority(bundle);
1323 return lifetimeTotal ? usesTotal / lifetimeTotal : 0;
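// Example (illustrative): a non-minimal bundle with usesTotal = 4000 spread
// over a lifetime of 40 positions gets spill weight 100, while one with the
// same uses packed into 4 positions gets 1000 -- so when the two conflict,
// the short, dense bundle is the one more likely to keep a register.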
1326 size_t BacktrackingAllocator::maximumSpillWeight(
1327 const LiveBundleVector& bundles) {
1328 size_t maxWeight = 0;
1329 for (size_t i = 0; i < bundles.length(); i++) {
1330 maxWeight = std::max(maxWeight, computeSpillWeight(bundles[i]));
1332 return maxWeight;
1335 ///////////////////////////////////////////////////////////////////////////////
1336 // //
1337 // Initialization of the allocator //
1338 // //
1339 ///////////////////////////////////////////////////////////////////////////////
1341 // This function pre-allocates and initializes as much global state as possible
1342 // to avoid littering the algorithms with memory management cruft.
1343 bool BacktrackingAllocator::init() {
1344 if (!RegisterAllocator::init()) {
1345 return false;
1348 liveIn = mir->allocate<BitSet>(graph.numBlockIds());
1349 if (!liveIn) {
1350 return false;
1353 size_t numVregs = graph.numVirtualRegisters();
1354 if (!vregs.init(mir->alloc(), numVregs)) {
1355 return false;
1357 for (uint32_t i = 0; i < numVregs; i++) {
1358 new (&vregs[i]) VirtualRegister();
1361 // Build virtual register objects.
1362 for (size_t i = 0; i < graph.numBlocks(); i++) {
1363 if (mir->shouldCancel("Create data structures (main loop)")) {
1364 return false;
1367 LBlock* block = graph.getBlock(i);
1368 for (LInstructionIterator ins = block->begin(); ins != block->end();
1369 ins++) {
1370 if (mir->shouldCancel("Create data structures (inner loop 1)")) {
1371 return false;
1374 for (size_t j = 0; j < ins->numDefs(); j++) {
1375 LDefinition* def = ins->getDef(j);
1376 if (def->isBogusTemp()) {
1377 continue;
1379 vreg(def).init(*ins, def, /* isTemp = */ false);
1382 for (size_t j = 0; j < ins->numTemps(); j++) {
1383 LDefinition* def = ins->getTemp(j);
1384 if (def->isBogusTemp()) {
1385 continue;
1387 vreg(def).init(*ins, def, /* isTemp = */ true);
1390 for (size_t j = 0; j < block->numPhis(); j++) {
1391 LPhi* phi = block->getPhi(j);
1392 LDefinition* def = phi->getDef(0);
1393 vreg(def).init(phi, def, /* isTemp = */ false);
1397 LiveRegisterSet remainingRegisters(allRegisters_.asLiveSet());
1398 while (!remainingRegisters.emptyGeneral()) {
1399 AnyRegister reg = AnyRegister(remainingRegisters.takeAnyGeneral());
1400 registers[reg.code()].allocatable = true;
1402 while (!remainingRegisters.emptyFloat()) {
1403 AnyRegister reg =
1404 AnyRegister(remainingRegisters.takeAnyFloat<RegTypeName::Any>());
1405 registers[reg.code()].allocatable = true;
1408 LifoAlloc* lifoAlloc = mir->alloc().lifoAlloc();
1409 for (size_t i = 0; i < AnyRegister::Total; i++) {
1410 registers[i].reg = AnyRegister::FromCode(i);
1411 registers[i].allocations.setAllocator(lifoAlloc);
1414 hotcode.setAllocator(lifoAlloc);
1415 callRanges.setAllocator(lifoAlloc);
1417 // Partition the graph into hot and cold sections, for helping to make
1418 // splitting decisions. Since we don't have any profiling data this is a
1419 // crapshoot, so just mark the bodies of inner loops as hot and everything
1420 // else as cold.
1422 LBlock* backedge = nullptr;
1423 for (size_t i = 0; i < graph.numBlocks(); i++) {
1424 LBlock* block = graph.getBlock(i);
1426 // If we see a loop header, mark the backedge so we know when we have
1427 // hit the end of the loop. Don't process the loop immediately, so that
1428 // if there is an inner loop we will ignore the outer backedge.
1429 if (block->mir()->isLoopHeader()) {
1430 backedge = block->mir()->backedge()->lir();
1433 if (block == backedge) {
1434 LBlock* header = block->mir()->loopHeaderOfBackedge()->lir();
1435 LiveRange* range = LiveRange::FallibleNew(
1436 alloc(), nullptr, entryOf(header), exitOf(block).next());
1437 if (!range || !hotcode.insert(range)) {
1438 return false;
1443 return true;
1446 ///////////////////////////////////////////////////////////////////////////////
1447 // //
1448 // Liveness analysis //
1449 // //
1450 ///////////////////////////////////////////////////////////////////////////////
1452 // Helper for ::buildLivenessInfo
1453 bool BacktrackingAllocator::addInitialFixedRange(AnyRegister reg,
1454 CodePosition from,
1455 CodePosition to) {
1456 LiveRange* range = LiveRange::FallibleNew(alloc(), nullptr, from, to);
1457 if (!range) {
1458 return false;
1460 LiveRangePlus rangePlus(range);
1461 return registers[reg.code()].allocations.insert(rangePlus);
1464 // Helper for ::buildLivenessInfo
1465 #ifdef DEBUG
1466 // Returns true iff ins has a def/temp reusing the input allocation.
1467 static bool IsInputReused(LInstruction* ins, LUse* use) {
1468 for (size_t i = 0; i < ins->numDefs(); i++) {
1469 if (ins->getDef(i)->policy() == LDefinition::MUST_REUSE_INPUT &&
1470 ins->getOperand(ins->getDef(i)->getReusedInput())->toUse() == use) {
1471 return true;
1475 for (size_t i = 0; i < ins->numTemps(); i++) {
1476 if (ins->getTemp(i)->policy() == LDefinition::MUST_REUSE_INPUT &&
1477 ins->getOperand(ins->getTemp(i)->getReusedInput())->toUse() == use) {
1478 return true;
1482 return false;
1484 #endif
1487 * This function builds up liveness ranges for all virtual registers
1488 * defined in the function.
1490 * The algorithm is based on the one published in:
1492 * Wimmer, Christian, and Michael Franz. "Linear Scan Register Allocation on
1493 * SSA Form." Proceedings of the International Symposium on Code Generation
1494 * and Optimization. Toronto, Ontario, Canada, ACM. 2010. 170-79. PDF.
1496 * The algorithm operates on blocks ordered such that dominators of a block
1497 * are before the block itself, and such that all blocks of a loop are
1498 * contiguous. It proceeds backwards over the instructions in this order,
1499 * marking registers live at their uses, ending their live ranges at
1500 * definitions, and recording which registers are live at the top of every
1501 * block. To deal with loop backedges, registers live at the beginning of
1502 * a loop gain a range covering the entire loop.
1504 bool BacktrackingAllocator::buildLivenessInfo() {
1505 JitSpew(JitSpew_RegAlloc, "Beginning liveness analysis");
1507 Vector<MBasicBlock*, 1, SystemAllocPolicy> loopWorkList;
1508 BitSet loopDone(graph.numBlockIds());
1509 if (!loopDone.init(alloc())) {
1510 return false;
1513 size_t numRanges = 0;
1515 for (size_t i = graph.numBlocks(); i > 0; i--) {
1516 if (mir->shouldCancel("Build Liveness Info (main loop)")) {
1517 return false;
1520 LBlock* block = graph.getBlock(i - 1);
1521 MBasicBlock* mblock = block->mir();
1523 BitSet& live = liveIn[mblock->id()];
1524 new (&live) BitSet(graph.numVirtualRegisters());
1525 if (!live.init(alloc())) {
1526 return false;
1529 // Propagate liveIn from our successors to us.
1530 for (size_t i = 0; i < mblock->lastIns()->numSuccessors(); i++) {
1531 MBasicBlock* successor = mblock->lastIns()->getSuccessor(i);
1532 // Skip backedges, as we fix them up at the loop header.
1533 if (mblock->id() < successor->id()) {
1534 live.insertAll(liveIn[successor->id()]);
1538 // Add successor phis.
1539 if (mblock->successorWithPhis()) {
1540 LBlock* phiSuccessor = mblock->successorWithPhis()->lir();
1541 for (unsigned int j = 0; j < phiSuccessor->numPhis(); j++) {
1542 LPhi* phi = phiSuccessor->getPhi(j);
1543 LAllocation* use = phi->getOperand(mblock->positionInPhiSuccessor());
1544 uint32_t reg = use->toUse()->virtualRegister();
1545 live.insert(reg);
1546 vreg(use).setUsedByPhi();
1550 // Registers are assumed alive for the entire block; a definition shortens
1551 // the range to the point of definition.
1552 for (BitSet::Iterator liveRegId(live); liveRegId; ++liveRegId) {
1553 if (!vregs[*liveRegId].addInitialRange(alloc(), entryOf(block),
1554 exitOf(block).next(), &numRanges))
1555 return false;
1558 // Shorten the front end of ranges for live variables to their point of
1559 // definition, if found.
1560 for (LInstructionReverseIterator ins = block->rbegin();
1561 ins != block->rend(); ins++) {
1562 // Calls may clobber registers, so force a spill and reload around the
1563 // callsite.
1564 if (ins->isCall()) {
1565 for (AnyRegisterIterator iter(allRegisters_.asLiveSet()); iter.more();
1566 ++iter) {
1567 bool found = false;
1568 for (size_t i = 0; i < ins->numDefs(); i++) {
1569 if (ins->getDef(i)->isFixed() &&
1570 ins->getDef(i)->output()->aliases(LAllocation(*iter))) {
1571 found = true;
1572 break;
1575 // If this register doesn't have an explicit def above, mark
1576 // it as clobbered by the call unless it is actually
1577 // call-preserved.
1578 if (!found && !ins->isCallPreserved(*iter)) {
1579 if (!addInitialFixedRange(*iter, outputOf(*ins),
1580 outputOf(*ins).next())) {
1581 return false;
1586 CallRange* callRange = new (alloc().fallible())
1587 CallRange(outputOf(*ins), outputOf(*ins).next());
1588 if (!callRange) {
1589 return false;
1592 callRangesList.pushFront(callRange);
1593 if (!callRanges.insert(callRange)) {
1594 return false;
1598 for (size_t i = 0; i < ins->numDefs(); i++) {
1599 LDefinition* def = ins->getDef(i);
1600 if (def->isBogusTemp()) {
1601 continue;
1604 CodePosition from = outputOf(*ins);
1606 if (def->policy() == LDefinition::MUST_REUSE_INPUT) {
1607 // MUST_REUSE_INPUT is implemented by allocating an output
1608 // register and moving the input to it. Register hints are
1609 // used to avoid unnecessary moves. We give the input an
1610 // LUse::ANY policy to avoid allocating a register for the
1611 // input.
1612 LUse* inputUse = ins->getOperand(def->getReusedInput())->toUse();
1613 MOZ_ASSERT(inputUse->policy() == LUse::REGISTER);
1614 MOZ_ASSERT(inputUse->usedAtStart());
1615 *inputUse = LUse(inputUse->virtualRegister(), LUse::ANY,
1616 /* usedAtStart = */ true);
1619 if (!vreg(def).addInitialRange(alloc(), from, from.next(),
1620 &numRanges)) {
1621 return false;
1623 vreg(def).setInitialDefinition(from);
1624 live.remove(def->virtualRegister());
1627 for (size_t i = 0; i < ins->numTemps(); i++) {
1628 LDefinition* temp = ins->getTemp(i);
1629 if (temp->isBogusTemp()) {
1630 continue;
1633 // Normally temps are considered to cover both the input
1634 // and output of the associated instruction. In some cases
1635 // though we want to use a fixed register as both an input
1636 // and clobbered register in the instruction, so watch for
1637 // this and shorten the temp to cover only the output.
1638 CodePosition from = inputOf(*ins);
1639 if (temp->policy() == LDefinition::FIXED) {
1640 AnyRegister reg = temp->output()->toRegister();
1641 for (LInstruction::InputIterator alloc(**ins); alloc.more();
1642 alloc.next()) {
1643 if (alloc->isUse()) {
1644 LUse* use = alloc->toUse();
1645 if (use->isFixedRegister()) {
1646 if (GetFixedRegister(vreg(use).def(), use) == reg) {
1647 from = outputOf(*ins);
1654 // * For non-call instructions, temps cover both the input and output,
1655 // so temps never alias uses (even at-start uses) or defs.
1656 // * For call instructions, temps only cover the input (the output is
1657 // used for the force-spill ranges added above). This means temps
1658 // still don't alias uses but they can alias the (fixed) defs. For now
1659 // we conservatively require temps to have a fixed register for call
1660 // instructions to prevent a footgun.
1661 MOZ_ASSERT_IF(ins->isCall(), temp->policy() == LDefinition::FIXED);
1662 CodePosition to =
1663 ins->isCall() ? outputOf(*ins) : outputOf(*ins).next();
1665 if (!vreg(temp).addInitialRange(alloc(), from, to, &numRanges)) {
1666 return false;
1668 vreg(temp).setInitialDefinition(from);
1671 DebugOnly<bool> hasUseRegister = false;
1672 DebugOnly<bool> hasUseRegisterAtStart = false;
1674 for (LInstruction::InputIterator inputAlloc(**ins); inputAlloc.more();
1675 inputAlloc.next()) {
1676 if (inputAlloc->isUse()) {
1677 LUse* use = inputAlloc->toUse();
1679 // Call uses should always be at-start, since calls use all
1680 // registers.
1681 MOZ_ASSERT_IF(ins->isCall() && !inputAlloc.isSnapshotInput(),
1682 use->usedAtStart());
1684 #ifdef DEBUG
1685 // If there are both useRegisterAtStart(x) and useRegister(y)
1686 // uses, we may assign the same register to both operands
1687 // (bug 772830). Don't allow this for now.
1688 if (use->policy() == LUse::REGISTER) {
1689 if (use->usedAtStart()) {
1690 if (!IsInputReused(*ins, use)) {
1691 hasUseRegisterAtStart = true;
1693 } else {
1694 hasUseRegister = true;
1697 MOZ_ASSERT(!(hasUseRegister && hasUseRegisterAtStart));
1698 #endif
1700 // Don't treat RECOVERED_INPUT uses as keeping the vreg alive.
1701 if (use->policy() == LUse::RECOVERED_INPUT) {
1702 continue;
1705 CodePosition to = use->usedAtStart() ? inputOf(*ins) : outputOf(*ins);
1706 if (use->isFixedRegister()) {
1707 LAllocation reg(AnyRegister::FromCode(use->registerCode()));
1708 for (size_t i = 0; i < ins->numDefs(); i++) {
1709 LDefinition* def = ins->getDef(i);
1710 if (def->policy() == LDefinition::FIXED &&
1711 *def->output() == reg) {
1712 to = inputOf(*ins);
1717 if (!vreg(use).addInitialRange(alloc(), entryOf(block), to.next(),
1718 &numRanges)) {
1719 return false;
1721 UsePosition* usePosition =
1722 new (alloc().fallible()) UsePosition(use, to);
1723 if (!usePosition) {
1724 return false;
1726 vreg(use).addInitialUse(usePosition);
1727 live.insert(use->virtualRegister());
1732 // Phis have simultaneous assignment semantics at block begin, so at
1733 // the beginning of the block we can be sure that liveIn does not
1734 // contain any phi outputs.
1735 for (unsigned int i = 0; i < block->numPhis(); i++) {
1736 LDefinition* def = block->getPhi(i)->getDef(0);
1737 if (live.contains(def->virtualRegister())) {
1738 live.remove(def->virtualRegister());
1739 } else {
1740 // This is a dead phi, so add a dummy range over all phis. This
1741 // can go away if we have an earlier dead code elimination pass.
1742 CodePosition entryPos = entryOf(block);
1743 if (!vreg(def).addInitialRange(alloc(), entryPos, entryPos.next(),
1744 &numRanges)) {
1745 return false;
1750 if (mblock->isLoopHeader()) {
1751 // A divergence from the published algorithm is required here, as
1752 // our block order does not guarantee that blocks of a loop are
1753 // contiguous. As a result, a single live range spanning the
1754 // loop is not possible. Additionally, we require liveIn in a later
1755 // pass for resolution, so that must also be fixed up here.
1756 MBasicBlock* loopBlock = mblock->backedge();
1757 while (true) {
1758 // Blocks must already have been visited to have a liveIn set.
1759 MOZ_ASSERT(loopBlock->id() >= mblock->id());
1761 // Add a range for this entire loop block
1762 CodePosition from = entryOf(loopBlock->lir());
1763 CodePosition to = exitOf(loopBlock->lir()).next();
1765 for (BitSet::Iterator liveRegId(live); liveRegId; ++liveRegId) {
1766 if (!vregs[*liveRegId].addInitialRange(alloc(), from, to,
1767 &numRanges)) {
1768 return false;
1772 // Fix up the liveIn set.
1773 liveIn[loopBlock->id()].insertAll(live);
1775 // Make sure we don't visit this node again
1776 loopDone.insert(loopBlock->id());
1778 // If this is the loop header, any predecessors are either the
1779 // backedge or out of the loop, so skip any predecessors of
1780 // this block
1781 if (loopBlock != mblock) {
1782 for (size_t i = 0; i < loopBlock->numPredecessors(); i++) {
1783 MBasicBlock* pred = loopBlock->getPredecessor(i);
1784 if (loopDone.contains(pred->id())) {
1785 continue;
1787 if (!loopWorkList.append(pred)) {
1788 return false;
1793 // Terminate loop if out of work.
1794 if (loopWorkList.empty()) {
1795 break;
1798 // Grab the next block off the work list, skipping any OSR block.
1799 MBasicBlock* osrBlock = graph.mir().osrBlock();
1800 while (!loopWorkList.empty()) {
1801 loopBlock = loopWorkList.popCopy();
1802 if (loopBlock != osrBlock) {
1803 break;
1807 // If end is reached without finding a non-OSR block, then no more work
1808 // items were found.
1809 if (loopBlock == osrBlock) {
1810 MOZ_ASSERT(loopWorkList.empty());
1811 break;
1815 // Clear the done set for other loops
1816 loopDone.clear();
1819 MOZ_ASSERT_IF(!mblock->numPredecessors(), live.empty());
1822 JitSpew(JitSpew_RegAlloc, "Completed liveness analysis");
1823 return true;
1826 ///////////////////////////////////////////////////////////////////////////////
1827 // //
1828 // Merging and queueing of LiveRange groups //
1829 // //
1830 ///////////////////////////////////////////////////////////////////////////////
1832 // Helper for ::tryMergeBundles
1833 static bool IsArgumentSlotDefinition(LDefinition* def) {
1834 return def->policy() == LDefinition::FIXED && def->output()->isArgument();
1837 // Helper for ::tryMergeBundles
1838 static bool IsThisSlotDefinition(LDefinition* def) {
1839 return IsArgumentSlotDefinition(def) &&
1840 def->output()->toArgument()->index() <
1841 THIS_FRAME_ARGSLOT + sizeof(Value);
1844 // Helper for ::tryMergeBundles
1845 static bool HasStackPolicy(LDefinition* def) {
1846 return def->policy() == LDefinition::STACK;
1849 // Helper for ::tryMergeBundles
1850 static bool CanMergeTypesInBundle(LDefinition::Type a, LDefinition::Type b) {
1851 // Fast path for the common case.
1852 if (a == b) {
1853 return true;
1856 // Only merge if the sizes match, so that we don't get confused about the
1857 // width of spill slots.
1858 return StackSlotAllocator::width(a) == StackSlotAllocator::width(b);
1861 // Helper for ::tryMergeReusedRegister
1862 bool BacktrackingAllocator::tryMergeBundles(LiveBundle* bundle0,
1863 LiveBundle* bundle1) {
1864 // See if bundle0 and bundle1 can be merged together.
1865 if (bundle0 == bundle1) {
1866 return true;
1869 // Get a representative virtual register from each bundle.
1870 VirtualRegister& reg0 = bundle0->firstRange()->vreg();
1871 VirtualRegister& reg1 = bundle1->firstRange()->vreg();
1873 MOZ_ASSERT(CanMergeTypesInBundle(reg0.type(), reg1.type()));
1874 MOZ_ASSERT(reg0.isCompatible(reg1));
1876 // Registers which might spill to the frame's |this| slot can only be
1877 // grouped with other such registers. The frame's |this| slot must always
1878 // hold the |this| value, as required by JitFrame tracing and by the Ion
1879 // constructor calling convention.
1880 if (IsThisSlotDefinition(reg0.def()) || IsThisSlotDefinition(reg1.def())) {
1881 if (*reg0.def()->output() != *reg1.def()->output()) {
1882 return true;
1886 // Registers which might spill to the frame's argument slots can only be
1887 // grouped with other such registers if the frame might access those
1888 // arguments through a lazy arguments object or rest parameter.
1889 if (IsArgumentSlotDefinition(reg0.def()) ||
1890 IsArgumentSlotDefinition(reg1.def())) {
1891 if (graph.mir().entryBlock()->info().mayReadFrameArgsDirectly()) {
1892 if (*reg0.def()->output() != *reg1.def()->output()) {
1893 return true;
1898 // When we make a call to a WebAssembly function that returns multiple
1899 // results, some of those results can go on the stack. The callee is passed a
1900 // pointer to this stack area, which is represented as having policy
1901 // LDefinition::STACK (with type LDefinition::STACKRESULTS). Individual
1902 // results alias parts of the stack area with a value-appropriate type, but
1903 // policy LDefinition::STACK. This aliasing between allocations makes it
1904 // unsound to merge anything with a LDefinition::STACK policy.
1905 if (HasStackPolicy(reg0.def()) || HasStackPolicy(reg1.def())) {
1906 return true;
1909 // Limit the number of times we compare ranges if there are many ranges in
1910 // one of the bundles, to avoid quadratic behavior.
1911 static const size_t MAX_RANGES = 200;
1913 // Make sure that ranges in the bundles do not overlap.
1914 LiveRange::BundleLinkIterator iter0 = bundle0->rangesBegin(),
1915 iter1 = bundle1->rangesBegin();
1916 size_t count = 0;
1917 while (iter0 && iter1) {
1918 if (++count >= MAX_RANGES) {
1919 return true;
1922 LiveRange* range0 = LiveRange::get(*iter0);
1923 LiveRange* range1 = LiveRange::get(*iter1);
1925 if (range0->from() >= range1->to()) {
1926 iter1++;
1927 } else if (range1->from() >= range0->to()) {
1928 iter0++;
1929 } else {
1930 return true;
1934 // Move all ranges from bundle1 into bundle0.
1935 while (LiveRange* range = bundle1->popFirstRange()) {
1936 bundle0->addRange(range);
1939 return true;
1942 // Helper for ::mergeAndQueueRegisters
1943 void BacktrackingAllocator::allocateStackDefinition(VirtualRegister& reg) {
1944 LInstruction* ins = reg.ins()->toInstruction();
1945 if (reg.def()->type() == LDefinition::STACKRESULTS) {
1946 LStackArea alloc(ins->toInstruction());
1947 stackSlotAllocator.allocateStackArea(&alloc);
1948 reg.def()->setOutput(alloc);
1949 } else {
1950 // Because the definitions are visited in order, the area has been allocated
1951 // before we reach this result, so we know the operand is an LStackArea.
1952 const LUse* use = ins->getOperand(0)->toUse();
1953 VirtualRegister& area = vregs[use->virtualRegister()];
1954 const LStackArea* areaAlloc = area.def()->output()->toStackArea();
1955 reg.def()->setOutput(areaAlloc->resultAlloc(ins, reg.def()));
1959 // Helper for ::mergeAndQueueRegisters
1960 bool BacktrackingAllocator::tryMergeReusedRegister(VirtualRegister& def,
1961 VirtualRegister& input) {
1962 // def is a vreg which reuses input for its output physical register. Try
1963 // to merge ranges for def with those of input if possible, as avoiding
1964 // copies before def's instruction is crucial for generated code quality
1965 // (MUST_REUSE_INPUT is used for all arithmetic on x86/x64).
1967 if (def.rangeFor(inputOf(def.ins()))) {
1968 MOZ_ASSERT(def.isTemp());
1969 def.setMustCopyInput();
1970 return true;
1973 if (!CanMergeTypesInBundle(def.type(), input.type())) {
1974 def.setMustCopyInput();
1975 return true;
1978 LiveRange* inputRange = input.rangeFor(outputOf(def.ins()));
1979 if (!inputRange) {
1980 // The input is not live after the instruction, either in a safepoint
1981 // for the instruction or in subsequent code. The input and output
1982 // can thus be in the same group.
1983 return tryMergeBundles(def.firstBundle(), input.firstBundle());
1986 // Avoid merging in very large live ranges as merging has non-linear
1987 // complexity. The cutoff value is hard to gauge. 1M was chosen because it
1988 // is "large" and yet usefully caps compile time on AutoCad-for-the-web to
1989 // something reasonable on a 2017-era desktop system.
1990 const uint32_t RANGE_SIZE_CUTOFF = 1000000;
1991 if (inputRange->to() - inputRange->from() > RANGE_SIZE_CUTOFF) {
1992 def.setMustCopyInput();
1993 return true;
1996 // The input is live afterwards, either in future instructions or in a
1997 // safepoint for the reusing instruction. This is impossible to satisfy
1998 // without copying the input.
2000 // It may or may not be better to split the input into two bundles at the
2001 // point of the definition, which may permit merging. One case where it is
2002 // definitely better to split is if the input never has any register uses
2003 // after the instruction. Handle this splitting eagerly.
2005 LBlock* block = def.ins()->block();
2007 // The input's lifetime must end within the same block as the definition,
2008 // otherwise it could live on in phis elsewhere.
2009 if (inputRange != input.lastRange() || inputRange->to() > exitOf(block)) {
2010 def.setMustCopyInput();
2011 return true;
2014 // If we already split the input for some other register, don't make a
2015 // third bundle.
2016 if (inputRange->bundle() != input.firstRange()->bundle()) {
2017 def.setMustCopyInput();
2018 return true;
2021 // If the input will start out in memory then adding a separate bundle for
2022 // memory uses after the def won't help.
2023 if (input.def()->isFixed() && !input.def()->output()->isRegister()) {
2024 def.setMustCopyInput();
2025 return true;
2028 // The input cannot have register or reused uses after the definition.
2029 for (UsePositionIterator iter = inputRange->usesBegin(); iter; iter++) {
2030 if (iter->pos <= inputOf(def.ins())) {
2031 continue;
2034 LUse* use = iter->use();
2035 if (FindReusingDefOrTemp(insData[iter->pos], use)) {
2036 def.setMustCopyInput();
2037 return true;
2039 if (iter->usePolicy() != LUse::ANY &&
2040 iter->usePolicy() != LUse::KEEPALIVE) {
2041 def.setMustCopyInput();
2042 return true;
2046 LiveRange* preRange = LiveRange::FallibleNew(
2047 alloc(), &input, inputRange->from(), outputOf(def.ins()));
2048 if (!preRange) {
2049 return false;
2052 // The new range starts at reg's input position, which means it overlaps
2053 // with the old range at one position. This is what we want, because we
2054 // need to copy the input before the instruction.
2055 LiveRange* postRange = LiveRange::FallibleNew(
2056 alloc(), &input, inputOf(def.ins()), inputRange->to());
2057 if (!postRange) {
2058 return false;
2061 inputRange->tryToMoveDefAndUsesInto(preRange);
2062 inputRange->tryToMoveDefAndUsesInto(postRange);
2063 MOZ_ASSERT(!inputRange->hasUses());
2065 JitSpewIfEnabled(JitSpew_RegAlloc,
2066 " splitting reused input at %u to try to help grouping",
2067 inputOf(def.ins()).bits());
2069 LiveBundle* firstBundle = inputRange->bundle();
2070 input.removeRange(inputRange);
2071 input.addRange(preRange);
2072 input.addRange(postRange);
2074 firstBundle->removeRange(inputRange);
2075 firstBundle->addRange(preRange);
2077 // The new range goes in a separate bundle, where it will be spilled during
2078 // allocation.
2079 LiveBundle* secondBundle = LiveBundle::FallibleNew(alloc(), nullptr, nullptr);
2080 if (!secondBundle) {
2081 return false;
2083 secondBundle->addRange(postRange);
2085 return tryMergeBundles(def.firstBundle(), input.firstBundle());
2088 bool BacktrackingAllocator::mergeAndQueueRegisters() {
2089 MOZ_ASSERT(!vregs[0u].hasRanges());
2091 // Create a bundle for each register containing all its ranges.
2092 for (size_t i = 1; i < graph.numVirtualRegisters(); i++) {
2093 VirtualRegister& reg = vregs[i];
2094 if (!reg.hasRanges()) {
2095 continue;
2098 LiveBundle* bundle = LiveBundle::FallibleNew(alloc(), nullptr, nullptr);
2099 if (!bundle) {
2100 return false;
2102 for (LiveRange::RegisterLinkIterator iter = reg.rangesBegin(); iter;
2103 iter++) {
2104 LiveRange* range = LiveRange::get(*iter);
2105 bundle->addRange(range);
2109 // If there is an OSR block, merge parameters in that block with the
2110 // corresponding parameters in the initial block.
2111 if (MBasicBlock* osr = graph.mir().osrBlock()) {
2112 size_t original = 1;
2113 for (LInstructionIterator iter = osr->lir()->begin();
2114 iter != osr->lir()->end(); iter++) {
2115 if (iter->isParameter()) {
2116 for (size_t i = 0; i < iter->numDefs(); i++) {
2117 DebugOnly<bool> found = false;
2118 VirtualRegister& paramVreg = vreg(iter->getDef(i));
2119 for (; original < paramVreg.vreg(); original++) {
2120 VirtualRegister& originalVreg = vregs[original];
2121 if (*originalVreg.def()->output() == *iter->getDef(i)->output()) {
2122 MOZ_ASSERT(originalVreg.ins()->isParameter());
2123 if (!tryMergeBundles(originalVreg.firstBundle(),
2124 paramVreg.firstBundle())) {
2125 return false;
2127 found = true;
2128 break;
2131 MOZ_ASSERT(found);
2137 // Try to merge registers with their reused inputs.
2138 for (size_t i = 1; i < graph.numVirtualRegisters(); i++) {
2139 VirtualRegister& reg = vregs[i];
2140 if (!reg.hasRanges()) {
2141 continue;
2144 if (reg.def()->policy() == LDefinition::MUST_REUSE_INPUT) {
2145 LUse* use = reg.ins()
2146 ->toInstruction()
2147 ->getOperand(reg.def()->getReusedInput())
2148 ->toUse();
2149 if (!tryMergeReusedRegister(reg, vreg(use))) {
2150 return false;
2155 // Try to merge phis with their inputs.
2156 for (size_t i = 0; i < graph.numBlocks(); i++) {
2157 LBlock* block = graph.getBlock(i);
2158 for (size_t j = 0; j < block->numPhis(); j++) {
2159 LPhi* phi = block->getPhi(j);
2160 VirtualRegister& outputVreg = vreg(phi->getDef(0));
2161 for (size_t k = 0, kend = phi->numOperands(); k < kend; k++) {
2162 VirtualRegister& inputVreg = vreg(phi->getOperand(k)->toUse());
2163 if (!tryMergeBundles(inputVreg.firstBundle(),
2164 outputVreg.firstBundle())) {
2165 return false;
2171 // Add all bundles to the allocation queue, and create spill sets for them.
2172 for (size_t i = 1; i < graph.numVirtualRegisters(); i++) {
2173 VirtualRegister& reg = vregs[i];
2175 // Eagerly allocate stack result areas and their component stack results.
2176 if (reg.def() && reg.def()->policy() == LDefinition::STACK) {
2177 allocateStackDefinition(reg);
2180 for (LiveRange::RegisterLinkIterator iter = reg.rangesBegin(); iter;
2181 iter++) {
2182 LiveRange* range = LiveRange::get(*iter);
2183 LiveBundle* bundle = range->bundle();
2184 if (range == bundle->firstRange()) {
2185 if (!alloc().ensureBallast()) {
2186 return false;
2189 SpillSet* spill = SpillSet::New(alloc());
2190 if (!spill) {
2191 return false;
2193 bundle->setSpillSet(spill);
2195 size_t priority = computePriority(bundle);
2196 if (!allocationQueue.insert(QueueItem(bundle, priority))) {
2197 return false;
2203 return true;
2206 ///////////////////////////////////////////////////////////////////////////////
2207 // //
2208 // Code for the splitting/spilling subsystem begins here. //
2209 // //
2210 // The code that follows is structured in the following sequence: //
2211 // //
2212 // (1) Routines that are helpers for ::splitAt. //
2213 // (2) ::splitAt itself, which implements splitting decisions. //
2214 // (3) heuristic routines (eg ::splitAcrossCalls), which decide where //
2215 // splits should be made. They then call ::splitAt to perform the //
2216 // chosen split. //
2217 // (4) The top level driver, ::chooseBundleSplit. //
2218 // //
2219 // There are further comments on ::splitAt and ::chooseBundleSplit below. //
2220 // //
2221 ///////////////////////////////////////////////////////////////////////////////
2223 ///////////////////////////////////////////////////////////////////////////////
2224 // //
2225 // Implementation of splitting decisions, but not the making of those //
2226 // decisions: various helper functions //
2227 // //
2228 ///////////////////////////////////////////////////////////////////////////////
2230 bool BacktrackingAllocator::updateVirtualRegisterListsThenRequeueBundles(
2231 LiveBundle* bundle, const LiveBundleVector& newBundles) {
2232 #ifdef DEBUG
2233 if (newBundles.length() == 1) {
2234 LiveBundle* newBundle = newBundles[0];
2235 if (newBundle->numRanges() == bundle->numRanges() &&
2236 computePriority(newBundle) == computePriority(bundle)) {
2237 bool different = false;
2238 LiveRange::BundleLinkIterator oldRanges = bundle->rangesBegin();
2239 LiveRange::BundleLinkIterator newRanges = newBundle->rangesBegin();
2240 while (oldRanges) {
2241 LiveRange* oldRange = LiveRange::get(*oldRanges);
2242 LiveRange* newRange = LiveRange::get(*newRanges);
2243 if (oldRange->from() != newRange->from() ||
2244 oldRange->to() != newRange->to()) {
2245 different = true;
2246 break;
2248 oldRanges++;
2249 newRanges++;
2252 // This is likely to trigger an infinite loop in register allocation. This
2253 // can be the result of invalid register constraints, making regalloc
2254 // impossible; consider relaxing those.
2255 MOZ_ASSERT(different,
2256 "Split results in the same bundle with the same priority");
2259 #endif
2261 if (JitSpewEnabled(JitSpew_RegAlloc)) {
2262 JitSpew(JitSpew_RegAlloc, " .. into:");
2263 for (size_t i = 0; i < newBundles.length(); i++) {
2264 JitSpew(JitSpew_RegAlloc, " %s", newBundles[i]->toString().get());
2268 // Remove all ranges in the old bundle from their register's list.
2269 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
2270 iter++) {
2271 LiveRange* range = LiveRange::get(*iter);
2272 range->vreg().removeRange(range);
2275 // Add all ranges in the new bundles to their register's list.
2276 for (size_t i = 0; i < newBundles.length(); i++) {
2277 LiveBundle* newBundle = newBundles[i];
2278 for (LiveRange::BundleLinkIterator iter = newBundle->rangesBegin(); iter;
2279 iter++) {
2280 LiveRange* range = LiveRange::get(*iter);
2281 range->vreg().addRange(range);
2285 // Queue the new bundles for register assignment.
2286 for (size_t i = 0; i < newBundles.length(); i++) {
2287 LiveBundle* newBundle = newBundles[i];
2288 size_t priority = computePriority(newBundle);
2289 if (!allocationQueue.insert(QueueItem(newBundle, priority))) {
2290 return false;
2294 return true;
2297 // Helper for ::splitAt
2298 // When splitting a bundle according to a list of split positions, return
2299 // whether a use or range at |pos| should use a different bundle than the last
2300 // position this was called for.
2301 static bool UseNewBundle(const SplitPositionVector& splitPositions,
2302 CodePosition pos, size_t* activeSplitPosition) {
2303 if (splitPositions.empty()) {
2304 // When the split positions are empty we are splitting at all uses.
2305 return true;
2308 if (*activeSplitPosition == splitPositions.length()) {
2309 // We've advanced past all split positions.
2310 return false;
2313 if (splitPositions[*activeSplitPosition] > pos) {
2314 // We haven't gotten to the next split position yet.
2315 return false;
2318 // We've advanced past the next split position, find the next one which we
2319 // should split at.
2320 while (*activeSplitPosition < splitPositions.length() &&
2321 splitPositions[*activeSplitPosition] <= pos) {
2322 (*activeSplitPosition)++;
2324 return true;
2327 // Helper for ::splitAt
2328 static bool HasPrecedingRangeSharingVreg(LiveBundle* bundle, LiveRange* range) {
2329 MOZ_ASSERT(range->bundle() == bundle);
2331 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
2332 iter++) {
2333 LiveRange* prevRange = LiveRange::get(*iter);
2334 if (prevRange == range) {
2335 return false;
2337 if (&prevRange->vreg() == &range->vreg()) {
2338 return true;
2342 MOZ_CRASH();
2345 // Helper for ::splitAt
2346 static bool HasFollowingRangeSharingVreg(LiveBundle* bundle, LiveRange* range) {
2347 MOZ_ASSERT(range->bundle() == bundle);
2349 bool foundRange = false;
2350 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
2351 iter++) {
2352 LiveRange* prevRange = LiveRange::get(*iter);
2353 if (foundRange && &prevRange->vreg() == &range->vreg()) {
2354 return true;
2356 if (prevRange == range) {
2357 foundRange = true;
2361 MOZ_ASSERT(foundRange);
2362 return false;
2365 ///////////////////////////////////////////////////////////////////////////////
2366 // //
2367 // Implementation of splitting decisions, but not the making of those //
2368 // decisions: //
2369 // ::splitAt //
2370 // //
2371 ///////////////////////////////////////////////////////////////////////////////
2373 // ::splitAt
2374 // ---------
2375 // It would be nice to be able to interpret ::splitAt as simply performing
2376 // whatever split the heuristic routines decide on. Unfortunately it
2377 // tries to "improve" on the initial locations, which as
2378 // https://bugzilla.mozilla.org/show_bug.cgi?id=1758274#c17 shows, often
2379 // leads to excessive spilling. So there is no clean distinction between
2380 // policy (where to split, computed by the heuristic routines) and
2381 // implementation (done by ::splitAt).
2383 // ::splitAt -- creation of spill parent bundles
2384 // ---------------------------------------------
2385 // To understand what ::splitAt does, we must refer back to Section 1's
2386 // description of LiveBundle::spillParent_.
2388 // Initially (as created by Phase 1), all bundles have `spillParent_` being
2389 // NULL. If ::splitAt is asked to split such a bundle, it will first create a
2390 // "spill bundle" or "spill parent" bundle. This is a copy of the original,
2391 // with two changes:
2393 // * all register uses have been removed, so that only stack-compatible uses
2394 // remain.
2396 // * for all LiveRanges in the bundle that define a register, the start point
2397 // of the range is moved one CodePosition forwards, thusly:
2399 // from = minimalDefEnd(insData[from]).next();
2401 // The reason for the latter relates to the idea described in Section 1, that
2402 // all LiveRanges for any given VirtualRegister must form a tree rooted at the
2403 // defining LiveRange. If the spill-bundle definition range start points are
2404 // the same as those in the original bundle, then we will end up with two roots
2405 // for the tree, and it is then unclear which one should supply "the value".
2407 // Putting the spill-bundle start point one CodePosition further along causes
2408 // the range containing the register def (after splitting) to still be the
2409 // defining point. ::createMoveGroupsFromLiveRangeTransitions will observe the
2410 // equivalent spill-bundle range starting one point later and add a MoveGroup
2411 // to move the value into it. Since the spill bundle is intended to be stack
2412 // resident, the effect is to force creation of the MoveGroup that will
2413 // actually spill this value onto the stack.
2415 // If the bundle provided to ::splitAt already has a spill parent, then
2416 // ::splitAt doesn't create a new spill parent. This situation will happen
2417 // when the bundle to be split was itself created by splitting. The effect is
2418 // that *all* bundles created from an "original bundle" share the same spill
2419 // parent, and hence they will share the same spill slot, which guarantees that
2420 // all the spilled fragments of a VirtualRegister share the same spill slot,
2421 // which means we'll never have to move a VirtualRegister between different
2422 // spill slots during its lifetime.
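//
// As a worked illustration of that sharing property (the bundle names here are
// hypothetical; the calls shown are the ones ::splitAt itself makes):
//
//   B0 starts out with spillParent_ == NULL.
//   splitAt(B0, ..) creates S (the spill parent) plus B1 and B2, where
//       B1->spillParent() == B2->spillParent() == S
//   splitAt(B1, ..) later creates B3 and B4 but no new spill parent, so
//       B3->spillParent() == B4->spillParent() == S
//
// Every fragment ultimately derived from B0 therefore spills through the
// single bundle S, and hence through a single stack slot.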
2424 // ::splitAt -- creation of other bundles
2425 // --------------------------------------
2426 // With the spill parent bundle question out of the way, ::splitAt then goes on
2427 // to create the remaining new bundles, using near-incomprehensible logic
2428 // steered by `UseNewBundle`.
2430 // This supposedly splits the bundle at the positions given by the
2431 // `SplitPositionVector` parameter to ::splitAt, putting them in a temporary
2432 // vector `newBundles`. Whether it really splits at the requested positions or
2433 // not is hard to say; more important is what happens next.
2435 // ::splitAt -- "improvement" ("filtering") of the split bundles
2436 // -------------------------------------------------------------
2437 // ::splitAt now tries to reduce the length of the LiveRanges that make up the
2438 // new bundles (not including the "spill parent"). I assume this is to remove
2439 // sections of the bundles that carry no useful value (eg, extending after the
2440 // last use in a range), thereby removing the demand for registers in those
2441 // parts. This does however mean that ::splitAt is no longer really splitting
2442 // where the heuristic routines wanted, and that can lead to a big increase in
2443 // spilling in loops, as
2444 // https://bugzilla.mozilla.org/show_bug.cgi?id=1758274#c17 describes.
2446 // ::splitAt -- meaning of the incoming `SplitPositionVector`
2447 // ----------------------------------------------------------
2448 // ::splitAt has one last mystery which is important to document. The split
2449 // positions are specified as CodePositions, but this leads to ambiguity
2450 // because, in a sequence of N (LIR) instructions, there are 2N valid
2451 // CodePositions. For example:
2453 // 6-7 WasmLoadTls [def v2<o>] [use v1:R]
2454 // 8-9 WasmNullConstant [def v3<o>]
2456 // Consider splitting the range for `v2`, which starts at CodePosition 7.
2457 // What's the difference between saying "split it at 7" and "split it at 8" ?
2458 // Not much really, since in both cases what we intend is for the range to be
2459 // split in between the two instructions.
2461 // Hence I believe the semantics is:
2463 // * splitting at an even numbered CodePosition (eg, 8), which is an input-side
2464 // position, means "split before the instruction containing this position".
2466 // * splitting at an odd numbered CodePosition (eg, 7), which is an output-side
2467 // position, means "split after the instruction containing this position".
2469 // Hence in the example, we could specify either 7 or 8 to mean the same
2470 // placement of the split. Well, almost true, but actually:
2472 // (SPEC) specifying 8 means
2474 // "split between these two insns, and any resulting MoveGroup goes in the
2475 // list to be emitted before the start of the second insn"
2477 // (SPEC) specifying 7 means
2479 // "split between these two insns, and any resulting MoveGroup goes in the
2480 // list to be emitted after the end of the first insn"
2482 // In most cases we don't care on which "side of the valley" the MoveGroup ends
2483 // up, in which case we can use either convention.
2485 // (SPEC) I believe these semantics are implied by the logic in
2486 // ::createMoveGroupsFromLiveRangeTransitions. They are certainly not
2487 // documented anywhere in the code.
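//
// A minimal sketch of that reading (this helper does not exist in the code; it
// only assumes, per the numbering in the example above, that input-side
// positions are even and output-side positions are odd):
//
//   static bool SplitGoesBeforeContainingIns(CodePosition pos) {
//     // Even (input-side): any resulting MoveGroup is emitted before the
//     // instruction containing |pos|.  Odd (output-side): it is emitted
//     // after the instruction containing |pos| instead.
//     return (pos.bits() & 1) == 0;
//   }
//
// In the example, passing 8 places the moves before the WasmNullConstant,
// while passing 7 places them after the WasmLoadTls.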
2489 bool BacktrackingAllocator::splitAt(LiveBundle* bundle,
2490 const SplitPositionVector& splitPositions) {
2491 // Split the bundle at the given split points. Register uses which have no
2492 // intervening split points are consolidated into the same bundle. If the
2493 // list of split points is empty, then all register uses are placed in
2494 // minimal bundles.
2496 // splitPositions should be sorted.
2497 for (size_t i = 1; i < splitPositions.length(); ++i) {
2498 MOZ_ASSERT(splitPositions[i - 1] < splitPositions[i]);
2501 // We don't need to create a new spill bundle if there already is one.
2502 bool spillBundleIsNew = false;
2503 LiveBundle* spillBundle = bundle->spillParent();
2504 if (!spillBundle) {
2505 spillBundle = LiveBundle::FallibleNew(alloc(), bundle->spillSet(), nullptr);
2506 if (!spillBundle) {
2507 return false;
2509 spillBundleIsNew = true;
2511 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
2512 iter++) {
2513 LiveRange* range = LiveRange::get(*iter);
2515 CodePosition from = range->from();
2516 if (isRegisterDefinition(range)) {
2517 from = minimalDefEnd(insData[from]).next();
2520 if (from < range->to()) {
2521 if (!spillBundle->addRange(alloc(), &range->vreg(), from,
2522 range->to())) {
2523 return false;
2526 if (range->hasDefinition() && !isRegisterDefinition(range)) {
2527 spillBundle->lastRange()->setHasDefinition();
2533 LiveBundleVector newBundles;
2535 // The bundle which ranges are currently being added to.
2536 LiveBundle* activeBundle =
2537 LiveBundle::FallibleNew(alloc(), bundle->spillSet(), spillBundle);
2538 if (!activeBundle || !newBundles.append(activeBundle)) {
2539 return false;
2542 // State for use by UseNewBundle.
2543 size_t activeSplitPosition = 0;
2545 // Make new bundles according to the split positions, and distribute ranges
2546 // and uses to them.
2547 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
2548 iter++) {
2549 LiveRange* range = LiveRange::get(*iter);
2551 if (UseNewBundle(splitPositions, range->from(), &activeSplitPosition)) {
2552 activeBundle =
2553 LiveBundle::FallibleNew(alloc(), bundle->spillSet(), spillBundle);
2554 if (!activeBundle || !newBundles.append(activeBundle)) {
2555 return false;
2559 LiveRange* activeRange = LiveRange::FallibleNew(alloc(), &range->vreg(),
2560 range->from(), range->to());
2561 if (!activeRange) {
2562 return false;
2564 activeBundle->addRange(activeRange);
2566 if (isRegisterDefinition(range)) {
2567 activeRange->setHasDefinition();
2570 while (range->hasUses()) {
2571 UsePosition* use = range->popUse();
2572 LNode* ins = insData[use->pos];
2574 // Any uses of a register that appear before its definition has
2575 // finished must be associated with the range for that definition.
2576 if (isRegisterDefinition(range) &&
2577 use->pos <= minimalDefEnd(insData[range->from()])) {
2578 activeRange->addUse(use);
2579 } else if (isRegisterUse(use, ins)) {
2580 // Place this register use into a different bundle from the
2581 // last one if there are any split points between the two uses.
2582 // UseNewBundle always returns true if we are splitting at all
2583 // register uses, but we can still reuse the last range and
2584 // bundle if they have uses at the same position, except when
2585 // either use is fixed (the two uses might require incompatible
2586 // registers.)
2587 if (UseNewBundle(splitPositions, use->pos, &activeSplitPosition) &&
2588 (!activeRange->hasUses() ||
2589 activeRange->usesBegin()->pos != use->pos ||
2590 activeRange->usesBegin()->usePolicy() == LUse::FIXED ||
2591 use->usePolicy() == LUse::FIXED)) {
2592 activeBundle =
2593 LiveBundle::FallibleNew(alloc(), bundle->spillSet(), spillBundle);
2594 if (!activeBundle || !newBundles.append(activeBundle)) {
2595 return false;
2597 activeRange = LiveRange::FallibleNew(alloc(), &range->vreg(),
2598 range->from(), range->to());
2599 if (!activeRange) {
2600 return false;
2602 activeBundle->addRange(activeRange);
2605 activeRange->addUse(use);
2606 } else {
2607 MOZ_ASSERT(spillBundleIsNew);
2608 spillBundle->rangeFor(use->pos)->addUse(use);
2613 LiveBundleVector filteredBundles;
2615 // Trim the ends of ranges in each new bundle when there are no other
2616 // earlier or later ranges in the same bundle with the same vreg.
2617 for (size_t i = 0; i < newBundles.length(); i++) {
2618 LiveBundle* bundle = newBundles[i];
2620 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;) {
2621 LiveRange* range = LiveRange::get(*iter);
2623 if (!range->hasDefinition()) {
2624 if (!HasPrecedingRangeSharingVreg(bundle, range)) {
2625 if (range->hasUses()) {
2626 UsePosition* use = *range->usesBegin();
2627 range->setFrom(inputOf(insData[use->pos]));
2628 } else {
2629 bundle->removeRangeAndIncrementIterator(iter);
2630 continue;
2635 if (!HasFollowingRangeSharingVreg(bundle, range)) {
2636 if (range->hasUses()) {
2637 UsePosition* use = range->lastUse();
2638 range->setTo(use->pos.next());
2639 } else if (range->hasDefinition()) {
2640 range->setTo(minimalDefEnd(insData[range->from()]).next());
2641 } else {
2642 bundle->removeRangeAndIncrementIterator(iter);
2643 continue;
2647 iter++;
2650 if (bundle->hasRanges() && !filteredBundles.append(bundle)) {
2651 return false;
2655 if (spillBundleIsNew && !filteredBundles.append(spillBundle)) {
2656 return false;
2659 return updateVirtualRegisterListsThenRequeueBundles(bundle, filteredBundles);
2662 ///////////////////////////////////////////////////////////////////////////////
2663 // //
2664 // Creation of splitting decisions, but not their implementation: //
2665 // ::splitAcrossCalls //
2666 // ::trySplitAcrossHotcode //
2667 // ::trySplitAfterLastRegisterUse //
2668 // ::trySplitBeforeFirstRegisterUse //
2669 // //
2670 ///////////////////////////////////////////////////////////////////////////////
2672 bool BacktrackingAllocator::splitAcrossCalls(LiveBundle* bundle) {
2673 // Split the bundle to separate register uses and non-register uses and
2674 // allow the vreg to be spilled across its range.
2676 // Find the locations of all calls in the bundle's range.
2677 SplitPositionVector callPositions;
2678 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
2679 iter++) {
2680 LiveRange* range = LiveRange::get(*iter);
2681 CallRange searchRange(range->from(), range->to());
2682 CallRange* callRange;
2683 if (!callRanges.contains(&searchRange, &callRange)) {
2684 // There are no calls inside this range.
2685 continue;
2687 MOZ_ASSERT(range->covers(callRange->range.from));
2689 // The search above returns an arbitrary call within the range. Walk
2690 // backwards to find the first call in the range.
2691 for (CallRangeList::reverse_iterator riter =
2692 callRangesList.rbegin(callRange);
2693 riter != callRangesList.rend(); ++riter) {
2694 CodePosition pos = riter->range.from;
2695 if (range->covers(pos)) {
2696 callRange = *riter;
2697 } else {
2698 break;
2702 // Add all call positions within the range, by walking forwards.
2703 for (CallRangeList::iterator iter = callRangesList.begin(callRange);
2704 iter != callRangesList.end(); ++iter) {
2705 CodePosition pos = iter->range.from;
2706 if (!range->covers(pos)) {
2707 break;
2710 // Calls at the beginning of the range are ignored; there is no splitting
2711 // to do.
2712 if (range->covers(pos.previous())) {
2713 MOZ_ASSERT_IF(callPositions.length(), pos > callPositions.back());
2714 if (!callPositions.append(pos)) {
2715 return false;
2720 MOZ_ASSERT(callPositions.length());
2722 #ifdef JS_JITSPEW
2723 JitSpewStart(JitSpew_RegAlloc, " .. split across calls at ");
2724 for (size_t i = 0; i < callPositions.length(); ++i) {
2725 JitSpewCont(JitSpew_RegAlloc, "%s%u", i != 0 ? ", " : "",
2726 callPositions[i].bits());
2728 JitSpewFin(JitSpew_RegAlloc);
2729 #endif
2731 return splitAt(bundle, callPositions);
2734 bool BacktrackingAllocator::trySplitAcrossHotcode(LiveBundle* bundle,
2735 bool* success) {
2736 // If this bundle has portions that are hot and portions that are cold,
2737 // split it at the boundaries between hot and cold code.
2739 LiveRange* hotRange = nullptr;
2741 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
2742 iter++) {
2743 LiveRange* range = LiveRange::get(*iter);
2744 if (hotcode.contains(range, &hotRange)) {
2745 break;
2749 // Don't split if there is no hot code in the bundle.
2750 if (!hotRange) {
2751 JitSpew(JitSpew_RegAlloc, " .. bundle does not contain hot code");
2752 return true;
2755 // Don't split if there is no cold code in the bundle.
2756 bool coldCode = false;
2757 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
2758 iter++) {
2759 LiveRange* range = LiveRange::get(*iter);
2760 if (!hotRange->contains(range)) {
2761 coldCode = true;
2762 break;
2765 if (!coldCode) {
2766 JitSpew(JitSpew_RegAlloc, " .. bundle does not contain cold code");
2767 return true;
2770 JitSpewIfEnabled(JitSpew_RegAlloc, " .. split across hot range %s",
2771 hotRange->toString().get());
2773 // Tweak the splitting method when compiling wasm code to look at actual
2774 // uses within the hot/cold code. This heuristic is in place as the below
2775 // mechanism regresses several asm.js tests. Hopefully this will be fixed
2776 // soon and this special case removed. See bug 948838.
2777 if (compilingWasm()) {
2778 SplitPositionVector splitPositions;
2779 if (!splitPositions.append(hotRange->from()) ||
2780 !splitPositions.append(hotRange->to())) {
2781 return false;
2783 *success = true;
2784 return splitAt(bundle, splitPositions);
2787 LiveBundle* hotBundle = LiveBundle::FallibleNew(alloc(), bundle->spillSet(),
2788 bundle->spillParent());
2789 if (!hotBundle) {
2790 return false;
2792 LiveBundle* preBundle = nullptr;
2793 LiveBundle* postBundle = nullptr;
2794 LiveBundle* coldBundle = nullptr;
2796 if (testbed) {
2797 coldBundle = LiveBundle::FallibleNew(alloc(), bundle->spillSet(),
2798 bundle->spillParent());
2799 if (!coldBundle) {
2800 return false;
2804 // Accumulate the ranges of hot and cold code in the bundle. Note that
2805 // we are only comparing with the single hot range found, so the cold code
2806 // may contain separate hot ranges.
2807 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
2808 iter++) {
2809 LiveRange* range = LiveRange::get(*iter);
2810 LiveRange::Range hot, coldPre, coldPost;
2811 range->intersect(hotRange, &coldPre, &hot, &coldPost);
2813 if (!hot.empty()) {
2814 if (!hotBundle->addRangeAndDistributeUses(alloc(), range, hot.from,
2815 hot.to)) {
2816 return false;
2820 if (!coldPre.empty()) {
2821 if (testbed) {
2822 if (!coldBundle->addRangeAndDistributeUses(alloc(), range, coldPre.from,
2823 coldPre.to)) {
2824 return false;
2826 } else {
2827 if (!preBundle) {
2828 preBundle = LiveBundle::FallibleNew(alloc(), bundle->spillSet(),
2829 bundle->spillParent());
2830 if (!preBundle) {
2831 return false;
2834 if (!preBundle->addRangeAndDistributeUses(alloc(), range, coldPre.from,
2835 coldPre.to)) {
2836 return false;
2841 if (!coldPost.empty()) {
2842 if (testbed) {
2843 if (!coldBundle->addRangeAndDistributeUses(
2844 alloc(), range, coldPost.from, coldPost.to)) {
2845 return false;
2847 } else {
2848 if (!postBundle) {
2849 postBundle = LiveBundle::FallibleNew(alloc(), bundle->spillSet(),
2850 bundle->spillParent());
2851 if (!postBundle) {
2852 return false;
2855 if (!postBundle->addRangeAndDistributeUses(
2856 alloc(), range, coldPost.from, coldPost.to)) {
2857 return false;
2863 MOZ_ASSERT(hotBundle->numRanges() != 0);
2865 LiveBundleVector newBundles;
2866 if (!newBundles.append(hotBundle)) {
2867 return false;
2870 if (testbed) {
2871 MOZ_ASSERT(coldBundle->numRanges() != 0);
2872 if (!newBundles.append(coldBundle)) {
2873 return false;
2875 } else {
2876 MOZ_ASSERT(preBundle || postBundle);
2877 if (preBundle && !newBundles.append(preBundle)) {
2878 return false;
2880 if (postBundle && !newBundles.append(postBundle)) {
2881 return false;
2885 *success = true;
2886 return updateVirtualRegisterListsThenRequeueBundles(bundle, newBundles);
2889 bool BacktrackingAllocator::trySplitAfterLastRegisterUse(LiveBundle* bundle,
2890 LiveBundle* conflict,
2891 bool* success) {
2892 // If this bundle's later uses do not require it to be in a register,
2893 // split it after the last use which does require a register. If conflict
2894 // is specified, only consider register uses before the conflict starts.
2896 CodePosition lastRegisterFrom, lastRegisterTo, lastUse;
2898 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
2899 iter++) {
2900 LiveRange* range = LiveRange::get(*iter);
2902 // If the range defines a register, consider that a register use for
2903 // our purposes here.
2904 if (isRegisterDefinition(range)) {
2905 CodePosition spillStart = minimalDefEnd(insData[range->from()]).next();
2906 if (!conflict || spillStart < conflict->firstRange()->from()) {
2907 lastUse = lastRegisterFrom = range->from();
2908 lastRegisterTo = spillStart;
2912 for (UsePositionIterator iter(range->usesBegin()); iter; iter++) {
2913 LNode* ins = insData[iter->pos];
2915 // Uses in the bundle should be sorted.
2916 MOZ_ASSERT(iter->pos >= lastUse);
2917 lastUse = inputOf(ins);
2919 if (!conflict || outputOf(ins) < conflict->firstRange()->from()) {
2920 if (isRegisterUse(*iter, ins, /* considerCopy = */ true)) {
2921 lastRegisterFrom = inputOf(ins);
2922 lastRegisterTo = iter->pos.next();
2928 // Can't trim non-register uses off the end by splitting.
2929 if (!lastRegisterFrom.bits()) {
2930 JitSpew(JitSpew_RegAlloc, " .. bundle has no register uses");
2931 return true;
2933 if (lastUse < lastRegisterTo) {
2934 JitSpew(JitSpew_RegAlloc, " .. bundle's last use is a register use");
2935 return true;
2938 JitSpewIfEnabled(JitSpew_RegAlloc, " .. split after last register use at %u",
2939 lastRegisterTo.bits());
2941 SplitPositionVector splitPositions;
2942 if (!splitPositions.append(lastRegisterTo)) {
2943 return false;
2945 *success = true;
2946 return splitAt(bundle, splitPositions);
2949 bool BacktrackingAllocator::trySplitBeforeFirstRegisterUse(LiveBundle* bundle,
2950 LiveBundle* conflict,
2951 bool* success) {
2952 // If this bundle's earlier uses do not require it to be in a register,
2953 // split it before the first use which does require a register. If conflict
2954 // is specified, only consider register uses after the conflict ends.
2956 if (isRegisterDefinition(bundle->firstRange())) {
2957 JitSpew(JitSpew_RegAlloc, " .. bundle is defined by a register");
2958 return true;
2960 if (!bundle->firstRange()->hasDefinition()) {
2961 JitSpew(JitSpew_RegAlloc, " .. bundle does not have definition");
2962 return true;
2965 CodePosition firstRegisterFrom;
2967 CodePosition conflictEnd;
2968 if (conflict) {
2969 for (LiveRange::BundleLinkIterator iter = conflict->rangesBegin(); iter;
2970 iter++) {
2971 LiveRange* range = LiveRange::get(*iter);
2972 if (range->to() > conflictEnd) {
2973 conflictEnd = range->to();
2978 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
2979 iter++) {
2980 LiveRange* range = LiveRange::get(*iter);
2982 if (!conflict || range->from() > conflictEnd) {
2983 if (range->hasDefinition() && isRegisterDefinition(range)) {
2984 firstRegisterFrom = range->from();
2985 break;
2989 for (UsePositionIterator iter(range->usesBegin()); iter; iter++) {
2990 LNode* ins = insData[iter->pos];
2992 if (!conflict || outputOf(ins) >= conflictEnd) {
2993 if (isRegisterUse(*iter, ins, /* considerCopy = */ true)) {
2994 firstRegisterFrom = inputOf(ins);
2995 break;
2999 if (firstRegisterFrom.bits()) {
3000 break;
3004 if (!firstRegisterFrom.bits()) {
3005 // Can't trim non-register uses off the beginning by splitting.
3006 JitSpew(JitSpew_RegAlloc, " bundle has no register uses");
3007 return true;
3010 JitSpewIfEnabled(JitSpew_RegAlloc,
3011 " .. split before first register use at %u",
3012 firstRegisterFrom.bits());
3014 SplitPositionVector splitPositions;
3015 if (!splitPositions.append(firstRegisterFrom)) {
3016 return false;
3018 *success = true;
3019 return splitAt(bundle, splitPositions);
3022 ///////////////////////////////////////////////////////////////////////////////
3023 // //
3024 // The top level driver for the splitting machinery //
3025 // //
3026 ///////////////////////////////////////////////////////////////////////////////
3028 // ::chooseBundleSplit
3029 // -------------------
3030 // If the first allocation loop (in ::go) can't allocate a bundle, it hands it
3031 // off to ::chooseBundleSplit, which is the "entry point" of the bundle-split
3032 // machinery. This tries four heuristics in turn, to see if any can split the
3033 // bundle:
3035 // * ::trySplitAcrossHotcode
3036 // * ::splitAcrossCalls (in some cases)
3037 // * ::trySplitBeforeFirstRegisterUse
3038 // * ::trySplitAfterLastRegisterUse
3040 // These routines have similar structure: they try to decide on one or more
3041 // CodePositions at which to split the bundle, using whatever heuristics they
3042 // have to hand. If suitable CodePosition(s) are found, they are put into a
3043 // `SplitPositionVector`, and the bundle and the vector are handed off to
3044 // ::splitAt, which performs the split (at least in theory) at the chosen
3045 // positions. It also arranges for the new bundles to be added to
3046 // ::allocationQueue.
3048 // ::trySplitAcrossHotcode has a special case for JS -- it modifies the
3049 // bundle(s) itself, rather than using ::splitAt.
3051 // If none of the heuristic routines apply, then ::splitAt is called with an
3052 // empty vector of split points. This is interpreted to mean "split at all
3053 // register uses". When combined with how ::splitAt works, the effect is to
3054 // spill the bundle.
3056 bool BacktrackingAllocator::chooseBundleSplit(LiveBundle* bundle, bool fixed,
3057 LiveBundle* conflict) {
3058 bool success = false;
3060 JitSpewIfEnabled(JitSpew_RegAlloc, " Splitting %s ..",
3061 bundle->toString().get());
3063 if (!trySplitAcrossHotcode(bundle, &success)) {
3064 return false;
3066 if (success) {
3067 return true;
3070 if (fixed) {
3071 return splitAcrossCalls(bundle);
3074 if (!trySplitBeforeFirstRegisterUse(bundle, conflict, &success)) {
3075 return false;
3077 if (success) {
3078 return true;
3081 if (!trySplitAfterLastRegisterUse(bundle, conflict, &success)) {
3082 return false;
3084 if (success) {
3085 return true;
3088 // Split at all register uses.
3089 SplitPositionVector emptyPositions;
3090 return splitAt(bundle, emptyPositions);
3093 ///////////////////////////////////////////////////////////////////////////////
3094 // //
3095 // Bundle allocation //
3096 // //
3097 ///////////////////////////////////////////////////////////////////////////////
3099 static const size_t MAX_ATTEMPTS = 2;
3101 bool BacktrackingAllocator::computeRequirement(LiveBundle* bundle,
3102 Requirement* requirement,
3103 Requirement* hint) {
3104 // Set any requirement or hint on bundle according to its definition and
3105 // uses. Return false if there are conflicting requirements which will
3106 // require the bundle to be split.
3108 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
3109 iter++) {
3110 LiveRange* range = LiveRange::get(*iter);
3111 VirtualRegister& reg = range->vreg();
3113 if (range->hasDefinition()) {
3114 // Deal with any definition constraints/hints.
3115 LDefinition::Policy policy = reg.def()->policy();
3116 if (policy == LDefinition::FIXED || policy == LDefinition::STACK) {
3117 // Fixed and stack policies get a FIXED requirement. (In the stack
3118 // case, the allocation should have been performed already by
3119 // mergeAndQueueRegisters.)
3120 JitSpewIfEnabled(JitSpew_RegAlloc,
3121 " Requirement %s, fixed by definition",
3122 reg.def()->output()->toString().get());
3123 if (!requirement->merge(Requirement(*reg.def()->output()))) {
3124 return false;
3126 } else if (reg.ins()->isPhi()) {
3127 // Phis don't have any requirements, but they should prefer their
3128 // input allocations. This is captured by the group hints above.
3129 } else {
3130 // Non-phis get a REGISTER requirement.
3131 if (!requirement->merge(Requirement(Requirement::REGISTER))) {
3132 return false;
3137 // Search uses for requirements.
3138 for (UsePositionIterator iter = range->usesBegin(); iter; iter++) {
3139 LUse::Policy policy = iter->usePolicy();
3140 if (policy == LUse::FIXED) {
3141 AnyRegister required = GetFixedRegister(reg.def(), iter->use());
3143 JitSpewIfEnabled(JitSpew_RegAlloc, " Requirement %s, due to use at %u",
3144 required.name(), iter->pos.bits());
3146 // If there are multiple fixed registers which the bundle is
3147 // required to use, fail. The bundle will need to be split before
3148 // it can be allocated.
3149 if (!requirement->merge(Requirement(LAllocation(required)))) {
3150 return false;
3152 } else if (policy == LUse::REGISTER) {
3153 if (!requirement->merge(Requirement(Requirement::REGISTER))) {
3154 return false;
3156 } else if (policy == LUse::ANY) {
3157 // ANY differs from KEEPALIVE by actively preferring a register.
3158 if (!hint->merge(Requirement(Requirement::REGISTER))) {
3159 return false;
3163 // The only case of STACK use policies is individual stack results using
3164 // their containing stack result area, which is given a fixed allocation
3165 // above.
3166 MOZ_ASSERT_IF(policy == LUse::STACK,
3167 requirement->kind() == Requirement::FIXED);
3168 MOZ_ASSERT_IF(policy == LUse::STACK,
3169 requirement->allocation().isStackArea());
3173 return true;
3176 bool BacktrackingAllocator::tryAllocateRegister(PhysicalRegister& r,
3177 LiveBundle* bundle,
3178 bool* success, bool* pfixed,
3179 LiveBundleVector& conflicting) {
3180 *success = false;
3182 if (!r.allocatable) {
3183 return true;
3186 LiveBundleVector aliasedConflicting;
3188 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
3189 iter++) {
3190 LiveRange* range = LiveRange::get(*iter);
3191 LiveRangePlus rangePlus(range);
3193 // All ranges in the bundle must be compatible with the physical register.
3194 MOZ_ASSERT(range->vreg().isCompatible(r.reg));
3196 const size_t numAliased = r.reg.numAliased();
3197 for (size_t a = 0; a < numAliased; a++) {
3198 PhysicalRegister& rAlias = registers[r.reg.aliased(a).code()];
3199 LiveRangePlus existingPlus;
3200 if (!rAlias.allocations.contains(rangePlus, &existingPlus)) {
3201 continue;
3203 const LiveRange* existing = existingPlus.liveRange();
3204 if (existing->hasVreg()) {
3205 MOZ_ASSERT(existing->bundle()->allocation().toRegister() == rAlias.reg);
3206 bool duplicate = false;
3207 for (size_t i = 0; i < aliasedConflicting.length(); i++) {
3208 if (aliasedConflicting[i] == existing->bundle()) {
3209 duplicate = true;
3210 break;
3213 if (!duplicate && !aliasedConflicting.append(existing->bundle())) {
3214 return false;
3216 } else {
3217 JitSpewIfEnabled(JitSpew_RegAlloc, " %s collides with fixed use %s",
3218 rAlias.reg.name(), existing->toString().get());
3219 *pfixed = true;
3220 return true;
3222 MOZ_ASSERT(r.reg.numAliased() == numAliased);
3226 if (!aliasedConflicting.empty()) {
3227     // One or more aliased registers are allocated to another bundle
3228 // overlapping this one. Keep track of the conflicting set, and in the
3229 // case of multiple conflicting sets keep track of the set with the
3230 // lowest maximum spill weight.
3232 // The #ifdef guards against "unused variable 'existing'" bustage.
3233 #ifdef JS_JITSPEW
3234 if (JitSpewEnabled(JitSpew_RegAlloc)) {
3235 if (aliasedConflicting.length() == 1) {
3236 LiveBundle* existing = aliasedConflicting[0];
3237 JitSpew(JitSpew_RegAlloc, " %s collides with %s [weight %zu]",
3238 r.reg.name(), existing->toString().get(),
3239 computeSpillWeight(existing));
3240 } else {
3241 JitSpew(JitSpew_RegAlloc, " %s collides with the following",
3242 r.reg.name());
3243 for (size_t i = 0; i < aliasedConflicting.length(); i++) {
3244 LiveBundle* existing = aliasedConflicting[i];
3245 JitSpew(JitSpew_RegAlloc, " %s [weight %zu]",
3246 existing->toString().get(), computeSpillWeight(existing));
3250 #endif
3252 if (conflicting.empty()) {
3253 conflicting = std::move(aliasedConflicting);
3254 } else {
3255 if (maximumSpillWeight(aliasedConflicting) <
3256 maximumSpillWeight(conflicting)) {
3257 conflicting = std::move(aliasedConflicting);
3260 return true;
3263 JitSpewIfEnabled(JitSpew_RegAlloc, " allocated to %s", r.reg.name());
3265 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
3266 iter++) {
3267 LiveRange* range = LiveRange::get(*iter);
3268 if (!alloc().ensureBallast()) {
3269 return false;
3271 LiveRangePlus rangePlus(range);
3272 if (!r.allocations.insert(rangePlus)) {
3273 return false;
3277 bundle->setAllocation(LAllocation(r.reg));
3278 *success = true;
3279 return true;
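// For illustration (target and register names assumed, not taken from this
// file): on a 32-bit ARM build the double register d0 overlaps the single
// registers s0 and s1, so the aliased-register loop above also consults the
// allocation maps kept for s0 and s1 when a bundle is tried against d0:
//
//   already allocated:  s1 holds a range of LB4 covering positions 10-25
//   being tried:        d0 for LB9, whose range covers positions 18-40
//
// The overlap at 18-25 puts LB4 into aliasedConflicting, and the caller may
// later evict LB4 if its spill weight is lower than LB9's.  If the
// overlapping range instead had no vreg (a fixed-register range), *pfixed is
// set and no eviction is attempted for it.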
3282 bool BacktrackingAllocator::tryAllocateAnyRegister(
3283 LiveBundle* bundle, bool* success, bool* pfixed,
3284 LiveBundleVector& conflicting) {
3285 // Search for any available register which the bundle can be allocated to.
3287 LDefinition::Type type = bundle->firstRange()->vreg().type();
3289 if (LDefinition::isFloatReg(type)) {
3290 for (size_t i = AnyRegister::FirstFloatReg; i < AnyRegister::Total; i++) {
3291 if (!LDefinition::isFloatRegCompatible(type, registers[i].reg.fpu())) {
3292 continue;
3294 if (!tryAllocateRegister(registers[i], bundle, success, pfixed,
3295 conflicting)) {
3296 return false;
3298 if (*success) {
3299 break;
3302 return true;
3305 for (size_t i = 0; i < AnyRegister::FirstFloatReg; i++) {
3306 if (!tryAllocateRegister(registers[i], bundle, success, pfixed,
3307 conflicting)) {
3308 return false;
3310 if (*success) {
3311 break;
3314 return true;
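// For illustration: the search above is simply "first compatible register
// wins".  A float-typed bundle is tried against registers[FirstFloatReg ..
// Total), skipping FPU registers whose kind doesn't match the bundle's type,
// while an integer-typed bundle is tried against registers[0 ..
// FirstFloatReg).  Any preference for a particular register has already been
// expressed through the hint handled in ::tryAllocateNonFixed, not here.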
3317 bool BacktrackingAllocator::evictBundle(LiveBundle* bundle) {
3318 JitSpewIfEnabled(JitSpew_RegAlloc,
3319 " Evicting %s [priority %zu] [weight %zu]",
3320 bundle->toString().get(), computePriority(bundle),
3321 computeSpillWeight(bundle));
3323 AnyRegister reg(bundle->allocation().toRegister());
3324 PhysicalRegister& physical = registers[reg.code()];
3325 MOZ_ASSERT(physical.reg == reg && physical.allocatable);
3327 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
3328 iter++) {
3329 LiveRange* range = LiveRange::get(*iter);
3330 LiveRangePlus rangePlus(range);
3331 physical.allocations.remove(rangePlus);
3334 bundle->setAllocation(LAllocation());
3336 size_t priority = computePriority(bundle);
3337 return allocationQueue.insert(QueueItem(bundle, priority));
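// For illustration (register and bundle names invented): evicting LB4 from
// rdx removes each of LB4's ranges from registers[rdx].allocations, resets
// LB4's allocation to the bogus LAllocation(), and re-inserts LB4 into
// ::allocationQueue at its recomputed priority.  When LB4 is processed again
// it may land in a different register, be split, or be spilled.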
3340 bool BacktrackingAllocator::tryAllocateFixed(LiveBundle* bundle,
3341 Requirement requirement,
3342 bool* success, bool* pfixed,
3343 LiveBundleVector& conflicting) {
3344 // Spill bundles which are required to be in a certain stack slot.
3345 if (!requirement.allocation().isRegister()) {
3346 JitSpew(JitSpew_RegAlloc, " stack allocation requirement");
3347 bundle->setAllocation(requirement.allocation());
3348 *success = true;
3349 return true;
3352 AnyRegister reg = requirement.allocation().toRegister();
3353 return tryAllocateRegister(registers[reg.code()], bundle, success, pfixed,
3354 conflicting);
3357 bool BacktrackingAllocator::tryAllocateNonFixed(LiveBundle* bundle,
3358 Requirement requirement,
3359 Requirement hint, bool* success,
3360 bool* pfixed,
3361 LiveBundleVector& conflicting) {
3362   // If we want, but do not require, a bundle to be in a specific register,
3363 // only look at that register for allocating and evict or spill if it is
3364 // not available. Picking a separate register may be even worse than
3365 // spilling, as it will still necessitate moves and will tie up more
3366 // registers than if we spilled.
3367 if (hint.kind() == Requirement::FIXED) {
3368 AnyRegister reg = hint.allocation().toRegister();
3369 if (!tryAllocateRegister(registers[reg.code()], bundle, success, pfixed,
3370 conflicting)) {
3371 return false;
3373 if (*success) {
3374 return true;
3378 // Spill bundles which have no hint or register requirement.
3379 if (requirement.kind() == Requirement::NONE &&
3380 hint.kind() != Requirement::REGISTER) {
3381 JitSpew(JitSpew_RegAlloc,
3382 " postponed spill (no hint or register requirement)");
3383 if (!spilledBundles.append(bundle)) {
3384 return false;
3386 *success = true;
3387 return true;
3390 if (conflicting.empty() || minimalBundle(bundle)) {
3391 if (!tryAllocateAnyRegister(bundle, success, pfixed, conflicting)) {
3392 return false;
3394 if (*success) {
3395 return true;
3399 // Spill bundles which have no register requirement if they didn't get
3400 // allocated.
3401 if (requirement.kind() == Requirement::NONE) {
3402 JitSpew(JitSpew_RegAlloc, " postponed spill (no register requirement)");
3403 if (!spilledBundles.append(bundle)) {
3404 return false;
3406 *success = true;
3407 return true;
3410 // We failed to allocate this bundle.
3411 MOZ_ASSERT(!*success);
3412 return true;
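// For illustration, the decision order above can be summarised as:
//
//   1. hint is FIXED(reg)           -> try just that register; stop if it works
//   2. no requirement, and the
//      hint isn't REGISTER          -> postpone: append to spilledBundles
//   3. no conflicts recorded yet,
//      or the bundle is minimal     -> try every compatible register
//   4. still no register, and
//      no requirement               -> postpone: append to spilledBundles
//   5. otherwise                    -> report failure; the caller evicts or splits
//
// Postponed bundles are revisited by ::tryAllocatingRegistersForSpillBundles
// once the main allocation queue is empty.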
3415 bool BacktrackingAllocator::processBundle(MIRGenerator* mir,
3416 LiveBundle* bundle) {
3417 JitSpewIfEnabled(JitSpew_RegAlloc,
3418 "Allocating %s [priority %zu] [weight %zu]",
3419 bundle->toString().get(), computePriority(bundle),
3420 computeSpillWeight(bundle));
3422 // A bundle can be processed by doing any of the following:
3424 // - Assigning the bundle a register. The bundle cannot overlap any other
3425 // bundle allocated for that physical register.
3427 // - Spilling the bundle, provided it has no register uses.
3429 // - Splitting the bundle into two or more bundles which cover the original
3430 // one. The new bundles are placed back onto the priority queue for later
3431 // processing.
3433 // - Evicting one or more existing allocated bundles, and then doing one
3434 // of the above operations. Evicted bundles are placed back on the
3435 // priority queue. Any evicted bundles must have a lower spill weight
3436 // than the bundle being processed.
3438 // As long as this structure is followed, termination is guaranteed.
3439 // In general, we want to minimize the amount of bundle splitting (which
3440 // generally necessitates spills), so allocate longer lived, lower weight
3441 // bundles first and evict and split them later if they prevent allocation
3442 // for higher weight bundles.
3444 Requirement requirement, hint;
3445 bool canAllocate = computeRequirement(bundle, &requirement, &hint);
3447 bool fixed;
3448 LiveBundleVector conflicting;
3449 for (size_t attempt = 0;; attempt++) {
3450 if (mir->shouldCancel("Backtracking Allocation (processBundle loop)")) {
3451 return false;
3454 if (canAllocate) {
3455 bool success = false;
3456 fixed = false;
3457 conflicting.clear();
3459 // Ok, let's try allocating for this bundle.
3460 if (requirement.kind() == Requirement::FIXED) {
3461 if (!tryAllocateFixed(bundle, requirement, &success, &fixed,
3462 conflicting)) {
3463 return false;
3465 } else {
3466 if (!tryAllocateNonFixed(bundle, requirement, hint, &success, &fixed,
3467 conflicting)) {
3468 return false;
3472 // If that worked, we're done!
3473 if (success) {
3474 return true;
3477 // If that didn't work, but we have one or more non-fixed bundles
3478 // known to be conflicting, maybe we can evict them and try again.
3479 if ((attempt < MAX_ATTEMPTS || minimalBundle(bundle)) && !fixed &&
3480 !conflicting.empty() &&
3481 maximumSpillWeight(conflicting) < computeSpillWeight(bundle)) {
3482 for (size_t i = 0; i < conflicting.length(); i++) {
3483 if (!evictBundle(conflicting[i])) {
3484 return false;
3487 continue;
3491   // A minimal bundle cannot be split any further. If we try to split it
3492   // at this point we will just end up with the same bundle and will
3493 // enter an infinite loop. Weights and the initial live ranges must
3494 // be constructed so that any minimal bundle is allocatable.
3495 MOZ_ASSERT(!minimalBundle(bundle));
3497 LiveBundle* conflict = conflicting.empty() ? nullptr : conflicting[0];
3498 return chooseBundleSplit(bundle, canAllocate && fixed, conflict);
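// A small worked example of the eviction test above (weights invented):
// suppose the bundle being processed has spill weight 4000 and the register
// it wants is blocked by two conflicting bundles with weights 1000 and 2500.
// Since maximumSpillWeight(conflicting) == 2500 < 4000, both conflicts are
// evicted and the allocation is retried.  If instead one conflict had weight
// 6000, eviction would be refused and the bundle would fall through to
// ::chooseBundleSplit.  Minimal bundles are allowed to keep evicting beyond
// MAX_ATTEMPTS, since they cannot be split any further.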
3502 // Helper for ::tryAllocatingRegistersForSpillBundles
3503 bool BacktrackingAllocator::spill(LiveBundle* bundle) {
3504 JitSpew(JitSpew_RegAlloc, " Spilling bundle");
3505 MOZ_ASSERT(bundle->allocation().isBogus());
3507 if (LiveBundle* spillParent = bundle->spillParent()) {
3508 JitSpew(JitSpew_RegAlloc, " Using existing spill bundle");
3509 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
3510 iter++) {
3511 LiveRange* range = LiveRange::get(*iter);
3512 LiveRange* parentRange = spillParent->rangeFor(range->from());
3513 MOZ_ASSERT(parentRange->contains(range));
3514 MOZ_ASSERT(&range->vreg() == &parentRange->vreg());
3515 range->tryToMoveDefAndUsesInto(parentRange);
3516 MOZ_ASSERT(!range->hasUses());
3517 range->vreg().removeRange(range);
3519 return true;
3522 return bundle->spillSet()->addSpilledBundle(bundle);
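// For illustration: when the bundle has a spillParent whose ranges cover all
// of this bundle's ranges, the defs and uses are folded into the parent's
// ranges and this bundle's now-empty ranges are removed from their vregs, so
// the bundle needs no stack slot of its own.  Only when there is no spill
// parent is the bundle added to its SpillSet, to be given a stack slot later
// by ::pickStackSlot.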
3525 bool BacktrackingAllocator::tryAllocatingRegistersForSpillBundles() {
3526 for (auto it = spilledBundles.begin(); it != spilledBundles.end(); it++) {
3527 LiveBundle* bundle = *it;
3528 LiveBundleVector conflicting;
3529 bool fixed = false;
3530 bool success = false;
3532 if (mir->shouldCancel("Backtracking Try Allocating Spilled Bundles")) {
3533 return false;
3536 JitSpewIfEnabled(JitSpew_RegAlloc, "Spill or allocate %s",
3537 bundle->toString().get());
3539 if (!tryAllocateAnyRegister(bundle, &success, &fixed, conflicting)) {
3540 return false;
3543 // If the bundle still has no register, spill the bundle.
3544 if (!success && !spill(bundle)) {
3545 return false;
3549 return true;
3552 ///////////////////////////////////////////////////////////////////////////////
3553 // //
3554 // Rewriting of the LIR after bundle processing is done: //
3555 // ::pickStackSlots //
3556 // ::createMoveGroupsFromLiveRangeTransitions //
3557 // ::installAllocationsInLIR //
3558 // ::populateSafepoints //
3559 // ::annotateMoveGroups //
3560 // //
3561 ///////////////////////////////////////////////////////////////////////////////
3563 // Helper for ::pickStackSlot
3564 bool BacktrackingAllocator::insertAllRanges(LiveRangePlusSet& set,
3565 LiveBundle* bundle) {
3566 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
3567 iter++) {
3568 LiveRange* range = LiveRange::get(*iter);
3569 if (!alloc().ensureBallast()) {
3570 return false;
3572 LiveRangePlus rangePlus(range);
3573 if (!set.insert(rangePlus)) {
3574 return false;
3577 return true;
3580 // Helper for ::pickStackSlots
3581 bool BacktrackingAllocator::pickStackSlot(SpillSet* spillSet) {
3582 // Look through all ranges that have been spilled in this set for a
3583 // register definition which is fixed to a stack or argument slot. If we
3584 // find one, use it for all bundles that have been spilled. tryMergeBundles
3585 // makes sure this reuse is possible when an initial bundle contains ranges
3586 // from multiple virtual registers.
3587 for (size_t i = 0; i < spillSet->numSpilledBundles(); i++) {
3588 LiveBundle* bundle = spillSet->spilledBundle(i);
3589 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
3590 iter++) {
3591 LiveRange* range = LiveRange::get(*iter);
3592 if (range->hasDefinition()) {
3593 LDefinition* def = range->vreg().def();
3594 if (def->policy() == LDefinition::FIXED) {
3595 MOZ_ASSERT(!def->output()->isRegister());
3596 MOZ_ASSERT(!def->output()->isStackSlot());
3597 spillSet->setAllocation(*def->output());
3598 return true;
3604 LDefinition::Type type =
3605 spillSet->spilledBundle(0)->firstRange()->vreg().type();
3607 SpillSlotList* slotList;
3608 switch (StackSlotAllocator::width(type)) {
3609 case 4:
3610 slotList = &normalSlots;
3611 break;
3612 case 8:
3613 slotList = &doubleSlots;
3614 break;
3615 case 16:
3616 slotList = &quadSlots;
3617 break;
3618 default:
3619 MOZ_CRASH("Bad width");
3622 // Maximum number of existing spill slots we will look at before giving up
3623 // and allocating a new slot.
3624 static const size_t MAX_SEARCH_COUNT = 10;
3626 size_t searches = 0;
3627 SpillSlot* stop = nullptr;
3628 while (!slotList->empty()) {
3629 SpillSlot* spillSlot = *slotList->begin();
3630 if (!stop) {
3631 stop = spillSlot;
3632 } else if (stop == spillSlot) {
3633 // We looked through every slot in the list.
3634 break;
3637 bool success = true;
3638 for (size_t i = 0; i < spillSet->numSpilledBundles(); i++) {
3639 LiveBundle* bundle = spillSet->spilledBundle(i);
3640 for (LiveRange::BundleLinkIterator iter = bundle->rangesBegin(); iter;
3641 iter++) {
3642 LiveRange* range = LiveRange::get(*iter);
3643 LiveRangePlus rangePlus(range);
3644 LiveRangePlus existingPlus;
3645 if (spillSlot->allocated.contains(rangePlus, &existingPlus)) {
3646 success = false;
3647 break;
3650 if (!success) {
3651 break;
3654 if (success) {
3655 // We can reuse this physical stack slot for the new bundles.
3656 // Update the allocated ranges for the slot.
3657 for (size_t i = 0; i < spillSet->numSpilledBundles(); i++) {
3658 LiveBundle* bundle = spillSet->spilledBundle(i);
3659 if (!insertAllRanges(spillSlot->allocated, bundle)) {
3660 return false;
3663 spillSet->setAllocation(spillSlot->alloc);
3664 return true;
3667     // On a miss, move the spill slot to the end of the list. This will cause us
3668 // to make fewer attempts to allocate from slots with a large and
3669 // highly contended range.
3670 slotList->popFront();
3671 slotList->pushBack(spillSlot);
3673 if (++searches == MAX_SEARCH_COUNT) {
3674 break;
3678 // We need a new physical stack slot.
3679 uint32_t stackSlot = stackSlotAllocator.allocateSlot(type);
3681 SpillSlot* spillSlot =
3682 new (alloc().fallible()) SpillSlot(stackSlot, alloc().lifoAlloc());
3683 if (!spillSlot) {
3684 return false;
3687 for (size_t i = 0; i < spillSet->numSpilledBundles(); i++) {
3688 LiveBundle* bundle = spillSet->spilledBundle(i);
3689 if (!insertAllRanges(spillSlot->allocated, bundle)) {
3690 return false;
3694 spillSet->setAllocation(spillSlot->alloc);
3696 slotList->pushFront(spillSlot);
3697 return true;
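// For illustration (widths per StackSlotAllocator): a spill set whose bundles
// are INT32-typed has width 4 and is therefore matched against normalSlots.
// Up to MAX_SEARCH_COUNT existing slots are tried; a slot can be reused only
// if none of the set's ranges overlaps a range already parked in that slot.
// Slots that fail the test are rotated to the back of their list, so heavily
// contended slots are consulted less often.  If no reusable slot is found,
// stackSlotAllocator hands out a fresh slot, which is pushed onto the front
// of the list for future reuse.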
3700 bool BacktrackingAllocator::pickStackSlots() {
3701 for (size_t i = 1; i < graph.numVirtualRegisters(); i++) {
3702 VirtualRegister& reg = vregs[i];
3704 if (mir->shouldCancel("Backtracking Pick Stack Slots")) {
3705 return false;
3708 for (LiveRange::RegisterLinkIterator iter = reg.rangesBegin(); iter;
3709 iter++) {
3710 LiveRange* range = LiveRange::get(*iter);
3711 LiveBundle* bundle = range->bundle();
3713 if (bundle->allocation().isBogus()) {
3714 if (!pickStackSlot(bundle->spillSet())) {
3715 return false;
3717 MOZ_ASSERT(!bundle->allocation().isBogus());
3722 return true;
3725 // Helper for ::createMoveGroupsFromLiveRangeTransitions
3726 bool BacktrackingAllocator::moveAtEdge(LBlock* predecessor, LBlock* successor,
3727 LiveRange* from, LiveRange* to,
3728 LDefinition::Type type) {
3729 if (successor->mir()->numPredecessors() > 1) {
3730 MOZ_ASSERT(predecessor->mir()->numSuccessors() == 1);
3731 return moveAtExit(predecessor, from, to, type);
3734 return moveAtEntry(successor, from, to, type);
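// For illustration (block names invented): for an edge B1 -> B3 where B3 has
// several predecessors, the fix-up move is placed at the exit of B1, which
// the assertion above requires to have exactly one successor (i.e. critical
// edges have already been split).  For an edge B2 -> B4 where B4 has a single
// predecessor, the move is placed at the entry of B4 instead.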
3737 // Helper for ::createMoveGroupsFromLiveRangeTransitions
3738 bool BacktrackingAllocator::deadRange(LiveRange* range) {
3739 // Check for direct uses of this range.
3740 if (range->hasUses() || range->hasDefinition()) {
3741 return false;
3744 CodePosition start = range->from();
3745 LNode* ins = insData[start];
3746 if (start == entryOf(ins->block())) {
3747 return false;
3750 VirtualRegister& reg = range->vreg();
3752 // Check if there are later ranges for this vreg.
3753 LiveRange::RegisterLinkIterator iter = reg.rangesBegin(range);
3754 for (iter++; iter; iter++) {
3755 LiveRange* laterRange = LiveRange::get(*iter);
3756 if (laterRange->from() > range->from()) {
3757 return false;
3761 // Check if this range ends at a loop backedge.
3762 LNode* last = insData[range->to().previous()];
3763 if (last->isGoto() &&
3764 last->toGoto()->target()->id() < last->block()->mir()->id()) {
3765 return false;
3768 // Check if there are phis which this vreg flows to.
3769 if (reg.usedByPhi()) {
3770 return false;
3773 return true;
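// In other words, a range is removable here only if it has no definition and
// no uses, does not start at a block entry, is not followed by a later range
// of the same vreg that starts after it, does not end at a loop backedge, and
// belongs to a vreg that does not flow into a phi.  Such ranges typically
// arise from earlier splitting, which can leave pieces covering positions
// with nothing left to do at them (SPEC).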
3776 bool BacktrackingAllocator::createMoveGroupsFromLiveRangeTransitions() {
3777 // Add moves to handle changing assignments for vregs over their lifetime.
3778 JitSpew(JitSpew_RegAlloc, "ResolveControlFlow: begin");
3780 JitSpew(JitSpew_RegAlloc,
3781 " ResolveControlFlow: adding MoveGroups within blocks");
3783 // Look for places where a register's assignment changes in the middle of a
3784 // basic block.
3785 MOZ_ASSERT(!vregs[0u].hasRanges());
3786 for (size_t i = 1; i < graph.numVirtualRegisters(); i++) {
3787 VirtualRegister& reg = vregs[i];
3789 if (mir->shouldCancel(
3790 "Backtracking Resolve Control Flow (vreg outer loop)")) {
3791 return false;
3794 for (LiveRange::RegisterLinkIterator iter = reg.rangesBegin(); iter;) {
3795 LiveRange* range = LiveRange::get(*iter);
3797 if (mir->shouldCancel(
3798 "Backtracking Resolve Control Flow (vreg inner loop)")) {
3799 return false;
3802 // Remove ranges which will never be used.
3803 if (deadRange(range)) {
3804 reg.removeRangeAndIncrement(iter);
3805 continue;
3808 // The range which defines the register does not have a predecessor
3809 // to add moves from.
3810 if (range->hasDefinition()) {
3811 iter++;
3812 continue;
3815 // Ignore ranges that start at block boundaries. We will handle
3816 // these in the next phase.
3817 CodePosition start = range->from();
3818 LNode* ins = insData[start];
3819 if (start == entryOf(ins->block())) {
3820 iter++;
3821 continue;
3824 // If we already saw a range which covers the start of this range
3825 // and has the same allocation, we don't need an explicit move at
3826 // the start of this range.
3827 bool skip = false;
3828 for (LiveRange::RegisterLinkIterator prevIter = reg.rangesBegin();
3829 prevIter != iter; prevIter++) {
3830 LiveRange* prevRange = LiveRange::get(*prevIter);
3831 if (prevRange->covers(start) && prevRange->bundle()->allocation() ==
3832 range->bundle()->allocation()) {
3833 skip = true;
3834 break;
3837 if (skip) {
3838 iter++;
3839 continue;
3842 if (!alloc().ensureBallast()) {
3843 return false;
3846 LiveRange* predecessorRange =
3847 reg.rangeFor(start.previous(), /* preferRegister = */ true);
3848 if (start.subpos() == CodePosition::INPUT) {
3849 JitSpewIfEnabled(JitSpew_RegAlloc, " moveInput (%s) <- (%s)",
3850 range->toString().get(),
3851 predecessorRange->toString().get());
3852 if (!moveInput(ins->toInstruction(), predecessorRange, range,
3853 reg.type())) {
3854 return false;
3856 } else {
3857 JitSpew(JitSpew_RegAlloc, " (moveAfter)");
3858 if (!moveAfter(ins->toInstruction(), predecessorRange, range,
3859 reg.type())) {
3860 return false;
3864 iter++;
3868 JitSpew(JitSpew_RegAlloc,
3869 " ResolveControlFlow: adding MoveGroups for phi nodes");
3871 for (size_t i = 0; i < graph.numBlocks(); i++) {
3872 if (mir->shouldCancel("Backtracking Resolve Control Flow (block loop)")) {
3873 return false;
3876 LBlock* successor = graph.getBlock(i);
3877 MBasicBlock* mSuccessor = successor->mir();
3878 if (mSuccessor->numPredecessors() < 1) {
3879 continue;
3882 // Resolve phis to moves.
3883 for (size_t j = 0; j < successor->numPhis(); j++) {
3884 LPhi* phi = successor->getPhi(j);
3885 MOZ_ASSERT(phi->numDefs() == 1);
3886 LDefinition* def = phi->getDef(0);
3887 VirtualRegister& reg = vreg(def);
3888 LiveRange* to = reg.rangeFor(entryOf(successor));
3889 MOZ_ASSERT(to);
3891 for (size_t k = 0; k < mSuccessor->numPredecessors(); k++) {
3892 LBlock* predecessor = mSuccessor->getPredecessor(k)->lir();
3893 MOZ_ASSERT(predecessor->mir()->numSuccessors() == 1);
3895 LAllocation* input = phi->getOperand(k);
3896 LiveRange* from = vreg(input).rangeFor(exitOf(predecessor),
3897 /* preferRegister = */ true);
3898 MOZ_ASSERT(from);
3900 if (!alloc().ensureBallast()) {
3901 return false;
3904 // Note: we have to use moveAtEdge both here and below (for edge
3905 // resolution) to avoid conflicting moves. See bug 1493900.
3906 JitSpew(JitSpew_RegAlloc, " (moveAtEdge#1)");
3907 if (!moveAtEdge(predecessor, successor, from, to, def->type())) {
3908 return false;
3914 JitSpew(JitSpew_RegAlloc,
3915 " ResolveControlFlow: adding MoveGroups to fix conflicted edges");
3917 // Add moves to resolve graph edges with different allocations at their
3918 // source and target.
3919 for (size_t i = 1; i < graph.numVirtualRegisters(); i++) {
3920 VirtualRegister& reg = vregs[i];
3921 for (LiveRange::RegisterLinkIterator iter = reg.rangesBegin(); iter;
3922 iter++) {
3923 LiveRange* targetRange = LiveRange::get(*iter);
3925 size_t firstBlockId = insData[targetRange->from()]->block()->mir()->id();
3926 if (!targetRange->covers(entryOf(graph.getBlock(firstBlockId)))) {
3927 firstBlockId++;
3929 for (size_t id = firstBlockId; id < graph.numBlocks(); id++) {
3930 LBlock* successor = graph.getBlock(id);
3931 if (!targetRange->covers(entryOf(successor))) {
3932 break;
3935 BitSet& live = liveIn[id];
3936 if (!live.contains(i)) {
3937 continue;
3940 for (size_t j = 0; j < successor->mir()->numPredecessors(); j++) {
3941 LBlock* predecessor = successor->mir()->getPredecessor(j)->lir();
3942 if (targetRange->covers(exitOf(predecessor))) {
3943 continue;
3946 if (!alloc().ensureBallast()) {
3947 return false;
3949 JitSpew(JitSpew_RegAlloc, " (moveAtEdge#2)");
3950 LiveRange* from = reg.rangeFor(exitOf(predecessor), true);
3951 if (!moveAtEdge(predecessor, successor, from, targetRange,
3952 reg.type())) {
3953 return false;
3960 JitSpew(JitSpew_RegAlloc, "ResolveControlFlow: end");
3961 return true;
3964 // Helper for ::addLiveRegistersForRange
3965 size_t BacktrackingAllocator::findFirstNonCallSafepoint(CodePosition from) {
3966 size_t i = 0;
3967 for (; i < graph.numNonCallSafepoints(); i++) {
3968 const LInstruction* ins = graph.getNonCallSafepoint(i);
3969 if (from <= inputOf(ins)) {
3970 break;
3973 return i;
3976 // Helper for ::installAllocationsInLIR
3977 void BacktrackingAllocator::addLiveRegistersForRange(VirtualRegister& reg,
3978 LiveRange* range) {
3979 // Fill in the live register sets for all non-call safepoints.
3980 LAllocation a = range->bundle()->allocation();
3981 if (!a.isRegister()) {
3982 return;
3985 // Don't add output registers to the safepoint.
3986 CodePosition start = range->from();
3987 if (range->hasDefinition() && !reg.isTemp()) {
3988 #ifdef CHECK_OSIPOINT_REGISTERS
3989 // We don't add the output register to the safepoint,
3990 // but it still might get added as one of the inputs.
3991 // So eagerly add this reg to the safepoint clobbered registers.
3992 if (reg.ins()->isInstruction()) {
3993 if (LSafepoint* safepoint = reg.ins()->toInstruction()->safepoint()) {
3994 safepoint->addClobberedRegister(a.toRegister());
3997 #endif
3998 start = start.next();
4001 size_t i = findFirstNonCallSafepoint(start);
4002 for (; i < graph.numNonCallSafepoints(); i++) {
4003 LInstruction* ins = graph.getNonCallSafepoint(i);
4004 CodePosition pos = inputOf(ins);
4006 // Safepoints are sorted, so we can shortcut out of this loop
4007 // if we go out of range.
4008 if (range->to() <= pos) {
4009 break;
4012 MOZ_ASSERT(range->covers(pos));
4014 LSafepoint* safepoint = ins->safepoint();
4015 safepoint->addLiveRegister(a.toRegister());
4017 #ifdef CHECK_OSIPOINT_REGISTERS
4018 if (reg.isTemp()) {
4019 safepoint->addClobberedRegister(a.toRegister());
4021 #endif
4025 // Helper for ::installAllocationsInLIR
4026 static inline size_t NumReusingDefs(LInstruction* ins) {
4027 size_t num = 0;
4028 for (size_t i = 0; i < ins->numDefs(); i++) {
4029 LDefinition* def = ins->getDef(i);
4030 if (def->policy() == LDefinition::MUST_REUSE_INPUT) {
4031 num++;
4034 return num;
4037 bool BacktrackingAllocator::installAllocationsInLIR() {
4038 JitSpew(JitSpew_RegAlloc, "Installing Allocations");
4040 MOZ_ASSERT(!vregs[0u].hasRanges());
4041 for (size_t i = 1; i < graph.numVirtualRegisters(); i++) {
4042 VirtualRegister& reg = vregs[i];
4044 if (mir->shouldCancel("Backtracking Install Allocations (main loop)")) {
4045 return false;
4048 for (LiveRange::RegisterLinkIterator iter = reg.rangesBegin(); iter;
4049 iter++) {
4050 LiveRange* range = LiveRange::get(*iter);
4052 if (range->hasDefinition()) {
4053 reg.def()->setOutput(range->bundle()->allocation());
4054 if (reg.ins()->recoversInput()) {
4055 LSnapshot* snapshot = reg.ins()->toInstruction()->snapshot();
4056 for (size_t i = 0; i < snapshot->numEntries(); i++) {
4057 LAllocation* entry = snapshot->getEntry(i);
4058 if (entry->isUse() &&
4059 entry->toUse()->policy() == LUse::RECOVERED_INPUT) {
4060 *entry = *reg.def()->output();
4066 for (UsePositionIterator iter(range->usesBegin()); iter; iter++) {
4067 LAllocation* alloc = iter->use();
4068 *alloc = range->bundle()->allocation();
4070 // For any uses which feed into MUST_REUSE_INPUT definitions,
4071 // add copies if the use and def have different allocations.
4072 LNode* ins = insData[iter->pos];
4073 if (LDefinition* def = FindReusingDefOrTemp(ins, alloc)) {
4074 LiveRange* outputRange = vreg(def).rangeFor(outputOf(ins));
4075 LAllocation res = outputRange->bundle()->allocation();
4076 LAllocation sourceAlloc = range->bundle()->allocation();
4078 if (res != *alloc) {
4079 if (!this->alloc().ensureBallast()) {
4080 return false;
4082 if (NumReusingDefs(ins->toInstruction()) <= 1) {
4083 LMoveGroup* group = getInputMoveGroup(ins->toInstruction());
4084 if (!group->addAfter(sourceAlloc, res, reg.type())) {
4085 return false;
4087 } else {
4088 LMoveGroup* group = getFixReuseMoveGroup(ins->toInstruction());
4089 if (!group->add(sourceAlloc, res, reg.type())) {
4090 return false;
4093 *alloc = res;
4098 addLiveRegistersForRange(reg, range);
4102 graph.setLocalSlotsSize(stackSlotAllocator.stackHeight());
4103 return true;
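// For illustration (registers invented): suppose an instruction's def must
// reuse its first input (MUST_REUSE_INPUT), the def's bundle ended up in rax,
// and the input use's bundle ended up in rcx.  The use is first written out
// as rcx; the code above then adds a move rcx -> rax to the instruction's
// input move group and rewrites the use to rax, so the reuse constraint holds
// when the instruction executes.  If an instruction has more than one reusing
// def, the copy goes into the separate "fix reuse" move group instead.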
4106 // Helper for ::populateSafepoints
4107 size_t BacktrackingAllocator::findFirstSafepoint(CodePosition pos,
4108 size_t startFrom) {
4109 size_t i = startFrom;
4110 for (; i < graph.numSafepoints(); i++) {
4111 LInstruction* ins = graph.getSafepoint(i);
4112 if (pos <= inputOf(ins)) {
4113 break;
4116 return i;
4119 // Helper for ::populateSafepoints
4120 static inline bool IsNunbox(VirtualRegister& reg) {
4121 #ifdef JS_NUNBOX32
4122 return reg.type() == LDefinition::TYPE || reg.type() == LDefinition::PAYLOAD;
4123 #else
4124 return false;
4125 #endif
4128 // Helper for ::populateSafepoints
4129 static inline bool IsSlotsOrElements(VirtualRegister& reg) {
4130 return reg.type() == LDefinition::SLOTS;
4133 // Helper for ::populateSafepoints
4134 static inline bool IsTraceable(VirtualRegister& reg) {
4135 if (reg.type() == LDefinition::OBJECT ||
4136 reg.type() == LDefinition::WASM_ANYREF) {
4137 return true;
4139 #ifdef JS_PUNBOX64
4140 if (reg.type() == LDefinition::BOX) {
4141 return true;
4143 #endif
4144 if (reg.type() == LDefinition::STACKRESULTS) {
4145 MOZ_ASSERT(reg.def());
4146 const LStackArea* alloc = reg.def()->output()->toStackArea();
4147 for (auto iter = alloc->results(); iter; iter.next()) {
4148 if (iter.isWasmAnyRef()) {
4149 return true;
4153 return false;
4156 bool BacktrackingAllocator::populateSafepoints() {
4157 JitSpew(JitSpew_RegAlloc, "Populating Safepoints");
4159 size_t firstSafepoint = 0;
4161 MOZ_ASSERT(!vregs[0u].def());
4162 for (uint32_t i = 1; i < graph.numVirtualRegisters(); i++) {
4163 VirtualRegister& reg = vregs[i];
4165 if (!reg.def() ||
4166 (!IsTraceable(reg) && !IsSlotsOrElements(reg) && !IsNunbox(reg))) {
4167 continue;
4170 firstSafepoint = findFirstSafepoint(inputOf(reg.ins()), firstSafepoint);
4171 if (firstSafepoint >= graph.numSafepoints()) {
4172 break;
4175 for (LiveRange::RegisterLinkIterator iter = reg.rangesBegin(); iter;
4176 iter++) {
4177 LiveRange* range = LiveRange::get(*iter);
4179 for (size_t j = firstSafepoint; j < graph.numSafepoints(); j++) {
4180 LInstruction* ins = graph.getSafepoint(j);
4182 if (!range->covers(inputOf(ins))) {
4183 if (inputOf(ins) >= range->to()) {
4184 break;
4186 continue;
4189 // Include temps but not instruction outputs. Also make sure
4190 // MUST_REUSE_INPUT is not used with gcthings or nunboxes, or
4191 // we would have to add the input reg to this safepoint.
4192 if (ins == reg.ins() && !reg.isTemp()) {
4193 DebugOnly<LDefinition*> def = reg.def();
4194 MOZ_ASSERT_IF(def->policy() == LDefinition::MUST_REUSE_INPUT,
4195 def->type() == LDefinition::GENERAL ||
4196 def->type() == LDefinition::INT32 ||
4197 def->type() == LDefinition::FLOAT32 ||
4198 def->type() == LDefinition::DOUBLE ||
4199 def->type() == LDefinition::SIMD128);
4200 continue;
4203 LSafepoint* safepoint = ins->safepoint();
4205 LAllocation a = range->bundle()->allocation();
4206 if (a.isGeneralReg() && ins->isCall()) {
4207 continue;
4210 switch (reg.type()) {
4211 case LDefinition::OBJECT:
4212 if (!safepoint->addGcPointer(a)) {
4213 return false;
4215 break;
4216 case LDefinition::SLOTS:
4217 if (!safepoint->addSlotsOrElementsPointer(a)) {
4218 return false;
4220 break;
4221 case LDefinition::WASM_ANYREF:
4222 if (!safepoint->addWasmAnyRef(a)) {
4223 return false;
4225 break;
4226 case LDefinition::STACKRESULTS: {
4227 MOZ_ASSERT(a.isStackArea());
4228 for (auto iter = a.toStackArea()->results(); iter; iter.next()) {
4229 if (iter.isWasmAnyRef()) {
4230 if (!safepoint->addWasmAnyRef(iter.alloc())) {
4231 return false;
4235 break;
4237 #ifdef JS_NUNBOX32
4238 case LDefinition::TYPE:
4239 if (!safepoint->addNunboxType(i, a)) {
4240 return false;
4242 break;
4243 case LDefinition::PAYLOAD:
4244 if (!safepoint->addNunboxPayload(i, a)) {
4245 return false;
4247 break;
4248 #else
4249 case LDefinition::BOX:
4250 if (!safepoint->addBoxedValue(a)) {
4251 return false;
4253 break;
4254 #endif
4255 default:
4256 MOZ_CRASH("Bad register type");
4262 return true;
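// For illustration: an OBJECT-typed value live across a safepoint is recorded
// with addGcPointer, SLOTS with addSlotsOrElementsPointer, and wasm anyrefs
// with addWasmAnyRef.  Boxed Values are recorded as a single allocation on
// 64-bit (punbox) builds, but as separate TYPE and PAYLOAD halves, keyed by
// vreg id, on 32-bit (nunbox) builds.  Allocations in general-purpose
// registers are skipped at call safepoints (see the isCall check above).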
4265 bool BacktrackingAllocator::annotateMoveGroups() {
4266 // Annotate move groups in the LIR graph with any register that is not
4267 // allocated at that point and can be used as a scratch register. This is
4268 // only required for x86, as other platforms always have scratch registers
4269 // available for use.
4270 #ifdef JS_CODEGEN_X86
4271 LiveRange* range = LiveRange::FallibleNew(alloc(), nullptr, CodePosition(),
4272 CodePosition().next());
4273 if (!range) {
4274 return false;
4277 for (size_t i = 0; i < graph.numBlocks(); i++) {
4278 if (mir->shouldCancel("Backtracking Annotate Move Groups")) {
4279 return false;
4282 LBlock* block = graph.getBlock(i);
4283 LInstruction* last = nullptr;
4284 for (LInstructionIterator iter = block->begin(); iter != block->end();
4285 ++iter) {
4286 if (iter->isMoveGroup()) {
4287 CodePosition from = last ? outputOf(last) : entryOf(block);
4288 range->setTo(from.next());
4289 range->setFrom(from);
4291 for (size_t i = 0; i < AnyRegister::Total; i++) {
4292 PhysicalRegister& reg = registers[i];
4293 if (reg.reg.isFloat() || !reg.allocatable) {
4294 continue;
4297 // This register is unavailable for use if (a) it is in use
4298 // by some live range immediately before the move group,
4299 // or (b) it is an operand in one of the group's moves. The
4300 // latter case handles live ranges which end immediately
4301 // before the move group or start immediately after.
4302 // For (b) we need to consider move groups immediately
4303 // preceding or following this one.
4305 if (iter->toMoveGroup()->uses(reg.reg.gpr())) {
4306 continue;
4308 bool found = false;
4309 LInstructionIterator niter(iter);
4310 for (niter++; niter != block->end(); niter++) {
4311 if (niter->isMoveGroup()) {
4312 if (niter->toMoveGroup()->uses(reg.reg.gpr())) {
4313 found = true;
4314 break;
4316 } else {
4317 break;
4320 if (iter != block->begin()) {
4321 LInstructionIterator riter(iter);
4322 do {
4323 riter--;
4324 if (riter->isMoveGroup()) {
4325 if (riter->toMoveGroup()->uses(reg.reg.gpr())) {
4326 found = true;
4327 break;
4329 } else {
4330 break;
4332 } while (riter != block->begin());
4335 if (found) {
4336 continue;
4338 LiveRangePlus existingPlus;
4339 LiveRangePlus rangePlus(range);
4340 if (reg.allocations.contains(rangePlus, &existingPlus)) {
4341 continue;
4344 iter->toMoveGroup()->setScratchRegister(reg.reg.gpr());
4345 break;
4347 } else {
4348 last = *iter;
4352 #endif
4354 return true;
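// For illustration (x86 only; the register is invented): if a move group sits
// between two instructions and edx is not live across that point, is not
// mentioned by this move group, and is not mentioned by the move groups
// immediately before or after it, then edx is recorded as the group's scratch
// register.  The code generator can later use it when a move would otherwise
// need a memory-to-memory copy, which x86 cannot encode directly.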
4357 ///////////////////////////////////////////////////////////////////////////////
4358 // //
4359 // Debug-printing support //
4360 // //
4361 ///////////////////////////////////////////////////////////////////////////////
4363 #ifdef JS_JITSPEW
4365 UniqueChars LiveRange::toString() const {
4366 AutoEnterOOMUnsafeRegion oomUnsafe;
4368 UniqueChars buf = JS_smprintf("v%u %u-%u", hasVreg() ? vreg().vreg() : 0,
4369 from().bits(), to().bits() - 1);
4371 if (buf && bundle() && !bundle()->allocation().isBogus()) {
4372 buf = JS_sprintf_append(std::move(buf), " %s",
4373 bundle()->allocation().toString().get());
4376 buf = JS_sprintf_append(std::move(buf), " {");
4378 if (buf && hasDefinition()) {
4379 buf = JS_sprintf_append(std::move(buf), " %u_def", from().bits());
4380 if (hasVreg()) {
4381 // If the definition has a fixed requirement, print it too.
4382 const LDefinition* def = vreg().def();
4383 LDefinition::Policy policy = def->policy();
4384 if (policy == LDefinition::FIXED || policy == LDefinition::STACK) {
4385 if (buf) {
4386 buf = JS_sprintf_append(std::move(buf), ":F:%s",
4387 def->output()->toString().get());
4393 for (UsePositionIterator iter = usesBegin(); buf && iter; iter++) {
4394 buf = JS_sprintf_append(std::move(buf), " %u_%s", iter->pos.bits(),
4395 iter->use()->toString().get());
4398 buf = JS_sprintf_append(std::move(buf), " }");
4400 if (!buf) {
4401 oomUnsafe.crash("LiveRange::toString()");
4404 return buf;
4407 UniqueChars LiveBundle::toString() const {
4408 AutoEnterOOMUnsafeRegion oomUnsafe;
4410 UniqueChars buf = JS_smprintf("LB%u(", debugId());
4412 if (buf) {
4413 if (spillParent()) {
4414 buf = JS_sprintf_append(std::move(buf), "parent=LB%u",
4415 spillParent()->debugId());
4416 } else {
4417 buf = JS_sprintf_append(std::move(buf), "parent=none");
4421 for (LiveRange::BundleLinkIterator iter = rangesBegin(); buf && iter;
4422 iter++) {
4423 if (buf) {
4424 buf = JS_sprintf_append(std::move(buf), "%s %s",
4425 (iter == rangesBegin()) ? "" : " ##",
4426 LiveRange::get(*iter)->toString().get());
4430 if (buf) {
4431 buf = JS_sprintf_append(std::move(buf), ")");
4434 if (!buf) {
4435 oomUnsafe.crash("LiveBundle::toString()");
4438 return buf;
4441 void BacktrackingAllocator::dumpLiveRangesByVReg(const char* who) {
4442 MOZ_ASSERT(!vregs[0u].hasRanges());
4444 JitSpewCont(JitSpew_RegAlloc, "\n");
4445 JitSpew(JitSpew_RegAlloc, "Live ranges by virtual register (%s):", who);
4447 for (uint32_t i = 1; i < graph.numVirtualRegisters(); i++) {
4448 JitSpewHeader(JitSpew_RegAlloc);
4449 JitSpewCont(JitSpew_RegAlloc, " ");
4450 VirtualRegister& reg = vregs[i];
4451 for (LiveRange::RegisterLinkIterator iter = reg.rangesBegin(); iter;
4452 iter++) {
4453 if (iter != reg.rangesBegin()) {
4454 JitSpewCont(JitSpew_RegAlloc, " ## ");
4456 JitSpewCont(JitSpew_RegAlloc, "%s",
4457 LiveRange::get(*iter)->toString().get());
4459 JitSpewCont(JitSpew_RegAlloc, "\n");
4463 void BacktrackingAllocator::dumpLiveRangesByBundle(const char* who) {
4464 MOZ_ASSERT(!vregs[0u].hasRanges());
4466 JitSpewCont(JitSpew_RegAlloc, "\n");
4467 JitSpew(JitSpew_RegAlloc, "Live ranges by bundle (%s):", who);
4469 for (uint32_t i = 1; i < graph.numVirtualRegisters(); i++) {
4470 VirtualRegister& reg = vregs[i];
4471 for (LiveRange::RegisterLinkIterator baseIter = reg.rangesBegin(); baseIter;
4472 baseIter++) {
4473 LiveRange* range = LiveRange::get(*baseIter);
4474 LiveBundle* bundle = range->bundle();
4475 if (range == bundle->firstRange()) {
4476 JitSpew(JitSpew_RegAlloc, " %s", bundle->toString().get());
4482 void BacktrackingAllocator::dumpAllocations() {
4483 JitSpew(JitSpew_RegAlloc, "Allocations:");
4485 dumpLiveRangesByBundle("in dumpAllocations()");
4487 JitSpewCont(JitSpew_RegAlloc, "\n");
4488 JitSpew(JitSpew_RegAlloc, "Allocations by physical register:");
4490 for (size_t i = 0; i < AnyRegister::Total; i++) {
4491 if (registers[i].allocatable && !registers[i].allocations.empty()) {
4492 JitSpewHeader(JitSpew_RegAlloc);
4493 JitSpewCont(JitSpew_RegAlloc, " %s:", AnyRegister::FromCode(i).name());
4494 bool first = true;
4495 LiveRangePlusSet::Iter lrpIter(&registers[i].allocations);
4496 while (lrpIter.hasMore()) {
4497 LiveRange* range = lrpIter.next().liveRange();
4498 if (first) {
4499 first = false;
4500 } else {
4501 fprintf(stderr, " /");
4503 fprintf(stderr, " %s", range->toString().get());
4505 JitSpewCont(JitSpew_RegAlloc, "\n");
4509 JitSpewCont(JitSpew_RegAlloc, "\n");
4512 #endif // JS_JITSPEW
4514 ///////////////////////////////////////////////////////////////////////////////
4515 // //
4516 // Top level of the register allocation machinery //
4517 // //
4518 ///////////////////////////////////////////////////////////////////////////////
4520 bool BacktrackingAllocator::go() {
4521 JitSpewCont(JitSpew_RegAlloc, "\n");
4522 JitSpew(JitSpew_RegAlloc, "Beginning register allocation");
4524 JitSpewCont(JitSpew_RegAlloc, "\n");
4525 if (JitSpewEnabled(JitSpew_RegAlloc)) {
4526 dumpInstructions("(Pre-allocation LIR)");
4529 if (!init()) {
4530 return false;
4533 if (!buildLivenessInfo()) {
4534 return false;
4537 #ifdef JS_JITSPEW
4538 if (JitSpewEnabled(JitSpew_RegAlloc)) {
4539 dumpLiveRangesByVReg("after liveness analysis");
4541 #endif
4543 if (!allocationQueue.reserve(graph.numVirtualRegisters() * 3 / 2)) {
4544 return false;
4547 JitSpewCont(JitSpew_RegAlloc, "\n");
4548 JitSpew(JitSpew_RegAlloc, "Beginning grouping and queueing registers");
4549 if (!mergeAndQueueRegisters()) {
4550 return false;
4552 JitSpew(JitSpew_RegAlloc, "Completed grouping and queueing registers");
4554 #ifdef JS_JITSPEW
4555 if (JitSpewEnabled(JitSpew_RegAlloc)) {
4556 dumpLiveRangesByBundle("after grouping/queueing regs");
4558 #endif
4560 // There now follow two allocation loops, which are really the heart of the
4561 // allocator. First, the "main" allocation loop. This does almost all of
4562 // the allocation work, by repeatedly pulling bundles out of
4563 // ::allocationQueue and calling ::processBundle on it, until there are no
4564 // bundles left in the queue. Note that ::processBundle can add new smaller
4565 // bundles to the queue if it needs to split or spill a bundle.
4567 // For each bundle in turn pulled out of ::allocationQueue, ::processBundle:
4569 // * calls ::computeRequirement to discover the overall constraint for the
4570 // bundle.
4572 // * tries to find a register for it, by calling either ::tryAllocateFixed or
4573 // ::tryAllocateNonFixed.
4575 // * if that fails, but ::tryAllocateFixed / ::tryAllocateNonFixed indicate
4576 // that there is some other bundle with lower spill weight that can be
4577 // evicted, then that bundle is evicted (hence, put back into
4578 // ::allocationQueue), and we try again.
4580 // * at most MAX_ATTEMPTS such attempts may be made.
4582 // * If that still fails to find a register, then the bundle is handed off to
4583 // ::chooseBundleSplit. That will choose to either split the bundle,
4584 // yielding multiple pieces which are put back into ::allocationQueue, or
4585 // it will spill the bundle. Note that the same mechanism applies to both;
4586 // there's no clear boundary between splitting and spilling, because
4587 // spilling can be interpreted as an extreme form of splitting.
4589 // ::processBundle and its callees contain much gnarly logic which isn't
4590 // easy to understand, particularly in the area of how eviction candidates
4591 // are chosen. But it works well enough, and tinkering doesn't seem to
4592 // improve the resulting allocations. More important is the splitting logic,
4593 // because that controls where spill/reload instructions are placed.
4595 // Eventually ::allocationQueue becomes empty, and each LiveBundle has either
4596 // been allocated a register or is marked for spilling. In the latter case
4597 // it will have been added to ::spilledBundles.
4599 JitSpewCont(JitSpew_RegAlloc, "\n");
4600 JitSpew(JitSpew_RegAlloc, "Beginning main allocation loop");
4601 JitSpewCont(JitSpew_RegAlloc, "\n");
4603 // Allocate, spill and split bundles until finished.
4604 while (!allocationQueue.empty()) {
4605 if (mir->shouldCancel("Backtracking Allocation")) {
4606 return false;
4609 QueueItem item = allocationQueue.removeHighest();
4610 if (!processBundle(mir, item.bundle)) {
4611 return false;
4615 // And here's the second allocation loop (hidden inside
4616 // ::tryAllocatingRegistersForSpillBundles). It makes one last attempt to
4617 // find a register for each spill bundle. There's no attempt to free up
4618 // registers by eviction. In at least 99% of cases this attempt fails, in
4619 // which case the bundle is handed off to ::spill. The lucky remaining 1%
4620 // get a register. Unfortunately this scheme interacts badly with the
4621 // splitting strategy, leading to excessive register-to-register copying in
4622 // some very simple cases. See bug 1752520.
4624 // A modest but probably worthwhile amount of allocation time can be saved by
4625 // making ::tryAllocatingRegistersForSpillBundles use specialised versions of
4626 // ::tryAllocateAnyRegister and its callees, that don't bother to create sets
4627 // of conflicting bundles. Creating those sets is expensive and, here,
4628 // pointless, since we're not going to do any eviction based on them. This
4629 // refinement is implemented in the un-landed patch at bug 1758274 comment
4630 // 15.
4632 JitSpewCont(JitSpew_RegAlloc, "\n");
4633 JitSpew(JitSpew_RegAlloc,
4634 "Main allocation loop complete; "
4635 "beginning spill-bundle allocation loop");
4636 JitSpewCont(JitSpew_RegAlloc, "\n");
4638 if (!tryAllocatingRegistersForSpillBundles()) {
4639 return false;
4642 JitSpewCont(JitSpew_RegAlloc, "\n");
4643 JitSpew(JitSpew_RegAlloc, "Spill-bundle allocation loop complete");
4644 JitSpewCont(JitSpew_RegAlloc, "\n");
4646 if (!pickStackSlots()) {
4647 return false;
4650 #ifdef JS_JITSPEW
4651 if (JitSpewEnabled(JitSpew_RegAlloc)) {
4652 dumpAllocations();
4654 #endif
4656 if (!createMoveGroupsFromLiveRangeTransitions()) {
4657 return false;
4660 if (!installAllocationsInLIR()) {
4661 return false;
4664 if (!populateSafepoints()) {
4665 return false;
4668 if (!annotateMoveGroups()) {
4669 return false;
4672 JitSpewCont(JitSpew_RegAlloc, "\n");
4673 if (JitSpewEnabled(JitSpew_RegAlloc)) {
4674 dumpInstructions("(Post-allocation LIR)");
4677 JitSpew(JitSpew_RegAlloc, "Finished register allocation");
4679 return true;
4682 ///////////////////////////////////////////////////////////////////////////////
4683 // //
4684 ///////////////////////////////////////////////////////////////////////////////