src/assembly/x86/assem-rtns.lisp

   1 ;;;; the machine specific support routines needed by the file assembler
   2
   3 ;;;; This software is part of the SBCL system. See the README file for
   4 ;;;; more information.
   5 ;;;;
   6 ;;;; This software is derived from the CMU CL system, which was
   7 ;;;; written at Carnegie Mellon University and released into the
   8 ;;;; public domain. The software is in the public domain and is
   9 ;;;; provided with absolutely no warranty. See the COPYING and CREDITS
  10 ;;;; files for more information.
  11
  12 (in-package "SB!VM")
  13 \f
  14 ;;;; RETURN-MULTIPLE
  15
  16 ;;; For RETURN-MULTIPLE, we have to move the results from the end of
  17 ;;; the frame for the function that is returning to the end of the
  18 ;;; frame for the function being returned to.
  19
  20 #+sb-assembling ;; We don't want a vop for this one.
  21 (define-assembly-routine
  22     (return-multiple (:return-style :none))
  23     (;; These are really arguments.
  24      (:temp ecx unsigned-reg ecx-offset)
  25      (:temp esi unsigned-reg esi-offset)
  26
  27      ;; These we need as temporaries.
  28      (:temp eax unsigned-reg eax-offset)
  29      (:temp ebx unsigned-reg ebx-offset)
  30      (:temp edx unsigned-reg edx-offset)
  31      (:temp edi unsigned-reg edi-offset))
  32
  33   ;; Pick off the cases where everything fits in register args.
  34   (inst jecxz ZERO-VALUES)
  35   (inst cmp ecx (fixnumize 1))
  36   (inst jmp :e ONE-VALUE)
  37   (inst cmp ecx (fixnumize 2))
  38   (inst jmp :e TWO-VALUES)
  39   (inst cmp ecx (fixnumize 3))
  40   (inst jmp :e THREE-VALUES)
  41
  42   ;; As per the calling convention EBX is expected to point at the SP
  43   ;; before the stack frame.
  44   (inst lea ebx (make-ea :dword :base ebp-tn
  45                          :disp (* sp->fp-offset n-word-bytes)))
  46
  47   ;; Save the count, the return address and restore the frame pointer,
  48   ;; because the loop is going to destroy them.
  49   (inst mov edx ecx)
  50   (inst mov eax (make-ea :dword :base ebp-tn
  51                          :disp (frame-byte-offset return-pc-save-offset)))
  52   (inst mov ebp-tn (make-ea :dword :base ebp-tn
  53                             :disp (frame-byte-offset ocfp-save-offset)))
  54   ;; Blit the values down the stack. Note: there might be overlap, so
  55   ;; we have to be careful not to clobber values before we've read
  56   ;; them. Because the stack builds down, we are copying to a larger
  57   ;; address. Therefore, we need to iterate from larger addresses to
  58   ;; smaller addresses. pfw-this says copy ecx words from esi to edi
  59   ;; counting down.
  60   (inst shr ecx (1- n-lowtag-bits))
  61   (inst std)                            ; count down
  62   (inst sub esi n-word-bytes)
  63   (inst lea edi (make-ea :dword :base ebx :disp (- n-word-bytes)))
  64   (inst rep)
  65   (inst movs :dword)
  66   (inst cld)
  67
  68   ;; Restore the count.
  69   (inst mov ecx edx)
  70
  71   ;; Set the stack top to the last result.
  72   (inst lea esp-tn (make-ea :dword :base edi :disp n-word-bytes))
  73
  74   ;; Load the register args.
  75   (loadw edx ebx -1)
  76   (loadw edi ebx -2)
  77   (loadw esi ebx -3)
  78
  79   ;; And back we go.
  80   (inst stc)
  81   (inst push eax)
  82   (inst ret)
  83
  84   ;; Handle the register arg cases.
  85   ZERO-VALUES
  86   (inst lea ebx (make-ea :dword :base ebp-tn
  87                          :disp (* sp->fp-offset n-word-bytes)))
  88   (inst mov edx nil-value)
  89   (inst mov edi edx)
  90   (inst mov esi edx)
  91   (inst mov esp-tn ebp-tn)
  92   (inst stc)
  93   (inst pop ebp-tn)
  94   (inst ret)
  95
  96   ;; Note: we can get this, because the return-multiple vop doesn't
  97   ;; check for this case when size > speed.
  98   ONE-VALUE
  99   (loadw edx esi -1)
 100   (inst mov esp-tn ebp-tn)
 101   (inst clc)
 102   (inst pop ebp-tn)
 103   (inst ret)
 104
 105   TWO-VALUES
 106   (inst lea ebx (make-ea :dword :base ebp-tn
 107                          :disp (* sp->fp-offset n-word-bytes)))
 108   (loadw edx esi -1)
 109   (loadw edi esi -2)
 110   (inst mov esi nil-value)
 111   (inst mov esp-tn ebp-tn)
 112   (inst stc)
 113   (inst pop ebp-tn)
 114   (inst ret)
 115
 116   THREE-VALUES
 117   (inst lea ebx (make-ea :dword :base ebp-tn
 118                          :disp (* sp->fp-offset n-word-bytes)))
 119   (loadw edx esi -1)
 120   (loadw edi esi -2)
 121   (loadw esi esi -3)
 122   (inst mov esp-tn ebp-tn)
 123   (inst stc)
 124   (inst pop ebp-tn)
 125   (inst ret))
 126 \f
 127 ;;;; TAIL-CALL-VARIABLE
 128
 129 ;;; For tail-call-variable, we have to copy the arguments from the end
 130 ;;; of our stack frame (were args are produced) to the start of our
 131 ;;; stack frame (were args are expected).
 132 ;;;
 133 ;;; We take the function to call in EAX and a pointer to the arguments in
 134 ;;; ESI. EBP says the same over the jump, and the old frame pointer is
 135 ;;; still saved in the first stack slot. The return-pc is saved in
 136 ;;; the second stack slot, so we have to push it to make it look like
 137 ;;; we actually called. We also have to compute ECX from the difference
 138 ;;; between ESI and the stack top.
 139 #+sb-assembling ;; No vop for this one either.
 140 (define-assembly-routine
 141     (tail-call-variable
 142      (:return-style :none))
 143
 144     ((:temp eax unsigned-reg eax-offset)
 145      (:temp ebx unsigned-reg ebx-offset)
 146      (:temp ecx unsigned-reg ecx-offset)
 147      (:temp edx unsigned-reg edx-offset)
 148      (:temp edi unsigned-reg edi-offset)
 149      (:temp esi unsigned-reg esi-offset))
 150
 151   ;; Calculate NARGS (as a fixnum)
 152   (move ecx esi)
 153   (inst sub ecx esp-tn)
 154
 155   ;; Check for all the args fitting the registers.
 156   (inst cmp ecx (fixnumize 3))
 157   (inst jmp :le REGISTER-ARGS)
 158
 159   ;; Save the OLD-FP and RETURN-PC because the blit is going to trash
 160   ;; those stack locations. Save the ECX, because the loop is going to
 161   ;; trash it.
 162   (pushw ebp-tn (frame-word-offset ocfp-save-offset))
 163   (loadw ebx ebp-tn (frame-word-offset return-pc-save-offset))
 164   (inst push ecx)
 165
 166   ;; Do the blit. Because we are coping from smaller addresses to
 167   ;; larger addresses, we have to start at the largest pair and work
 168   ;; our way down.
 169   (inst shr ecx (1- n-lowtag-bits))
 170   (inst std)                            ; count down
 171   (inst lea edi (make-ea :dword :base ebp-tn :disp (frame-byte-offset 0)))
 172   (inst sub esi (fixnumize 1))
 173   (inst rep)
 174   (inst movs :dword)
 175   (inst cld)
 176
 177   ;; Load the register arguments carefully.
 178   (loadw edx ebp-tn (frame-word-offset ocfp-save-offset))
 179
 180   ;; Restore OLD-FP and ECX.
 181   (inst pop ecx)
 182   ;; Overwrites a1
 183   (popw ebp-tn (frame-word-offset ocfp-save-offset))
 184
 185   ;; Blow off the stack above the arguments.
 186   (inst lea esp-tn (make-ea :dword :base edi :disp n-word-bytes))
 187
 188   ;; remaining register args
 189   (inst mov edi edx)
 190   (loadw edx ebp-tn (frame-word-offset 0))
 191   (loadw esi ebp-tn (frame-word-offset 2))
 192
 193   ;; Push the (saved) return-pc so it looks like we just called.
 194   (inst push ebx)
 195
 196   ;; And jump into the function.
 197   (inst jmp (make-ea-for-object-slot eax closure-fun-slot fun-pointer-lowtag))
 198
 199   ;; All the arguments fit in registers, so load them.
 200   REGISTER-ARGS
 201   (loadw edx esi -1)
 202   (loadw edi esi -2)
 203   (loadw esi esi -3)
 204
 205   ;; Clear most of the stack.
 206   (inst lea esp-tn
 207         (make-ea :dword :base ebp-tn :disp (* (- sp->fp-offset 3) n-word-bytes)))
 208
 209   ;; Push the return-pc so it looks like we just called.
 210   (pushw ebp-tn (frame-word-offset return-pc-save-offset))
 211
 212   ;; And away we go.
 213   (inst jmp (make-ea-for-object-slot eax closure-fun-slot fun-pointer-lowtag)))
 214 \f
 215 (define-assembly-routine (throw
 216                           (:return-style :raw))
 217                          ((:arg target (descriptor-reg any-reg) edx-offset)
 218                           (:arg start any-reg ebx-offset)
 219                           (:arg count any-reg ecx-offset)
 220                           (:temp catch any-reg eax-offset))
 221
 222   (declare (ignore start count))
 223
 224   (load-tl-symbol-value catch *current-catch-block*)
 225
 226   LOOP
 227
 228   (let ((error (gen-label)))
 229     (assemble (*elsewhere*)
 230       (emit-label error)
 231
 232       ;; Fake up a stack frame so that backtraces come out right.
 233       (inst push ebp-tn)
 234       (inst mov ebp-tn esp-tn)
 235
 236       (emit-error-break nil error-trap
 237                         (error-number-or-lose 'unseen-throw-tag-error)
 238                         (list target)))
 239     (inst test catch catch)             ; check for NULL pointer
 240     (inst jmp :z error))
 241
 242   (inst cmp target (make-ea-for-object-slot catch catch-block-tag-slot 0))
 243   (inst jmp :e EXIT)
 244
 245   (loadw catch catch catch-block-previous-catch-slot)
 246   (inst jmp LOOP)
 247
 248   EXIT
 249
 250   ;; Here EAX points to catch block containing symbol pointed to by EDX.
 251   ;; An extra RET gets stuffed after the JMP, but oh well. You can't just change
 252   ;; the :return-style to :none because that also affects the call sequence.
 253   (inst jmp (make-fixup 'unwind :assembly-routine)))
 254
 255 ;;;; non-local exit noise
 256
 257 #!-win32
 258 (define-assembly-routine (unwind
 259                           (:return-style :none)
 260                           (:translate %continue-unwind)
 261                           (:policy :fast-safe))
 262                          ((:arg block (any-reg descriptor-reg) eax-offset)
 263                           (:arg start (any-reg descriptor-reg) ebx-offset)
 264                           (:arg count (any-reg descriptor-reg) ecx-offset)
 265                           (:temp uwp unsigned-reg esi-offset))
 266   (declare (ignore start count))
 267
 268   (let ((error (generate-error-code nil 'invalid-unwind-error)))
 269     (inst test block block)             ; check for NULL pointer
 270     (inst jmp :z error))
 271
 272   (load-tl-symbol-value uwp *current-unwind-protect-block*)
 273
 274   ;; Does *CURRENT-UNWIND-PROTECT-BLOCK* match the value stored in
 275   ;; argument's CURRENT-UWP-SLOT?
 276   (inst cmp uwp
 277         (make-ea-for-object-slot block unwind-block-current-uwp-slot 0))
 278   ;; If a match, return to context in arg block.
 279   (inst jmp :e DO-EXIT)
 280
 281   ;; Not a match - return to *CURRENT-UNWIND-PROTECT-BLOCK* context.
 282   ;; Important! Must save (and return) the arg 'block' for later use!!
 283   (move edx-tn block)
 284   (move block uwp)
 285   ;; Set next unwind protect context.
 286   (loadw uwp uwp unwind-block-current-uwp-slot)
 287   ;; we're about to reload ebp anyway, so let's borrow it here as a
 288   ;; temporary.  Hope this works
 289   (store-tl-symbol-value uwp *current-unwind-protect-block* ebp-tn)
 290
 291   DO-EXIT
 292
 293   (loadw ebp-tn block unwind-block-current-cont-slot)
 294
 295   ;; Uwp-entry expects some things in known locations so that they can
 296   ;; be saved on the stack: the block in edx-tn, start in ebx-tn, and
 297   ;; count in ecx-tn.
 298
 299   (inst jmp (make-ea-for-object-slot block unwind-block-entry-pc-slot 0)))
 300
 301
 302 ;;;; Win32 non-local exit noise
 303
 304 #!+win32
 305 (define-assembly-routine (unwind
 306                           (:return-style :none)
 307                           (:policy :fast-safe))
 308                          ((:arg block (any-reg descriptor-reg) eax-offset)
 309                           (:arg start (any-reg descriptor-reg) ebx-offset)
 310                           (:arg count (any-reg descriptor-reg) ecx-offset))
 311   (declare (ignore start count))
 312
 313   (let ((error (generate-error-code nil 'invalid-unwind-error)))
 314     (inst test block block)             ; check for NULL pointer
 315     (inst jmp :z error))
 316
 317   ;; Save all our registers, as we're about to clobber them.
 318   (inst pusha)
 319
 320   ;; Find the SEH frame surrounding our target.
 321   (loadw ecx-tn block unwind-block-next-seh-frame-slot)
 322
 323   ;; This section copied from VOP CALL-OUT.
 324   ;; Setup the NPX for C; all the FP registers need to be
 325   ;; empty; pop them all.
 326   (dotimes (i 8)
 327     (inst fstp fr0-tn))
 328
 329   ;; ABI requires this
 330   (inst cld)
 331   (inst push ebp-tn)
 332   (inst mov ebp-tn esp-tn)
 333
 334   ;; Actually call out for the unwind.
 335   (inst push 0)
 336   (inst push 0)
 337   (inst push 0)
 338   (inst push ecx-tn)
 339
 340   (inst call (make-fixup "RtlUnwind" :foreign))
 341
 342   (inst pop ebp-tn)
 343   ;; This section based on VOP CALL-OUT.
 344   ;; Restore the NPX for lisp; ensure no regs are empty
 345   (dotimes (i 8)
 346     (inst fldz))
 347
 348   ;; Restore our regs.
 349   (inst popa)
 350
 351   ;; By now we've unwound all the UWP frames required, so we
 352   ;; just jump to our target block.
 353   (loadw ebp-tn block unwind-block-current-cont-slot)
 354
 355   ;; Nlx-entry expects the arg start in ebx-tn and the arg count
 356   ;; in ecx-tn.  Fortunately, that's where they are already.
 357   (inst jmp (make-ea-for-object-slot block unwind-block-entry-pc-slot 0)))
 358
 359 ;;;; Win32 UWP block SEH interface.
 360
 361 ;; We want no VOP for this one and for it to only happen on Win32
 362 ;; targets.  Hence the following disaster.
 363 #!+#.(cl:if (cl:member sb-assembling cl:*features*) win32 '(or))
 364 (define-assembly-routine
 365     (uwp-seh-handler (:return-style :none))
 366     ((:temp block unsigned-reg eax-offset))
 367
 368   ;; We get called for any exception which happens within our
 369   ;; dynamic contour that isn't handled below us, and for
 370   ;; unwinding.
 371
 372   ;; For the exceptions we just return ExceptionContinueSearch.
 373
 374   ;; Find the exception record.
 375   (inst mov eax-tn (make-ea :dword :base esp-tn :disp 4))
 376
 377   ;; Check unwind flags.
 378   (inst test (make-ea :byte :base eax-tn :disp 4) 6) ; EH_UNWINDING | EH_EXIT_UNWIND
 379
 380   ;; To see if we're unwinding or not.
 381   (inst jmp :nz UNWINDING)
 382
 383   ;; We're not unwinding, so we're not interested.
 384   (inst mov eax-tn 1) ;; exception-continue-search
 385   (inst ret)
 386
 387   ;; For the unwinds we establish a basic environment as per
 388   ;; call_into_lisp, but without the extra SEH frame (the theory
 389   ;; being that we're already in a Lisp SEH context), and invoke
 390   ;; our UWP block to unwind itself.
 391
 392   ;; FIXME: Do we need to establish an SEH frame anyway?  And do
 393   ;; we need to do the same stack frame hackery for the debugger
 394   ;; as we do for the main exception handler?
 395
 396   ;; When the UWP block calls %continue-unwind, we come back to
 397   ;; the next assembly routine, below, which reinitializes for C
 398   ;; and returns to the Win32 unwind machinery.
 399
 400   ;; If the UWP block sees fit to do a non-local exit, things
 401   ;; Just Work, thanks to the Win32 API being sanely designed
 402   ;; and our complying with it.
 403
 404   ;; We also must update *current-unwind-protect-block* before
 405   ;; calling the cleanup function.
 406
 407   UNWINDING
 408
 409   ;; Save all registers (overkill)
 410   (inst pusha)
 411
 412   ;; Establish our stack frame.
 413   (inst mov ebp-tn esp-tn)
 414
 415   ;; This section based on VOP CALL-OUT.
 416   ;; Restore the NPX for lisp; ensure no regs are empty
 417   (dotimes (i 8)
 418     (inst fldz))
 419
 420   ;; Find our unwind-block by way of our SEH frame.
 421   (inst mov block (make-ea :dword :base ebp-tn :disp #x28))
 422   (inst lea block (make-ea :dword :base block
 423                            :disp (- (* unwind-block-next-seh-frame-slot
 424                                        n-word-bytes))))
 425
 426   ;; Update *CURRENT-UNWIND-PROTECT-BLOCK*.
 427   (loadw ebx-tn block unwind-block-current-uwp-slot)
 428   (store-tl-symbol-value ebx-tn *current-unwind-protect-block* ecx-tn)
 429
 430   ;; Uwp-entry expects some things in known locations so that they can
 431   ;; be saved on the stack: the block in edx-tn, start in ebx-tn, and
 432   ;; count in ecx-tn.  We don't actually have any of that here, but we
 433   ;; do need to have access to our own stack frame, so we hijack the
 434   ;; known locations to cover our own state.
 435
 436   (inst xor ebx-tn ebx-tn)
 437   (inst xor ecx-tn ecx-tn)
 438   (inst mov ebx-tn ebp-tn)
 439   (loadw ebp-tn block unwind-block-current-cont-slot)
 440   (inst jmp (make-ea-for-object-slot block unwind-block-entry-pc-slot 0)))
 441
 442 #!+win32
 443 (define-assembly-routine (continue-unwind
 444                           (:return-style :none)
 445                           (:translate %continue-unwind)
 446                           (:policy :fast-safe))
 447                          ((:arg block (any-reg descriptor-reg) eax-offset)
 448                           (:arg start (any-reg descriptor-reg) ebx-offset)
 449                           (:arg count (any-reg descriptor-reg) ecx-offset))
 450   (declare (ignore block count))
 451   ;; The args here are mostly ignored because we're using the
 452   ;; win32 unwind mechanism and keep all that elsewhere.  The
 453   ;; exception is START, which we use to pass the saved EBP for
 454   ;; our exception handler.
 455
 456   ;; "All" we have to do here is reload our EBP, reestablish a C
 457   ;; environment, and return ExceptionContinueSearch.  The OS
 458   ;; handles the rest.
 459
 460   ;; Restore our frame pointer.
 461   (inst mov esp-tn start)
 462
 463   ;; This section copied from VOP CALL-OUT.
 464   ;; Setup the NPX for C; all the FP registers need to be
 465   ;; empty; pop them all.
 466   (dotimes (i 8)
 467     (inst fstp fr0-tn))
 468
 469   ;; I'm unlikely to ever forget this again.
 470   (inst cld)
 471
 472   ;; Restore our saved registers
 473   (inst popa)
 474
 475   ;; And we're done.
 476   (inst mov eax-tn 1) ;; exception-continue-search
 477   (inst ret))