libphobos/src/std/math/hardware.d

   1 // Written in the D programming language.
   2
   3 /**
   4 This is a submodule of $(MREF std, math).
   5
   6 It contains hardware support for floating point numbers.
   7
   8 Copyright: Copyright The D Language Foundation 2000 - 2011.
   9 License:   $(HTTP www.boost.org/LICENSE_1_0.txt, Boost License 1.0).
  10 Authors:   $(HTTP digitalmars.com, Walter Bright), Don Clugston,
  11            Conversion of CEPHES math library to D by Iain Buclaw and David Nadlinger
  12 Source: $(PHOBOSSRC std/math/hardware.d)
  13  */
  14
  15 /* NOTE: This file has been patched from the original DMD distribution to
  16  * work with the GDC compiler.
  17  */
  18 module std.math.hardware;
  19
  20 static import core.stdc.fenv;
  21
  22 version (X86)       version = X86_Any;
  23 version (X86_64)    version = X86_Any;
  24 version (PPC)       version = PPC_Any;
  25 version (PPC64)     version = PPC_Any;
  26 version (MIPS32)    version = MIPS_Any;
  27 version (MIPS64)    version = MIPS_Any;
  28 version (AArch64)   version = ARM_Any;
  29 version (ARM)       version = ARM_Any;
  30 version (S390)      version = IBMZ_Any;
  31 version (SPARC)     version = SPARC_Any;
  32 version (SPARC64)   version = SPARC_Any;
  33 version (SystemZ)   version = IBMZ_Any;
  34 version (RISCV32)   version = RISCV_Any;
  35 version (RISCV64)   version = RISCV_Any;
  36 version (LoongArch64)   version = LoongArch_Any;
  37
  38 version (D_InlineAsm_X86)    version = InlineAsm_X86_Any;
  39 version (D_InlineAsm_X86_64) version = InlineAsm_X86_Any;
  40 // SSE is taken as always present on x86-64, and on 32-bit x86 when targeting OSX.
  41 version (X86_64) version = StaticallyHaveSSE;
  42 version (X86) version (OSX) version = StaticallyHaveSSE;
  43 // `haveSSE` is the constant `true` in that case; on other 32-bit x86 targets it aliases core.cpuid.sse.
  44 version (StaticallyHaveSSE)
  45 {
  46     private enum bool haveSSE = true;
  47 }
  48 else version (X86)
  49 {
  50     static import core.cpuid;
  51     private alias haveSSE = core.cpuid.sse;
  52 }
  53
  54 version (D_SoftFloat)
  55 {
  56     // Some soft float implementations may support IEEE floating flags.
  57     // The implementation here supports hardware flags only and is so currently
  58     // only available for supported targets.
  59 }
  60 else version (X86_Any)   version = IeeeFlagsSupport;
  61 else version (PPC_Any)   version = IeeeFlagsSupport;
  62 else version (RISCV_Any) version = IeeeFlagsSupport;
  63 else version (MIPS_Any)  version = IeeeFlagsSupport;
  64 else version (LoongArch_Any) version = IeeeFlagsSupport;
  65 else version (ARM_Any)   version = IeeeFlagsSupport;
  66
  67 // Struct FloatingPointControl is only available if hardware FP units are available.
  68 version (D_HardFloat)
  69 {
  70     // FloatingPointControl.clearExceptions() depends on version IeeeFlagsSupport
  71     version (IeeeFlagsSupport) version = FloatingPointControlSupport;
  72 }
  73
  74 version (IeeeFlagsSupport)
  75 {
  76
  77 /** IEEE exception status flags ('sticky bits')
  78
  79  These flags indicate that an exceptional floating-point condition has occurred.
  80  They indicate that a NaN or an infinity has been generated, that a result
  81  is inexact, or that a signalling NaN has been encountered. If floating-point
  82  exceptions are enabled (unmasked), a hardware exception will be generated
  83  instead of setting these flags.
  84  */
  85 struct IeeeFlags
  86 {
  87 nothrow @nogc:
  88
  89 private:
  90     // The x87 FPU status register is 16 bits.
  91     // The Pentium SSE2 status register is 32 bits.
  92     // The ARM and PowerPC FPSCR is a 32-bit register.
  93     // The SPARC FSR is a 32-bit register (64 bits for SPARC 7 & 8, but high bits are uninteresting).
  94     // The RISC-V (32 & 64 bit) fcsr is a 32-bit register.
  95     // The LoongArch fcsr (fcsr0) is a 32-bit register.
  96     uint flags;
  97
  98     version (CRuntime_Microsoft)
  99     {
 100         // Microsoft uses hardware-incompatible custom constants in fenv.h (core.stdc.fenv).
 101         // Applies to both x87 status word (16 bits) and SSE2 status word(32 bits).
 102         enum : int
 103         {
 104             INEXACT_MASK   = 0x20,
 105             UNDERFLOW_MASK = 0x10,
 106             OVERFLOW_MASK  = 0x08,
 107             DIVBYZERO_MASK = 0x04,
 108             INVALID_MASK   = 0x01,
 109
 110             EXCEPTIONS_MASK = 0b11_1111
 111         }
 112         // Don't bother about subnormals, they are not supported on most CPUs.
 113         //  SUBNORMAL_MASK = 0x02;
 114     }
 115     else
 116     {
 117         enum : int
 118         {
 119             INEXACT_MASK    = core.stdc.fenv.FE_INEXACT,
 120             UNDERFLOW_MASK  = core.stdc.fenv.FE_UNDERFLOW,
 121             OVERFLOW_MASK   = core.stdc.fenv.FE_OVERFLOW,
 122             DIVBYZERO_MASK  = core.stdc.fenv.FE_DIVBYZERO,
 123             INVALID_MASK    = core.stdc.fenv.FE_INVALID,
 124             EXCEPTIONS_MASK = core.stdc.fenv.FE_ALL_EXCEPT,
 125         }
 126     }
 127     // Reads the sticky exception bits from the hardware status register(s) of the current target.
 128     static uint getIeeeFlags() @trusted pure
 129     {
 130         version (GNU)
 131         {
 132             version (X86_Any)
 133             {
 134                 ushort sw;
 135                 asm pure nothrow @nogc
 136                 {
 137                     "fstsw %0" : "=a" (sw);
 138                 }
 139                 // OR the result with the SSE2 status register (MXCSR).
 140                 if (haveSSE)
 141                 {
 142                     uint mxcsr;
 143                     asm pure nothrow @nogc
 144                     {
 145                         "stmxcsr %0" : "=m" (mxcsr);
 146                     }
 147                     return (sw | mxcsr) & EXCEPTIONS_MASK;
 148                 }
 149                 else
 150                     return sw & EXCEPTIONS_MASK;
 151             }
 152             else version (ARM)
 153             {
 154                 version (ARM_SoftFloat)
 155                     return 0; // soft-float build: always reports no flags
 156                 else
 157                 {
 158                     uint result = void;
 159                     asm pure nothrow @nogc
 160                     {
 161                         "vmrs %0, FPSCR; and %0, %0, #0x1F;" : "=r" (result);
 162                     }
 163                     return result;
 164                 }
 165             }
 166             else version (RISCV_Any)
 167             {
 168                 version (D_SoftFloat)
 169                     return 0; // soft-float build: always reports no flags
 170                 else
 171                 {
 172                     uint result = void;
 173                     asm pure nothrow @nogc
 174                     {
 175                         "frflags %0" : "=r" (result);
 176                     }
 177                     return result;
 178                 }
 179             }
 180             else
 181                 assert(0, "Not yet supported");
 182         }
 183         else
 184         version (InlineAsm_X86_Any)
 185         {
 186             ushort sw;
 187             asm pure nothrow @nogc { fstsw sw; }
 188
 189             // OR the result with the SSE2 status register (MXCSR).
 190             if (haveSSE)
 191             {
 192                 uint mxcsr;
 193                 asm pure nothrow @nogc { stmxcsr mxcsr; }
 194                 return (sw | mxcsr) & EXCEPTIONS_MASK;
 195             }
 196             else return sw & EXCEPTIONS_MASK;
 197         }
 198         else version (SPARC)
 199         {
 200             /*
 201                int retval;
 202                asm pure nothrow @nogc { st %fsr, retval; }
 203                return retval;
 204             */
 205             assert(0, "Not yet supported");
 206         }
 207         else version (ARM)
 208         {
 209             assert(false, "Not yet supported.");
 210         }
 211         else version (RISCV_Any)
 212         {
 213             mixin(`
 214             uint result = void;
 215             asm pure nothrow @nogc
 216             {
 217                 "frflags %0" : "=r" (result);
 218             }
 219             return result;
 220             `);
 221         }
 222         else version (LoongArch_Any)
 223         {
 224             uint result = void;
 225             asm pure nothrow @nogc
 226             {
 227                 "movfcsr2gr %0,$r2" : "=r" (result);
 228             }
 229             return result & EXCEPTIONS_MASK;
 230         }
 231         else
 232             assert(0, "Not yet supported");
 233     }
 234     // Clears the exception bits in the same status register(s); unsupported targets hit assert(0).
 235     static void resetIeeeFlags() @trusted
 236     {
 237         version (GNU)
 238         {
 239             version (X86_Any)
 240             {
 241                 asm nothrow @nogc
 242                 {
 243                     "fnclex";
 244                 }
 245
 246                 // Also clear exception flags in MXCSR, SSE's control register.
 247                 if (haveSSE)
 248                 {
 249                     uint mxcsr;
 250                     asm nothrow @nogc
 251                     {
 252                         "stmxcsr %0" : "=m" (mxcsr);
 253                     }
 254                     mxcsr &= ~EXCEPTIONS_MASK;
 255                     asm nothrow @nogc
 256                     {
 257                         "ldmxcsr %0" : : "m" (mxcsr);
 258                     }
 259                 }
 260             }
 261             else version (ARM)
 262             {
 263                 version (ARM_SoftFloat)
 264                     return; // soft-float build: nothing to clear
 265                 else
 266                 {
 267                     uint old = FloatingPointControl.getControlState();
 268                     old &= ~0b11111; // http://infocenter.arm.com/help/topic/com.arm.doc.ddi0408i/Chdfifdc.html
 269                     asm nothrow @nogc
 270                     {
 271                         "vmsr FPSCR, %0" : : "r" (old);
 272                     }
 273                 }
 274             }
 275             else version (RISCV_Any)
 276             {
 277                 version (D_SoftFloat)
 278                     return; // soft-float build: nothing to clear
 279                 else
 280                 {
 281                     uint newValues = 0x0; // all flag bits written as zero
 282                     asm nothrow @nogc
 283                     {
 284                         "fsflags %0" : : "r" (newValues);
 285                     }
 286                 }
 287             }
 288             else
 289                 assert(0, "Not yet supported");
 290         }
 291         else
 292         version (InlineAsm_X86_Any)
 293         {
 294             asm nothrow @nogc
 295             {
 296                 fnclex;
 297             }
 298
 299             // Also clear exception flags in MXCSR, SSE's control register.
 300             if (haveSSE)
 301             {
 302                 uint mxcsr;
 303                 asm nothrow @nogc { stmxcsr mxcsr; }
 304                 mxcsr &= ~EXCEPTIONS_MASK;
 305                 asm nothrow @nogc { ldmxcsr mxcsr; }
 306             }
 307         }
 308         else version (RISCV_Any)
 309         {
 310             mixin(`
 311             uint newValues = 0x0;
 312             asm pure nothrow @nogc
 313             {
 314                 "fsflags %0" : : "r" (newValues);
 315             }
 316             `);
 317         }
 318         else version (LoongArch_Any)
 319         {
 320             asm nothrow @nogc
 321             {
 322                 "movgr2fcsr $r2,$r0";
 323             }
 324         }
 325         else
 326         {
 327             /* SPARC:
 328               int tmpval;
 329               asm pure nothrow @nogc { st %fsr, tmpval; }
 330               tmpval &=0xFFFF_FC00;
 331               asm pure nothrow @nogc { ld tmpval, %fsr; }
 332             */
 333            assert(0, "Not yet supported");
 334         }
 335     }
 336
 337 public:
 338     /**
 339      * The result cannot be represented exactly, so rounding occurred.
 340      * Example: `x = sin(0.1);`
 341      */
 342     @property bool inexact() @safe const { return (flags & INEXACT_MASK) != 0; }
 343
 344     /**
 345      * A zero was generated by underflow.
 346      * Example: `x = real.min*real.epsilon/2;`
 347      */
 348     @property bool underflow() @safe const { return (flags & UNDERFLOW_MASK) != 0; }
 349
 350     /**
 351      * An infinity was generated by overflow.
 352      * Example: `x = real.max*2;`
 353      */
 354     @property bool overflow() @safe const { return (flags & OVERFLOW_MASK) != 0; }
 355
 356     /**
 357      * An infinity was generated by division by zero.
 358      * Example: `x = 3/0.0;`
 359      */
 360     @property bool divByZero() @safe const { return (flags & DIVBYZERO_MASK) != 0; }
 361
 362     /**
 363      * A machine NaN was generated.
 364      * Example: `x = real.infinity * 0.0;`
 365      */
 366     @property bool invalid() @safe const { return (flags & INVALID_MASK) != 0; }
 367 }
 368
 369 ///
 370 version (StdDdoc)
 371 @safe unittest
 372 {
 373     import std.math.traits : isNaN;
 374     // Helper that performs integer arithmetic only.
 375     static void func() {
 376         int a = 10 * 10;
 377     }
 378     real a = 3.5;
 379     // Set all the flags to zero
 380     resetIeeeFlags();
 381     assert(!ieeeFlags.divByZero);
 382     // Perform a division by zero.
 383     a /= 0.0L;
 384     assert(a == real.infinity);
 385     assert(ieeeFlags.divByZero);
 386     // Create a NaN: infinity times zero is an invalid operation.
 387     a *= 0.0L;
 388     assert(ieeeFlags.invalid);
 389     assert(isNaN(a));
 390
 391     // Check that calling func() has no effect on the
 392     // status flags.
 393     IeeeFlags f = ieeeFlags;
 394     func();
 395     assert(ieeeFlags == f);
 396 }
 397
 398 @safe unittest
 399 {
 400     import std.math.traits : isNaN;
 401     // Same scenario as the documented example, with `/=` and `*=` replaced by forceDivOp/forceMulOp.
 402     static void func() {
 403         int a = 10 * 10;
 404     }
 405     real a = 3.5;
 406     // Set all the flags to zero
 407     resetIeeeFlags();
 408     assert(!ieeeFlags.divByZero);
 409     // Perform a division by zero.
 410     a = forceDivOp(a, 0.0L); // NOTE(review): presumably forces the division to happen at run time - confirm
 411     assert(a == real.infinity);
 412     assert(ieeeFlags.divByZero);
 413     // Create a NaN: infinity times zero is an invalid operation.
 414     a = forceMulOp(a, 0.0L);
 415     assert(ieeeFlags.invalid);
 416     assert(isNaN(a));
 417
 418     // Check that calling func() has no effect on the
 419     // status flags.
 420     IeeeFlags f = ieeeFlags;
 421     func();
 422     assert(ieeeFlags == f);
 423 }
 424
 425 @safe unittest
 426 {
 427     import std.meta : AliasSeq;
 428     // Pairs an operation expected to raise one flag with the accessor that reads that flag.
 429     static struct Test
 430     {
 431         void delegate() @trusted action;
 432         bool function() @trusted ieeeCheck;
 433     }
 434     // Run the whole table once for each floating-point type.
 435     static foreach (T; AliasSeq!(float, double, real))
 436     {{
 437         T x; // Needs to be here to avoid `call without side effects` warning.
 438         auto tests = [
 439             Test(
 440                 () { x = forceAddOp!T(1, 0.1L); },
 441                 () => ieeeFlags.inexact
 442             ),
 443             Test(
 444                 () { x = forceDivOp!T(T.min_normal, T.max); },
 445                 () => ieeeFlags.underflow
 446             ),
 447             Test(
 448                 () { x = forceAddOp!T(T.max, T.max); },
 449                 () => ieeeFlags.overflow
 450             ),
 451             Test(
 452                 () { x = forceDivOp!T(1, 0); },
 453                 () => ieeeFlags.divByZero
 454             ),
 455             Test(
 456                 () { x = forceDivOp!T(0, 0); },
 457                 () => ieeeFlags.invalid
 458             )
 459         ];
 460         foreach (test; tests)
 461         {
 462             resetIeeeFlags(); // start every case from cleared flags
 463             assert(!test.ieeeCheck()); // flag must be clear before the operation
 464             test.action();
 465             assert(test.ieeeCheck()); // and set afterwards
 466         }
 467     }}
 468 }
 469
 470 /// Set all of the floating-point status flags to false.
 471 void resetIeeeFlags() @trusted nothrow @nogc
 472 {
 473     IeeeFlags.resetIeeeFlags(); // forwards to the private per-architecture implementation
 474 }
 475
 476 ///
 477 version (StdDdoc)
 478 @safe unittest
 479 {
 480     resetIeeeFlags();
 481     real a = 3.5;
 482     a /= 0.0L;
 483     assert(a == real.infinity);
 484     assert(ieeeFlags.divByZero);
 485     // A second reset must clear the flag raised by the division.
 486     resetIeeeFlags();
 487     assert(!ieeeFlags.divByZero);
 488 }
 489
 490 @safe unittest
 491 {
 492     resetIeeeFlags();
 493     real a = 3.5;
 494     a = forceDivOp(a, 0.0L);
 495     assert(a == real.infinity);
 496     assert(ieeeFlags.divByZero);
 497     // A second reset must clear the flag raised by the division.
 498     resetIeeeFlags();
 499     assert(!ieeeFlags.divByZero);
 500 }
 501
 502 /// Returns: snapshot of the current state of the floating-point status flags
 503 @property IeeeFlags ieeeFlags() @trusted pure nothrow @nogc
 504 {
 505    return IeeeFlags(IeeeFlags.getIeeeFlags()); // wrap the raw status bits in the accessor struct
 506 }
 507
 508 ///
 509 version (StdDdoc)
 510 @safe nothrow unittest
 511 {
 512     import std.math.traits : isNaN;
 513
 514     resetIeeeFlags();
 515     real a = 3.5;
 516     // Dividing a finite value by zero yields infinity and raises divByZero.
 517     a /= 0.0L;
 518     assert(a == real.infinity);
 519     assert(ieeeFlags.divByZero);
 520     // Multiplying that infinity by zero yields NaN and raises invalid.
 521     a *= 0.0L;
 522     assert(isNaN(a));
 523     assert(ieeeFlags.invalid);
 524 }
 525
 526 @safe nothrow unittest
 527 {
 528     import std.math.traits : isNaN;
 529
 530     resetIeeeFlags();
 531     real a = 3.5;
 532     // Dividing a finite value by zero yields infinity and raises divByZero.
 533     a = forceDivOp(a, 0.0L);
 534     assert(a == real.infinity);
 535     assert(ieeeFlags.divByZero);
 536     // Multiplying that infinity by zero yields NaN and raises invalid.
 537     a = forceMulOp(a, 0.0L);
 538     assert(isNaN(a));
 539     assert(ieeeFlags.invalid);
 540 }
 541
 542 } // IeeeFlagsSupport
 543
 544
 545 version (FloatingPointControlSupport)
 546 {
 547
 548 /** Control the Floating point hardware
 549
 550   Change the IEEE754 floating-point rounding mode and the floating-point
 551   hardware exceptions.
 552
 553   By default, the rounding mode is roundToNearest and all hardware exceptions
 554   are disabled. For most applications, debugging is easier if the $(I division
 555   by zero), $(I overflow), and $(I invalid operation) exceptions are enabled.
 556   These three are combined into a $(I severeExceptions) value for convenience.
 557   Note in particular that if $(I invalidException) is enabled, a hardware trap
 558   will be generated whenever an uninitialized floating-point variable is used.
 559
 560   All changes are temporary. The previous state is restored at the
 561   end of the scope.
 562
 563
 564 Example:
 565 ----
 566 {
 567     FloatingPointControl fpctrl;
 568
 569     // Enable hardware exceptions for division by zero, overflow to infinity,
 570     // invalid operations, and uninitialized floating-point variables.
 571     fpctrl.enableExceptions(FloatingPointControl.severeExceptions);
 572
 573     // This will generate a hardware exception, if x is a
 574     // default-initialized floating point variable:
 575     real x; // Add `= 0` or even `= real.nan` to not throw the exception.
 576     real y = x * 3.0;
 577
 578     // The exception is only thrown for default-uninitialized NaN-s.
 579     // NaN-s with other payload are valid:
 580     real z = y * real.nan; // ok
 581
 582     // The set hardware exceptions and rounding modes will be disabled when
 583     // leaving this scope.
 584 }
 585 ----
 586
 587  */
 588 struct FloatingPointControl
 589 {
 590 nothrow @nogc:
 591
 592     alias RoundingMode = uint; ///
 593
 594     version (StdDdoc)
 595     {
 596         enum : RoundingMode
 597         {
 598             /** IEEE rounding modes.
 599              * The default mode is roundToNearest.
 600              *
 601              *  roundingMask = A mask of all rounding modes.
 602              */
 603             roundToNearest,
 604             roundDown, /// ditto
 605             roundUp, /// ditto
 606             roundToZero, /// ditto
 607             roundingMask, /// ditto
 608         }
 609     }
 610     else version (CRuntime_Microsoft)
 611     {
 612         // Microsoft uses hardware-incompatible custom constants in fenv.h (core.stdc.fenv).
 613         enum : RoundingMode
 614         {
 615             roundToNearest = 0x0000,
 616             roundDown      = 0x0400,
 617             roundUp        = 0x0800,
 618             roundToZero    = 0x0C00,
 619             roundingMask   = roundToNearest | roundDown
 620                              | roundUp | roundToZero,
 621         }
 622     }
 623     else
 624     {
 625         enum : RoundingMode
 626         {
 627             roundToNearest = core.stdc.fenv.FE_TONEAREST,
 628             roundDown      = core.stdc.fenv.FE_DOWNWARD,
 629             roundUp        = core.stdc.fenv.FE_UPWARD,
 630             roundToZero    = core.stdc.fenv.FE_TOWARDZERO,
 631             roundingMask   = roundToNearest | roundDown
 632                              | roundUp | roundToZero,
 633         }
 634     }
 635
 636     /***
 637      * Change the floating-point hardware rounding mode
 638      *
 639      * Changing the rounding mode in the middle of a function can interfere
 640      * with optimizations of floating point expressions, as the optimizer assumes
 641      * that the rounding mode does not change.
 642      * It is best to change the rounding mode only at the
 643      * beginning of the function, and keep it until the function returns.
 644      * It is also best to add the line:
 645      * ---
 646      * pragma(inline, false);
 647      * ---
 648      * as the first line of the function so it will not get inlined.
 649      * Params:
 650      *    newMode = the new rounding mode
 651      */
 652     @property void rounding(RoundingMode newMode) @trusted
 653     { // `-1 - roundingMask` is the bitwise complement of roundingMask: clear the old mode bits, then insert the new ones.
 654         initialize(); // no-op after the first call; records the state that ~this restores
 655         setControlState((getControlState() & (-1 - roundingMask)) | (newMode & roundingMask));
 656     }
 657
 658     /// Returns: the currently active rounding mode
 659     @property static RoundingMode rounding() @trusted pure
 660     {
 661         return cast(RoundingMode)(getControlState() & roundingMask); // keep only the rounding-mode bits
 662     }
 663
 664     alias ExceptionMask = uint; ///
 665
 666     version (StdDdoc)
 667     {
 668         enum : ExceptionMask
 669         {
 670             /** IEEE hardware exceptions.
 671              *  By default, all exceptions are masked (disabled).
 672              *
 673              *  severeExceptions = The overflow, division by zero, and invalid
 674              *  exceptions.
 675              */
 676             subnormalException,
 677             inexactException, /// ditto
 678             underflowException, /// ditto
 679             overflowException, /// ditto
 680             divByZeroException, /// ditto
 681             invalidException, /// ditto
 682             severeExceptions, /// ditto
 683             allExceptions, /// ditto
 684         }
 685     }
 686     else version (ARM_Any)
 687     {
 688         enum : ExceptionMask
 689         {
 690             subnormalException    = 0x8000,
 691             inexactException      = 0x1000,
 692             underflowException    = 0x0800,
 693             overflowException     = 0x0400,
 694             divByZeroException    = 0x0200,
 695             invalidException      = 0x0100,
 696             severeExceptions   = overflowException | divByZeroException
 697                                  | invalidException,
 698             allExceptions      = severeExceptions | underflowException
 699                                  | inexactException | subnormalException,
 700         }
 701     }
 702     else version (PPC_Any)
 703     {
 704         enum : ExceptionMask
 705         {
 706             inexactException      = 0x0008,
 707             divByZeroException    = 0x0010,
 708             underflowException    = 0x0020,
 709             overflowException     = 0x0040,
 710             invalidException      = 0x0080,
 711             severeExceptions   = overflowException | divByZeroException
 712                                  | invalidException,
 713             allExceptions      = severeExceptions | underflowException
 714                                  | inexactException,
 715         }
 716     }
 717     else version (RISCV_Any)
 718     {
 719         enum : ExceptionMask
 720         {
 721             inexactException      = 0x01,
 722             divByZeroException    = 0x08,
 723             underflowException    = 0x02,
 724             overflowException     = 0x04,
 725             invalidException      = 0x10,
 726             severeExceptions   = overflowException | divByZeroException
 727                                  | invalidException,
 728             allExceptions      = severeExceptions | underflowException
 729                                  | inexactException,
 730         }
 731     }
 732     else version (HPPA)
 733     {
 734         enum : ExceptionMask
 735         {
 736             inexactException      = 0x01,
 737             underflowException    = 0x02,
 738             overflowException     = 0x04,
 739             divByZeroException    = 0x08,
 740             invalidException      = 0x10,
 741             severeExceptions   = overflowException | divByZeroException
 742                                  | invalidException,
 743             allExceptions      = severeExceptions | underflowException
 744                                  | inexactException,
 745         }
 746     }
 747     else version (LoongArch_Any)
 748     {
 749         enum : ExceptionMask // Trap-enable bits of the LoongArch FCSR0 "Enables" field (bits 4:0).
 750         {
 751             inexactException      = 0x01, // bit 0 (I); was 0x00, which made enabling it a no-op
 752             divByZeroException    = 0x08, // bit 3 (Z)
 753             overflowException     = 0x04, // bit 2 (O)
 754             underflowException    = 0x02, // bit 1 (U)
 755             invalidException      = 0x10, // bit 4 (V)
 756             severeExceptions   = overflowException | divByZeroException
 757                                  | invalidException,
 758             allExceptions      = severeExceptions | underflowException
 759                                  | inexactException,
 760         }
 761     }
 762     else version (MIPS_Any)
 763     {
 764         enum : ExceptionMask
 765         {
 766             inexactException      = 0x0080,
 767             divByZeroException    = 0x0400,
 768             overflowException     = 0x0200,
 769             underflowException    = 0x0100,
 770             invalidException      = 0x0800,
 771             severeExceptions   = overflowException | divByZeroException
 772                                  | invalidException,
 773             allExceptions      = severeExceptions | underflowException
 774                                  | inexactException,
 775         }
 776     }
 777     else version (SPARC_Any)
 778     {
 779         enum : ExceptionMask
 780         {
 781             inexactException      = 0x0800000,
 782             divByZeroException    = 0x1000000,
 783             overflowException     = 0x4000000,
 784             underflowException    = 0x2000000,
 785             invalidException      = 0x8000000,
 786             severeExceptions   = overflowException | divByZeroException
 787                                  | invalidException,
 788             allExceptions      = severeExceptions | underflowException
 789                                  | inexactException,
 790         }
 791     }
 792     else version (IBMZ_Any)
 793     {
 794         enum : ExceptionMask
 795         {
 796             inexactException      = 0x08000000,
 797             divByZeroException    = 0x40000000,
 798             overflowException     = 0x20000000,
 799             underflowException    = 0x10000000,
 800             invalidException      = 0x80000000,
 801             severeExceptions   = overflowException | divByZeroException
 802                                  | invalidException,
 803             allExceptions      = severeExceptions | underflowException
 804                                  | inexactException,
 805         }
 806     }
 807     else version (X86_Any)
 808     {
 809         enum : ExceptionMask
 810         {
 811             inexactException      = 0x20,
 812             underflowException    = 0x10,
 813             overflowException     = 0x08,
 814             divByZeroException    = 0x04,
 815             subnormalException    = 0x02,
 816             invalidException      = 0x01,
 817             severeExceptions   = overflowException | divByZeroException
 818                                  | invalidException,
 819             allExceptions      = severeExceptions | underflowException
 820                                  | inexactException | subnormalException,
 821         }
 822     }
 823     else
 824         static assert(false, "Not implemented for this architecture");
 825
 826     version (ARM_Any)
 827     { // Run-time probe that hasExceptionTraps calls on ARM targets.
 828         static bool hasExceptionTraps_impl() @safe
 829         {
 830             auto oldState = getControlState();
 831             // If exceptions are not supported, we set the bit but read it back as zero
 832             // https://sourceware.org/ml/libc-ports/2012-06/msg00091.html
 833             setControlState(oldState | divByZeroException);
 834             immutable result = (getControlState() & allExceptions) != 0; // true if any trap-enable bit reads back as set
 835             setControlState(oldState); // put the control register back as it was
 836             return result;
 837         }
 838     }
 839
 840     /// Returns: true if the current FPU supports exception trapping
 841     @property static bool hasExceptionTraps() @safe pure
 842     {
 843         version (X86_Any)
 844             return true;
 845         else version (PPC_Any)
 846             return true;
 847         else version (MIPS_Any)
 848             return true;
 849         else version (LoongArch_Any)
 850             return true;
 851         else version (ARM_Any)
 852         {
 853             // The hasExceptionTraps_impl function is basically pure,
 854             // as it restores all global state
 855             auto fptr = ( () @trusted => cast(bool function() @safe
 856                 pure nothrow @nogc)&hasExceptionTraps_impl)();
 857             return fptr();
 858         }
 859         else // NOTE(review): RISCV_Any has an ExceptionMask in this struct but is not listed here, so it reaches this assert - confirm intended
 860             assert(0, "Not yet supported");
 861     }
 862
 863     /// Enable (unmask) specific hardware exceptions. Multiple exceptions may be ORed together.
 864     void enableExceptions(ExceptionMask exceptions) @trusted
 865     {
 866         assert(hasExceptionTraps);
 867         initialize(); // records the original control state on first use
 868         version (X86_Any) // on x86 a set bit masks (disables) the exception, so enabling clears bits
 869             setControlState(getControlState() & ~(exceptions & allExceptions));
 870         else // elsewhere a set bit enables the trap
 871             setControlState(getControlState() | (exceptions & allExceptions));
 872     }
 873
 874     /// Disable (mask) specific hardware exceptions. Multiple exceptions may be ORed together.
 875     void disableExceptions(ExceptionMask exceptions) @trusted
 876     {
 877         assert(hasExceptionTraps);
 878         initialize(); // records the original control state on first use
 879         version (X86_Any) // on x86 a set bit masks (disables) the exception, so disabling sets bits
 880             setControlState(getControlState() | (exceptions & allExceptions));
 881         else // elsewhere a cleared bit disables the trap
 882             setControlState(getControlState() & ~(exceptions & allExceptions));
 883     }
 884
 885     /// Returns: the exceptions which are currently enabled (unmasked)
 886     @property static ExceptionMask enabledExceptions() @trusted pure
 887     {
 888         assert(hasExceptionTraps);
 889         version (X86_Any) // x86 stores mask bits, so invert them to report what is enabled
 890             return (getControlState() & allExceptions) ^ allExceptions;
 891         else
 892             return (getControlState() & allExceptions);
 893     }
 894
 895     ///  Clear all pending exceptions, then restore the original exception state and rounding mode.
 896     ~this() @trusted
 897     {
 898         clearExceptions(); // done unconditionally, even if no setting was ever changed
 899         if (initialized) // savedState is only meaningful once initialize() has run
 900             setControlState(savedState);
 901     }
 902
 903 private:
    // Control state captured by initialize(); the destructor writes it back
    // when `initialized` is set.
    ControlState savedState;

    // Set by initialize() once `savedState` holds a captured value.
    bool initialized = false;

    // Integer type used to hold the value read from / written to the
    // floating-point control register, selected per target architecture.
    // Unlisted architectures are rejected at compile time.
    version (ARM_Any)
    {
        alias ControlState = uint;
    }
    else version (HPPA)
    {
        alias ControlState = uint;
    }
    else version (PPC_Any)
    {
        alias ControlState = uint;
    }
    else version (RISCV_Any)
    {
        alias ControlState = uint;
    }
    else version (LoongArch_Any)
    {
        alias ControlState = uint;
    }
    else version (MIPS_Any)
    {
        alias ControlState = uint;
    }
    else version (SPARC_Any)
    {
        // The only target here with a 64-bit control state.
        alias ControlState = ulong;
    }
    else version (IBMZ_Any)
    {
        alias ControlState = uint;
    }
    else version (X86_Any)
    {
        // The only target here with a 16-bit control state.
        alias ControlState = ushort;
    }
    else
        static assert(false, "Not implemented for this architecture");
 946
 947     void initialize() @safe
 948     {
 949         // BUG: This works around the absence of this() constructors.
 950         if (initialized) return;
 951         clearExceptions();
 952         savedState = getControlState();
 953         initialized = true;
 954     }
 955
 956     // Clear all pending exceptions
 957     static void clearExceptions() @safe
 958     {
 959         version (IeeeFlagsSupport)
 960             resetIeeeFlags();
 961         else
 962             static assert(false, "Not implemented for this architecture");
 963     }
 964
    // Read from the control register
    //
    // Returns the current floating-point control state using the instruction
    // appropriate for the target. Two families of implementations exist:
    // GCC-style extended asm under version (GNU), and DMD-style / mixin asm
    // otherwise. Targets without an implementation hit assert(0) at run time.
    package(std.math) static ControlState getControlState() @trusted pure
    {
        version (GNU)
        {
            version (X86_Any)
            {
                // Store the x87 control word directly into `cont`.
                ControlState cont;
                asm pure nothrow @nogc
                {
                    "fstcw %0" : "=m" (cont);
                }
                return cont;
            }
            else version (AArch64)
            {
                // Read FPCR into a general-purpose register.
                ControlState cont;
                asm pure nothrow @nogc
                {
                    "mrs %0, FPCR;" : "=r" (cont);
                }
                return cont;
            }
            else version (ARM)
            {
                ControlState cont;
                // Soft-float ARM: no register is read, the state is reported as 0.
                version (ARM_SoftFloat)
                   cont = 0;
                else
                {
                    // Read FPSCR into a general-purpose register.
                    asm pure nothrow @nogc
                    {
                        "vmrs %0, FPSCR" : "=r" (cont);
                    }
                }
                return cont;
            }
            else version (RISCV_Any)
            {
                // Soft-float RISC-V: no register is read, the state is reported as 0.
                version (D_SoftFloat)
                    return 0;
                else
                {
                    ControlState cont;
                    asm pure nothrow @nogc
                    {
                        "frcsr %0" : "=r" (cont);
                    }
                    return cont;
                }
            }
            else
                // No GNU-asm implementation for any other target.
                assert(0, "Not yet supported");
        }
        else
        version (D_InlineAsm_X86)
        {
            // NOTE(review): `cont` is declared short although ControlState is
            // ushort on x86, and the xor of EAX does not appear to feed the
            // value returned (cont is read back from memory) - confirm before
            // changing either.
            short cont;
            asm pure nothrow @nogc
            {
                xor EAX, EAX;
                fstcw cont;
            }
            return cont;
        }
        else version (D_InlineAsm_X86_64)
        {
            // Same as the 32-bit variant above, using RAX.
            short cont;
            asm pure nothrow @nogc
            {
                xor RAX, RAX;
                fstcw cont;
            }
            return cont;
        }
        else version (RISCV_Any)
        {
            // The GCC-style asm is wrapped in a string mixin so it is only
            // parsed when this branch is actually selected.
            mixin(`
            ControlState cont;
            asm pure nothrow @nogc
            {
                "frcsr %0" : "=r" (cont);
            }
            return cont;
            `);
        }
        else version (LoongArch_Any)
        {
            ControlState cont;
            asm pure nothrow @nogc
            {
                "movfcsr2gr %0,$r0" : "=r" (cont);
            }
            // Expose only the rounding-mode and exception bits to callers.
            cont &= (roundingMask | allExceptions);
            return cont;
        }
        else
            assert(0, "Not yet supported");
    }
1064
    // Set the control register
    //
    // Writes `newState` to the floating-point control register of the target.
    // On x86 the rounding-mode and exception-mask bits are additionally
    // mirrored into MXCSR when SSE is available. Targets without an
    // implementation hit assert(0) at run time.
    //
    // Params:
    //     newState = control state to install, in the layout returned by
    //                getControlState()
    package(std.math) static void setControlState(ControlState newState) @trusted
    {
        version (GNU)
        {
            version (X86_Any)
            {
                // fclex is issued first, then the new control word is loaded.
                asm nothrow @nogc
                {
                    "fclex; fldcw %0" : : "m" (newState);
                }

                // Also update MXCSR, SSE's control register.
                if (haveSSE)
                {
                    // Read-modify-write: only the rounding and mask fields of
                    // MXCSR are replaced, all other bits are preserved.
                    uint mxcsr;
                    asm nothrow @nogc
                    {
                        "stmxcsr %0" : "=m" (mxcsr);
                    }

                    /* In the FPU control register, rounding mode is in bits 10 and
                       11. In MXCSR it's in bits 13 and 14. */
                    mxcsr &= ~(roundingMask << 3);             // delete old rounding mode
                    mxcsr |= (newState & roundingMask) << 3;   // write new rounding mode

                    /* In the FPU control register, masks are bits 0 through 5.
                       In MXCSR they're 7 through 12. */
                    mxcsr &= ~(allExceptions << 7);            // delete old masks
                    mxcsr |= (newState & allExceptions) << 7;  // write new exception masks

                    asm nothrow @nogc
                    {
                        "ldmxcsr %0" : : "m" (mxcsr);
                    }
                }
            }
            else version (AArch64)
            {
                // Write FPCR from a general-purpose register.
                asm nothrow @nogc
                {
                    "msr FPCR, %0;" : : "r" (newState);
                }
            }
            else version (ARM)
            {
                // Soft-float ARM: nothing is written.
                version (ARM_SoftFloat)
                   return;
                else
                {
                    // Write FPSCR from a general-purpose register.
                    asm nothrow @nogc
                    {
                        "vmsr FPSCR, %0" : : "r" (newState);
                    }
                }
            }
            else version (RISCV_Any)
            {
                // Soft-float RISC-V: nothing is written.
                version (D_SoftFloat)
                    return;
                else
                {
                    asm nothrow @nogc
                    {
                        "fscsr %0" : : "r" (newState);
                    }
                }
            }
            else
                // No GNU-asm implementation for any other target.
                assert(0, "Not yet supported");
        }
        else
        version (InlineAsm_X86_Any)
        {
            // fclex is issued first, then the new control word is loaded.
            asm nothrow @nogc
            {
                fclex;
                fldcw newState;
            }

            // Also update MXCSR, SSE's control register.
            if (haveSSE)
            {
                // Read-modify-write: only the rounding and mask fields of
                // MXCSR are replaced, all other bits are preserved.
                uint mxcsr;
                asm nothrow @nogc { stmxcsr mxcsr; }

                /* In the FPU control register, rounding mode is in bits 10 and
                11. In MXCSR it's in bits 13 and 14. */
                mxcsr &= ~(roundingMask << 3);             // delete old rounding mode
                mxcsr |= (newState & roundingMask) << 3;   // write new rounding mode

                /* In the FPU control register, masks are bits 0 through 5.
                In MXCSR they're 7 through 12. */
                mxcsr &= ~(allExceptions << 7);            // delete old masks
                mxcsr |= (newState & allExceptions) << 7;  // write new exception masks

                asm nothrow @nogc { ldmxcsr mxcsr; }
            }
        }
        else version (RISCV_Any)
        {
            // The GCC-style asm is wrapped in a string mixin so it is only
            // parsed when this branch is actually selected.
            mixin(`
            asm pure nothrow @nogc
            {
                "fscsr %0" : : "r" (newState);
            }
            `);
        }
        else version (LoongArch_Any)
        {
            // Only the rounding-mode and exception bits of newState are written.
            asm nothrow @nogc
            {
                "movgr2fcsr $r0,%0" :
                : "r" (newState & (roundingMask | allExceptions));
            }
        }
        else
            assert(0, "Not yet supported");
    }
1184 }
1185
///
@safe unittest
{
    import std.math.rounding : lrint;

    FloatingPointControl ctrl;

    // Rounding down: 1.5 becomes 1
    ctrl.rounding = FloatingPointControl.roundDown;
    assert(lrint(1.5) == 1.0);

    // Rounding up: 1.4 becomes 2
    ctrl.rounding = FloatingPointControl.roundUp;
    assert(lrint(1.4) == 2.0);

    // Rounding to nearest: 1.5 becomes 2
    ctrl.rounding = FloatingPointControl.roundToNearest;
    assert(lrint(1.5) == 2.0);
}
1202
@safe unittest
{
    alias FPC = FloatingPointControl;

    // Asserts that the rounding mode and the enabled exceptions are at their defaults.
    void checkDefaults()
    {
        assert(FPC.rounding == FPC.roundToNearest);
        if (FPC.hasExceptionTraps)
            assert(FPC.enabledExceptions == 0);
    }

    // An instance that is never used must leave the defaults in place.
    {
        FPC ctrl;
    }
    checkDefaults();

    // A changed rounding mode is visible while the instance lives and is
    // undone once it goes out of scope.
    {
        FPC ctrl;
        ctrl.rounding = FPC.roundDown;
        assert(FPC.rounding == FPC.roundDown);
    }
    checkDefaults();

    // Same for enabled exceptions combined with a rounding change.
    if (FPC.hasExceptionTraps)
    {
        FPC ctrl;
        const wanted = FPC.divByZeroException | FPC.overflowException;
        ctrl.enableExceptions(wanted);
        assert(ctrl.enabledExceptions == wanted);

        ctrl.rounding = FPC.roundUp;
        assert(FPC.rounding == FPC.roundUp);
    }
    checkDefaults();
}
1239
@safe unittest // rounding
{
    import std.meta : AliasSeq;

    // Returns 1 + 0.1 evaluated as T under rounding mode `rm`.
    // Deliberately not inlined; see the note inside the loop below.
    static T addRound(T)(uint rm)
    {
        pragma(inline, false);
        FloatingPointControl ctrl;
        ctrl.rounding = rm;
        T acc = 1;
        acc = forceAddOp(acc, 0.1L);
        return acc;
    }

    // Returns -1 - 0.1 evaluated as T under rounding mode `rm`.
    // Deliberately not inlined; see the note inside the loop below.
    static T subRound(T)(uint rm)
    {
        pragma(inline, false);
        FloatingPointControl ctrl;
        ctrl.rounding = rm;
        T acc = -1;
        acc = forceSubOp(acc, 0.1L);
        return acc;
    }

    static foreach (T; AliasSeq!(float, double, real))
    {{
        /* Be careful with changing the rounding mode, it interferes
         * with common subexpressions. Changing rounding modes should
         * be done with separate functions that are not inlined.
         */

        // Positive result: rounding toward zero coincides with rounding down.
        {
            T up = addRound!T(FloatingPointControl.roundUp);
            T down = addRound!T(FloatingPointControl.roundDown);
            T zero = addRound!T(FloatingPointControl.roundToZero);

            assert(up > down);
            assert(zero == down);
        }

        // Negative result: rounding toward zero coincides with rounding up.
        {
            T up = subRound!T(FloatingPointControl.roundUp);
            T down = subRound!T(FloatingPointControl.roundDown);
            T zero = subRound!T(FloatingPointControl.roundToZero);

            assert(up > down);
            assert(zero == up);
        }
    }}
}
1290
1291 } // FloatingPointControlSupport
1292
// Test-only arithmetic helpers, compiled only when StdUnittest is set.
version (StdUnittest)
{
    // These helpers are intended to avoid constant propagation by the optimizer.
    // Each one performs a single binary operation on two values of the same
    // type T and returns the result; all are private, @safe and never inlined.
    pragma(inline, false) private @safe
    {
        T forceAddOp(T)(T x, T y) { return x + y; } // x + y
        T forceSubOp(T)(T x, T y) { return x - y; } // x - y
        T forceMulOp(T)(T x, T y) { return x * y; } // x * y
        T forceDivOp(T)(T x, T y) { return x / y; } // x / y
    }
}