jart
diff --git a/‎examples/trapping.c
Lines changed: 142 additions & 0 deletions b/‎examples/trapping.c
Lines changed: 142 additions & 0 deletions
diff --git a/‎libc/calls/ucontext.h
Lines changed: 41 additions & 0 deletions b/‎libc/calls/ucontext.h
Lines changed: 41 additions & 0 deletions
diff --git a/‎libc/cosmo.h
Lines changed: 1 addition & 0 deletions b/‎libc/cosmo.h
Lines changed: 1 addition & 0 deletions
diff --git a/‎libc/intrin/fedisableexcept.c
Lines changed: 92 additions & 0 deletions b/‎libc/intrin/fedisableexcept.c
Lines changed: 92 additions & 0 deletions
diff --git a/‎libc/intrin/feenableexcept.c
Lines changed: 98 additions & 0 deletions b/‎libc/intrin/feenableexcept.c
Lines changed: 98 additions & 0 deletions
@@ -0,0 +1,142 @@
+#include <fenv.h>
+#include <math.h>
+#include <signal.h>
+#include <stdio.h>
+#include <string.h>
+#include <ucontext.h>
+#include <unistd.h>
+#include "libc/calls/struct/aarch64.internal.h"
+
+/*
+   Do you put lots of assert(!isnan(x)) in your code??
+   Your microprocessor has a feature to automate this.
+
+       Uncaught SIGFPE (FPE_FLTINV)
+       __math_invalidf at libc/tinymath/math_errf.c:88
+       logf at libc/tinymath/logf.c:100
+       main at examples/trapping.c:29
+       cosmo at libc/runtime/cosmo.S:105
+       _start at libc/crt/crt.S:116
+
+   This file shows how to use floating point exception
+   trapping with Cosmopolitan Libc.
+*/
+/* exception set this example clears, traps on, and untraps (no FE_INEXACT) */
+#define TRAPS (FE_INVALID | FE_DIVBYZERO | FE_OVERFLOW | FE_UNDERFLOW)
+/**
+ * SIGFPE handler used by this example.
+ *
+ * Writes a label for `si->si_code` to file descriptor 1, then edits the
+ * floating point control/status words stored in the signal context so
+ * that TRAPS are no longer trapped and their flags are cleared. If the
+ * saved floating point state can't be found, it prints an error and
+ * calls _exit(1).
+ *
+ * @param sig is not used
+ * @param si supplies the `si_code` that selects the label
+ * @param arg is used as the `ucontext_t *` of the interrupted code
+ */
+void spring_trap(int sig, siginfo_t *si, void *arg) {
+  // name the fault using write() rather than stdio
+  // NOTE(review): kept as an if-chain; confirm whether FPE_* are constants
+  const char *msg;
+  int sic = si->si_code;
+  if (sic == FPE_INTDIV)
+    msg = "FPE_INTDIV: ";  // integer divide by zero
+  else if (sic == FPE_INTOVF)
+    msg = "FPE_INTOVF: ";  // integer overflow
+  else if (sic == FPE_FLTDIV)
+    msg = "FPE_FLTDIV: ";  // floating point divide by zero
+  else if (sic == FPE_FLTOVF)
+    msg = "FPE_FLTOVF: ";  // floating point overflow
+  else if (sic == FPE_FLTUND)
+    msg = "FPE_FLTUND: ";  // floating point underflow
+  else if (sic == FPE_FLTRES)
+    msg = "FPE_FLTRES: ";  // floating point inexact
+  else if (sic == FPE_FLTINV)
+    msg = "FPE_FLTINV: ";  // invalid floating point operation
+  else if (sic == FPE_FLTSUB)
+    msg = "FPE_FLTSUB: ";  // subscript out of range
+  else
+    msg = "SIGFPE: ";  // fallback label for any other si_code
+  write(1, msg, strlen(msg));
+
+  // recover from trap so that execution may resume
+  // without this the same signal will just keep getting raised
+  ucontext_t *ctx = arg;
+#ifdef __x86_64__
+  if (ctx->uc_mcontext.fpregs) {
+    ctx->uc_mcontext.fpregs->mxcsr |= TRAPS << 7;  // set mask bits: disable traps
+    ctx->uc_mcontext.fpregs->mxcsr &= ~TRAPS;      // clear exception flags
+    return;
+  }
+#elif defined(__aarch64__)
+  struct _aarch64_ctx *ac;  // walks records in __reserved until magic is zero
+  for (ac = (struct _aarch64_ctx *)ctx->uc_mcontext.__reserved; ac->magic;
+       ac = (struct _aarch64_ctx *)((char *)ac + ac->size)) {
+    if (ac->magic == FPSIMD_MAGIC) {
+      struct fpsimd_context *sm = (struct fpsimd_context *)ac;
+      sm->fpcr &= ~(TRAPS << 8);  // clear enable bits: disable traps
+      sm->fpsr &= ~TRAPS;         // clear exception flags
+      return;
+    }
+  }
+#endif
+
+  // exit if we can't recover execution
+  msg = "cannot recover from signal\n";
+  write(1, msg, strlen(msg));
+  _exit(1);
+}
+
+/**
+ * Installs spring_trap() as the process's SIGFPE handler.
+ *
+ * SA_SIGINFO is requested so the handler is called with the siginfo_t
+ * and context arguments it reads. The struct is zeroed first so that
+ * any member not assigned below has a defined value, and a failure to
+ * install the handler is reported on stderr instead of being ignored.
+ */
+void setup_trap(void) {
+  struct sigaction sa;
+  memset(&sa, 0, sizeof(sa));  // no indeterminate members reach sigaction()
+  sigemptyset(&sa.sa_mask);
+  sa.sa_flags = SA_SIGINFO;
+  sa.sa_sigaction = spring_trap;
+  if (sigaction(SIGFPE, &sa, 0))
+    perror("sigaction");
+}
+
+/**
+ * Clears any pending TRAPS flags and (re)enables trapping for them.
+ *
+ * feenableexcept() signals failure with -1. Any other return value is
+ * a success; on aarch64 it is the set of traps that was already
+ * enabled, which can be nonzero. Only -1 is therefore treated as
+ * "unsupported". The warning is printed at most once per process.
+ */
+void activate_trap(void) {
+  static bool warned;
+  feclearexcept(TRAPS);
+  if (feenableexcept(TRAPS) == -1 && !warned) {
+    warned = true;
+    fprintf(stderr, "warning: trapping math isn't supported on this cpu\n");
+  }
+}
+
+// Returns its argument untouched.
+float ident(float x) {
+  float same = x;
+  return same;
+}
+
+// Indirect handle on ident(); main() routes its operands through this
+// pointer instead of using the literals directly.
+float (*veil)(float) = &ident;
+/**
+ * Installs the SIGFPE handler, then runs a series of float operations.
+ *
+ * activate_trap() is called before every operation because the handler
+ * (spring_trap) turns trapping back off when it fires. Operands go
+ * through `veil`, presumably so the compiler can't fold the expressions
+ * at build time -- confirm. Each result is printed after the operation.
+ */
+int main(int argc, char *argv[]) {
+  float x;  // receives the result of each operation below
+  setup_trap();
+
+  // test illegal math
+  activate_trap();
+  x = 0 / veil(0);
+  printf("0/0 = %g\n", x);
+
+  // test divide by zero
+  activate_trap();
+  x = 1 / veil(0);
+  printf("1/0 = %g\n", x);
+
+  // test divide by zero again, with a negative numerator
+  activate_trap();
+  x = -1 / veil(0);
+  printf("-1/0 = %g\n", x);
+
+  // test domain error
+  activate_trap();
+  x = logf(veil(-1));
+  printf("log(-1) = %g\n", x);
+
+  // test imaginary number
+  activate_trap();
+  x = sqrtf(veil(-1));
+  printf("sqrt(-1) = %g\n", x);
+
+  // test overflow
+  activate_trap();
+  x = expf(veil(88.8));
+  printf("expf(88.8) = %g\n", x);
+
+  // test underflow
+  activate_trap();
+  x = expf(veil(-104));
+  printf("expf(-104) = %g\n", x);
+}
@@ -43,14 +43,55 @@ struct FpuStackEntry {
 };
 
 struct thatispacked FpuState {
+
+  /* 8087 FPU Control Word
+      IM: Invalid Operation ───────────────┐
+      DM: Denormal Operand ───────────────┐│
+      ZM: Zero Divide ───────────────────┐││
+      OM: Overflow ─────────────────────┐│││
+      UM: Underflow ───────────────────┐││││
+      PM: Precision ──────────────────┐│││││
+      PC: Precision Control ───────┐  ││││││
+       {float,∅,double,long double}│  ││││││
+      RC: Rounding Control ──────┐ │  ││││││
+       {even, →-∞, →+∞, →0}      │┌┤  ││││││
+                                ┌┤││  ││││││
+                               d││││rr││││││
+                          0b0000001001111111 */
   uint16_t cwd;
+
+  /* 8087 FPU Status Word */
   uint16_t swd;
+
   uint16_t ftw;
   uint16_t fop;
   uint64_t rip;
   uint64_t rdp;
+
+  /* SSE CONTROL AND STATUS REGISTER
+     IE: Invalid Operation Flag ──────────────┐
+     DE: Denormal Flag ──────────────────────┐│
+     ZE: Divide-by-Zero Flag ───────────────┐││
+     OE: Overflow Flag ────────────────────┐│││
+     UE: Underflow Flag ──────────────────┐││││
+     PE: Precision Flag ─────────────────┐│││││
+     DAZ: Denormals Are Zeros ──────────┐││││││
+     IM: Invalid Operation Mask ───────┐│││││││
+     DM: Denormal Operation Mask ─────┐││││││││
+     ZM: Divide-by-Zero Mask ────────┐│││││││││
+     OM: Overflow Mask ─────────────┐││││││││││
+     UM: Underflow Mask ───────────┐│││││││││││
+     PM: Precision Mask ──────────┐││││││││││││
+     RC: Rounding Control ───────┐│││││││││││││
+       {even, →-∞, →+∞, →0}      ││││││││││││││
+     FTZ: Flush To Zero ───────┐ ││││││││││││││
+                               │┌┤│││││││││││││
+               ┌──────────────┐││││││││││││││││
+               │   reserved   │││││││││││││││││
+             0b00000000000000000001111110000000 */
   uint32_t mxcsr;
   uint32_t mxcr_mask;
+
   struct FpuStackEntry st[8];
   struct XmmRegister xmm[16];
   uint32_t __padding[24];
 
@@ -5,6 +5,7 @@ COSMOPOLITAN_C_START_
 errno_t cosmo_once(_Atomic(uint32_t) *, void (*)(void));
 int systemvpe(const char *, char *const[], char *const[]) libcesque;
 char *GetProgramExecutableName(void);
+void unleaf(void);
 
 COSMOPOLITAN_C_END_
 #endif /* COSMOPOLITAN_LIBC_COSMO_H_ */
@@ -0,0 +1,92 @@
+/*-*- mode:c;indent-tabs-mode:nil;c-basic-offset:2;tab-width:8;coding:utf-8 -*-│
+│ vi: set et ft=c ts=2 sts=2 sw=2 fenc=utf-8                               :vi │
+╞══════════════════════════════════════════════════════════════════════════════╡
+│ Copyright 2024 Justine Alexandra Roberts Tunney                              │
+│                                                                              │
+│ Permission to use, copy, modify, and/or distribute this software for         │
+│ any purpose with or without fee is hereby granted, provided that the         │
+│ above copyright notice and this permission notice appear in all copies.      │
+│                                                                              │
+│ THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL                │
+│ WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED                │
+│ WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE             │
+│ AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL         │
+│ DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR        │
+│ PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER               │
+│ TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR             │
+│ PERFORMANCE OF THIS SOFTWARE.                                                │
+╚─────────────────────────────────────────────────────────────────────────────*/
+#include "libc/runtime/fenv.h"
+
+/**
+ * Disables floating point exception trapping, e.g.
+ *
+ *     fedisableexcept(FE_INVALID | FE_DIVBYZERO |
+ *                     FE_OVERFLOW | FE_UNDERFLOW);
+ *
+ * This undoes feenableexcept() for the given exceptions, so the
+ * operations in question stop raising SIGFPE. See feenableexcept() for
+ * the list of `si->si_code` values a SIGFPE handler may observe while
+ * trapping is turned on.
+ *
+ * It's important to not use the `-ffast-math` or `-Ofast` flags when
+ * compiling code that needs to be debugged. Using `-fsignaling-nans`
+ * will also help, since GCC doesn't enable that by default.
+ *
+ * @param excepts may bitwise-or the following:
+ *     - `FE_INVALID`
+ *     - `FE_DIVBYZERO`
+ *     - `FE_OVERFLOW`
+ *     - `FE_UNDERFLOW`
+ *     - `FE_INEXACT`
+ *     - `FE_ALL_EXCEPT` (all of the above)
+ * @return 0 on x86-64, the trap bits that were enabled before the call
+ *     on aarch64, or -1 on any other architecture
+ * @see fetestexcept() if you don't want to deal with signals
+ * @see feenableexcept() to turn it on in the first place
+ */
+int fedisableexcept(int excepts) {
+
+  // bits outside the known exception set are ignored
+  excepts &= FE_ALL_EXCEPT;
+
+#ifdef __x86_64__
+
+#ifndef NOX87
+  // legacy x87 control word: a set mask bit suppresses the trap
+  unsigned short cw;
+  asm("fstcw\t%0" : "=m"(cw));
+  cw |= excepts;
+  asm("fldcw\t%0" : /* no inputs */ : "m"(cw));
+#endif
+
+  // sse control/status word: the mask bits sit seven places above the
+  // flag bits, and a set mask bit suppresses the trap
+  unsigned csr;
+  asm("stmxcsr\t%0" : "=m"(csr));
+  csr |= excepts << 7;
+  asm("ldmxcsr\t%0" : /* no inputs */ : "m"(csr));
+
+  return 0;
+
+#elif defined(__aarch64__)
+
+  // fpcr: the trap enable bits sit eight places above the flag bits,
+  // and a cleared enable bit turns the trap off
+  unsigned before = __builtin_aarch64_get_fpcr();
+  unsigned after = before & ~(excepts << 8);
+  if (after != before)
+    __builtin_aarch64_set_fpcr(after);  // only write when something changes
+  return (before >> 8) & FE_ALL_EXCEPT;
+
+#else
+  return -1;
+#endif
+}
@@ -0,0 +1,98 @@
+/*-*- mode:c;indent-tabs-mode:nil;c-basic-offset:2;tab-width:8;coding:utf-8 -*-│
+│ vi: set et ft=c ts=2 sts=2 sw=2 fenc=utf-8                               :vi │
+╞══════════════════════════════════════════════════════════════════════════════╡
+│ Copyright 2024 Justine Alexandra Roberts Tunney                              │
+│                                                                              │
+│ Permission to use, copy, modify, and/or distribute this software for         │
+│ any purpose with or without fee is hereby granted, provided that the         │
+│ above copyright notice and this permission notice appear in all copies.      │
+│                                                                              │
+│ THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL                │
+│ WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED                │
+│ WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE             │
+│ AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL         │
+│ DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR        │
+│ PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER               │
+│ TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR             │
+│ PERFORMANCE OF THIS SOFTWARE.                                                │
+╚─────────────────────────────────────────────────────────────────────────────*/
+#include "libc/runtime/fenv.h"
+
+/**
+ * Enables floating point exception trapping, e.g.
+ *
+ *     feenableexcept(FE_INVALID | FE_DIVBYZERO |
+ *                    FE_OVERFLOW | FE_UNDERFLOW);
+ *
+ * When trapping is enabled, something should handle SIGFPE. Calling
+ * ShowCrashReports() at startup will install a generic handler with
+ * backtraces and the symbol of the `si->si_code` which UNIX defines
+ *
+ * - `FPE_INTOVF`: integer overflow
+ * - `FPE_INTDIV`: integer divide by zero
+ * - `FPE_FLTDIV`: floating point divide by zero
+ * - `FPE_FLTOVF`: floating point overflow
+ * - `FPE_FLTUND`: floating point underflow
+ * - `FPE_FLTRES`: floating point inexact
+ * - `FPE_FLTINV`: invalid floating point operation
+ * - `FPE_FLTSUB`: subscript out of range
+ *
+ * It's important to not use the `-ffast-math` or `-Ofast` flags when
+ * compiling code that needs to be debugged. Using `-fsignaling-nans`
+ * will also help, since GCC doesn't enable that by default.
+ *
+ * @param excepts may bitwise-or the following:
+ *     - `FE_INVALID`
+ *     - `FE_DIVBYZERO`
+ *     - `FE_OVERFLOW`
+ *     - `FE_UNDERFLOW`
+ *     - `FE_INEXACT`
+ *     - `FE_ALL_EXCEPT` (all of the above)
+ * @return 0 on x86-64; on aarch64 the trap bits that were enabled
+ *     before the call, or -1 if the cpu didn't accept the new bits;
+ *     -1 on any other architecture
+ * @see fetestexcept() if you don't want to deal with signals
+ * @see fedisableexcept() to turn it back off again
+ */
+int feenableexcept(int excepts) {
+
+  // limit to what we know
+  excepts &= FE_ALL_EXCEPT;
+
+#ifdef __x86_64__
+
+#ifndef NOX87
+  // configure 8087 fpu control word
+  // clearing the bits disables suppression
+  unsigned short x87cw;
+  asm("fstcw\t%0" : "=m"(x87cw));
+  x87cw &= ~excepts;
+  asm("fldcw\t%0" : /* no inputs */ : "m"(x87cw));
+#endif
+
+  // configure modern sse control word
+  // clearing the bits disables suppression
+  unsigned mxcsr;
+  asm("stmxcsr\t%0" : "=m"(mxcsr));
+  mxcsr &= ~(excepts << 7);
+  asm("ldmxcsr\t%0" : /* no inputs */ : "m"(mxcsr));
+
+  return 0;
+
+#elif defined(__aarch64__)
+
+  unsigned fpcr;
+  unsigned fpcr2;
+  unsigned updated_fpcr;
+  fpcr = __builtin_aarch64_get_fpcr();
+  fpcr2 = fpcr | (excepts << 8);
+  if (fpcr != fpcr2) {
+    __builtin_aarch64_set_fpcr(fpcr2);
+    // floating point exception trapping is optional in aarch64, so
+    // read the control register back (fpcr, not the fpsr status
+    // register) and fail if any requested enable bit didn't stick
+    updated_fpcr = __builtin_aarch64_get_fpcr();
+    if (fpcr2 & ~updated_fpcr)
+      return -1;
+  }
+  return (fpcr >> 8) & FE_ALL_EXCEPT;
+
+#else
+  return -1;
+#endif
+}