gencgc: More precise conservatism for pointers to boxed pages.

[sbcl.git] / src / runtime / ppc-linux-os.c
diff --git a/src/runtime/ppc-linux-os.c b/src/runtime/ppc-linux-os.c

index 443c733..c2dc019 100644 (file)
--- a/src/runtime/ppc-linux-os.c
+++ b/src/runtime/ppc-linux-os.c
@@ -18,6 +18,7 @@
  #include <stdio.h>
  #include <sys/param.h>
  #include <sys/file.h>
+#include "sbcl.h"
  #include "./signal.h"
  #include "os.h"
  #include "arch.h"
@@ -25,7 +26,6 @@
  #include "interrupt.h"
  #include "interr.h"
  #include "lispregs.h"
-#include "sbcl.h"
  #include <sys/socket.h>
  #include <sys/utsname.h>
  
@@ -34,42 +34,106 @@
  #include <sys/time.h>
  #include <sys/stat.h>
  #include <unistd.h>
+#include <sys/prctl.h>
  
  #include "validate.h"
+#include "ppc-linux-mcontext.h"
+
  size_t os_vm_page_size;
  
-struct thread *arch_os_get_current_thread() {
-    return all_threads;
-}
  int arch_os_thread_init(struct thread *thread) {
-    return 1;                  /* success */
+#if defined(LISP_FEATURE_SB_THREAD)
+    pthread_setspecific(specials,thread);
+#endif
+
+    /* For some reason, PPC Linux appears to default to not generating
+     * floating point exceptions.  PR_SET_FPEXC is a PPC-specific
+     * option new in kernel 2.4.21 and 2.5.32 that allows us to
+     * configure this.  Should we need to run on an older kernel, the
+     * equivalent trick is to get into a signal-handling context and
+     * modify the saved machine state register.
+     *
+     * PR_FP_EXC_PRECISE may be more accurate than we need,
+     * particularly if we move to the x86oid trick of inserting
+     * explicit synchronization for floating-point exception
+     * delivery.  If we wish to move to such a model, the other two
+     * exception delivery modes that we could use are PR_FP_EXC_ASYNC
+     * and PR_FP_EXC_NONRECOV, and exception delivery can be forced
+     * by any access to the FPSCR.  -- AB, 2010-May-23 */
+    prctl(PR_SET_FPEXC, PR_FP_EXC_PRECISE, 0, 0);
+
+    return 1;                   /* success */
  }
  int arch_os_thread_cleanup(struct thread *thread) {
-    return 1;                  /* success */
+    return 1;                   /* success */
  }
  
  os_context_register_t   *
  os_context_register_addr(os_context_t *context, int offset)
  {
+#if defined(GLIBC231_STYLE_UCONTEXT)
      return &((context->uc_mcontext.regs)->gpr[offset]);
+#elif defined(GLIBC232_STYLE_UCONTEXT)
+    return &((context->uc_mcontext.uc_regs->gregs)[offset]);
+#endif
  }
  
  os_context_register_t *
  os_context_pc_addr(os_context_t *context)
  {
+#if defined(GLIBC231_STYLE_UCONTEXT)
      return &((context->uc_mcontext.regs)->nip);
+#elif defined(GLIBC232_STYLE_UCONTEXT)
+    return &((context->uc_mcontext.uc_regs->gregs)[PT_NIP]);
+#endif
  }
  
  os_context_register_t *
  os_context_lr_addr(os_context_t *context)
  {
+#if defined(GLIBC231_STYLE_UCONTEXT)
      return &((context->uc_mcontext.regs)->link);
+#elif defined(GLIBC232_STYLE_UCONTEXT)
+    return &((context->uc_mcontext.uc_regs->gregs)[PT_LNK]);
+#endif
+}
+
+os_context_register_t *
+os_context_ctr_addr(os_context_t *context)
+{
+    /* Like os_context_fp_control() and os_context_lr_addr(), this
+     * uses an index beyond the declared end of the array in order to
+     * find the correct register value in the context. */
+#if defined(GLIBC231_STYLE_UCONTEXT)
+    /* FIXME: This probably should be ->ctr instead of ->gpr[PT_CTR]. */
+    return &((context->uc_mcontext.regs)->gpr[PT_CTR]);
+#elif defined(GLIBC232_STYLE_UCONTEXT)
+    return &((context->uc_mcontext.uc_regs)->gregs[PT_CTR]);
+#endif
+}
+
+os_context_register_t *
+os_context_cr_addr(os_context_t *context)
+{
+    /* Like os_context_fp_control() and os_context_lr_addr(), this
+     * uses an index beyond the declared end of the array in order to
+     * find the correct register value in the context. */
+#if defined(GLIBC231_STYLE_UCONTEXT)
+    /* FIXME: This probably should be ->ccr instead of ->gpr[PT_CCR]. */
+    return &((context->uc_mcontext.regs)->gpr[PT_CCR]);
+#elif defined(GLIBC232_STYLE_UCONTEXT)
+    return &((context->uc_mcontext.uc_regs)->gregs[PT_CCR]);
+#endif
  }
  
  sigset_t *
  os_context_sigmask_addr(os_context_t *context)
  {
+#if defined(GLIBC231_STYLE_UCONTEXT)
+    return &context->uc_sigmask;
+#elif defined(GLIBC232_STYLE_UCONTEXT)
      return &context->uc_sigmask;
+#endif
  }
  
  unsigned long
@@ -80,40 +144,34 @@ os_context_fp_control(os_context_t *context)
         registers, and PT_FPSCR is an offset that is larger than 32
         (the number of ppc registers), but that happens to get the
         right answer. -- CSR, 2002-07-11 */
-    return context->uc_mcontext.regs->gpr[PT_FPSCR]; 
+#if defined(GLIBC231_STYLE_UCONTEXT)
+    return context->uc_mcontext.regs->gpr[PT_FPSCR];
+#elif defined(GLIBC232_STYLE_UCONTEXT)
+    return context->uc_mcontext.uc_regs->gregs[PT_FPSCR];
+#endif
  }
  
-void 
+void
  os_restore_fp_control(os_context_t *context)
  {
-    unsigned long control;
-    
-    control = os_context_fp_control(context) & 
-      /* FIXME: Should we preserve the user's requested rounding mode?
-
-         Note that doing 
-
-        ~(FLOAT_STICKY_BITS_MASK | FLOAT_EXCEPTIONS_BYTE_MASK)
-
-        here leads to infinite SIGFPE for invalid operations, as
-        there are bits in the control register that need to be
-        cleared that are let through by that mask. -- CSR, 2002-07-16 */
-      FLOAT_TRAPS_BYTE_MASK;
-    
-    /* FIXME: Shoot me now.
-       
-       Hardcoded nastiness: the "0"s below refer to the first floating
-       point registers -- we should let gcc deal with that. The 8(31)
-       refers to the position on the stack, less one, of control (we
-       need for control to be the high word of the double loaded by
-       lfd; how do I know that r31 contains the stack? I don't, I'm
-       just guessing. The 255, on the other hand, is a valid constant
-       -- it says "move everything in the upper word into the floating
-       point control register. -- CSR, 2002-07-16 */
-    asm ("stw %0, 12(31); lfd 0, 8(31); mtfsf 255, 0" : : "r" (control) : "r31");
+    /* KLUDGE: mtfsf has to be run against a float register, so we
+     * construct the float we need to use as an integer, then cast
+     * a pointer to its storage to (double *) and load through it.  For
+     * this to work, control must be the same width as a double,
+     * 64 bits.  And why aren't we using a union here, anyway? */
+    unsigned long long control;
+    double d;
+
+    /* FIXME: We are only preserving enabled traps and rounding
+     * mode here.  Do we also want to preserve "fast mode"? */
+    control = os_context_fp_control(context) &
+        (FLOAT_TRAPS_BYTE_MASK | FLOAT_ROUNDING_MODE_MASK);
+
+    d = *((double *) &control);
+    asm volatile ("mtfsf 0xff,%0" : : "f" (d));
  }
  
-void 
+void
  os_flush_icache(os_vm_address_t address, os_vm_size_t length)
  {
      /* see ppc-arch.c */