From: David L. <lic...@us...> - 2012-10-05 20:29:36
|
The branch "master" has been updated in SBCL: via 7aef55b130d95c384b63422807f1848faa9aba5a (commit) from 1dd3616e9eadaba9f1ca86b72d64551fbd75f399 (commit) - Log ----------------------------------------------------------------- commit 7aef55b130d95c384b63422807f1848faa9aba5a Author: David Lichteblau <da...@li...> Date: Tue Sep 18 17:12:09 2012 +0200 Preliminary work towards threads on win32 * Implement SB-THREAD * Support WITH-TIMEOUT, etc. Implementation details: * Implement pthreads, futex API on top of Win32. * Add support for the timer facility using sb-wtimer. * Implement an interruptible `nanosleep' using waitable timers. * Threading on Windows uses safepoints to stop the world. On this platform, either all or none of :SB-THREAD, :SB-SAFEPOINT, :SB-THRUPTION, and :SB-WTIMER need to be enabled together. * On this platform, INTERRUPT-THREAD will not run interruptions in a target thread that is executing foreign code, even though the POSIX version of sb-thruption still allows this (potentially unsafe) form of signalling by default. Does not yet include interruptible I/O, which will be made available separately. Slime users are requested to build SBCL without threads until then. Note that these changes alone are not yet sufficient to make SBCL on Windows an ideal backend. Users looking for a particularly stable or thread-enabled version of SBCL for Windows are still advised to use the well-known Windows branch instead. This is a merge of features developed earlier by Dmitry Kalyanov and Anton Kovalenko. 
--- src/code/cold-init.lisp | 5 +- src/code/run-program.lisp | 6 +- src/code/target-exception.lisp | 100 ++ src/code/target-thread.lisp | 6 +- src/code/toplevel.lisp | 4 +- src/code/win32.lisp | 13 +- src/compiler/generic/objdef.lisp | 1 + src/runtime/Config.x86-win32 | 5 +- src/runtime/gencgc.c | 10 +- src/runtime/interrupt.c | 70 +- src/runtime/interrupt.h | 9 +- src/runtime/os-common.c | 2 +- src/runtime/parse.c | 6 +- src/runtime/print.c | 3 + src/runtime/pthreads_win32.c | 1582 +++++++++++++++++++++++++++++ src/runtime/pthreads_win32.h | 421 ++++++++ src/runtime/runtime.c | 13 +- src/runtime/runtime.h | 17 +- src/runtime/safepoint.c | 67 ++- src/runtime/save.c | 6 +- src/runtime/thread.c | 93 ++- src/runtime/thread.h | 27 +- src/runtime/win32-os.c | 829 +++++++++++++--- src/runtime/win32-os.h | 54 +- src/runtime/win32-thread-private-events.h | 13 + src/runtime/wrap.c | 14 +- src/runtime/x86-arch.c | 3 +- src/runtime/x86-arch.h | 16 +- src/runtime/x86-assem.S | 18 +- src/runtime/x86-win32-os.c | 94 +- src/runtime/x86-win32-os.h | 16 +- tools-for-build/grovel-headers.c | 35 + 32 files changed, 3275 insertions(+), 283 deletions(-) diff --git a/src/code/cold-init.lisp b/src/code/cold-init.lisp index c343f4a..48a2027 100644 --- a/src/code/cold-init.lisp +++ b/src/code/cold-init.lisp @@ -230,7 +230,8 @@ (show-and-call stream-cold-init-or-reset) (show-and-call !loader-cold-init) (show-and-call !foreign-cold-init) - #!-win32 (show-and-call signal-cold-init-or-reinit) + #!-(and win32 (not sb-thread)) + (show-and-call signal-cold-init-or-reinit) (/show0 "enabling internal errors") (setf (sb!alien:extern-alien "internal_errors_enabled" boolean) t) @@ -351,7 +352,7 @@ process to continue normally." 
(os-cold-init-or-reinit) (thread-init-or-reinit) (stream-reinit t) - #!-win32 + #!-(and win32 (not sb-thread)) (signal-cold-init-or-reinit) (setf (sb!alien:extern-alien "internal_errors_enabled" boolean) t) (float-cold-init-or-reinit)) diff --git a/src/code/run-program.lisp b/src/code/run-program.lisp index 97d6d55..fee0dd7 100644 --- a/src/code/run-program.lisp +++ b/src/code/run-program.lisp @@ -145,7 +145,6 @@ #+sb-doc "List of process structures for all active processes.") -#-win32 (defvar *active-processes-lock* (sb-thread:make-mutex :name "Lock for active processes.")) @@ -153,11 +152,8 @@ ;;; mutex is needed. More importantly the sigchld signal handler also ;;; accesses it, that's why we need without-interrupts. (defmacro with-active-processes-lock (() &body body) - #-win32 `(sb-thread::with-system-mutex (*active-processes-lock*) - ,@body) - #+win32 - `(progn ,@body)) + ,@body)) (defstruct (process (:copier nil)) pid ; PID of child process diff --git a/src/code/target-exception.lisp b/src/code/target-exception.lisp index 803a758..0c5e7b7 100644 --- a/src/code/target-exception.lisp +++ b/src/code/target-exception.lisp @@ -101,3 +101,103 @@ ;;; I don't know if we still need this or not. Better safe for now. (defun receive-pending-interrupt () (receive-pending-interrupt)) + +(in-package "SB!UNIX") + +#!+sb-thread +(progn + (defun receive-pending-interrupt () + (receive-pending-interrupt)) + + (defmacro with-interrupt-bindings (&body body) + `(let* + ;; KLUDGE: Whatever is on the PCL stacks before the interrupt + ;; handler runs doesn't really matter, since we're not on the + ;; same call stack, really -- and if we don't bind these (esp. + ;; the cache one) we can get a bogus metacircle if an interrupt + ;; handler calls a GF that was being computed when the interrupt + ;; hit. + ((sb!pcl::*cache-miss-values-stack* nil) + (sb!pcl::*dfun-miss-gfs-on-stack* nil)) + ,@body)) + +;;; Evaluate CLEANUP-FORMS iff PROTECTED-FORM does a non-local exit. 
+ (defmacro nlx-protect (protected-form &rest cleanup-froms) + (with-unique-names (completep) + `(let ((,completep nil)) + (without-interrupts + (unwind-protect + (progn + (allow-with-interrupts + ,protected-form) + (setq ,completep t)) + (unless ,completep + ,@cleanup-froms)))))) + + (declaim (inline %unblock-deferrable-signals)) + (sb!alien:define-alien-routine ("unblock_deferrable_signals" + %unblock-deferrable-signals) + sb!alien:void + (where sb!alien:unsigned) + (old sb!alien:unsigned)) + + (defun block-deferrable-signals () + (%block-deferrable-signals 0 0)) + + (defun unblock-deferrable-signals () + (%unblock-deferrable-signals 0 0)) + + (declaim (inline %block-deferrables-and-return-mask %apply-sigmask)) + (sb!alien:define-alien-routine ("block_deferrables_and_return_mask" + %block-deferrables-and-return-mask) + sb!alien:unsigned) + (sb!alien:define-alien-routine ("apply_sigmask" + %apply-sigmask) + sb!alien:void + (mask sb!alien:unsigned)) + + (defmacro without-interrupts/with-deferrables-blocked (&body body) + (let ((mask-var (gensym))) + `(without-interrupts + (let ((,mask-var (%block-deferrables-and-return-mask))) + (unwind-protect + (progn ,@body) + (%apply-sigmask ,mask-var)))))) + + (defun invoke-interruption (function) + (without-interrupts + ;; Reset signal mask: the C-side handler has blocked all + ;; deferrable signals before funcalling into lisp. They are to be + ;; unblocked the first time interrupts are enabled. With this + ;; mechanism there are no extra frames on the stack from a + ;; previous signal handler when the next signal is delivered + ;; provided there is no WITH-INTERRUPTS. + (let ((sb!unix::*unblock-deferrables-on-enabling-interrupts-p* t)) + (with-interrupt-bindings + (let ((sb!debug:*stack-top-hint* + (nth-value 1 (sb!kernel:find-interrupted-name-and-frame)))) + (allow-with-interrupts + (nlx-protect + (funcall function) + ;; We've been running with deferrables + ;; blocked in Lisp called by a C signal + ;; handler. 
If we return normally the sigmask + ;; in the interrupted context is restored. + ;; However, if we do an nlx the operating + ;; system will not restore it for us. + (when sb!unix::*unblock-deferrables-on-enabling-interrupts-p* + ;; This means that storms of interrupts + ;; doing an nlx can still run out of stack. + (unblock-deferrable-signals))))))))) + + (defmacro in-interruption ((&key) &body body) + #!+sb-doc + "Convenience macro on top of INVOKE-INTERRUPTION." + `(dx-flet ((interruption () ,@body)) + (invoke-interruption #'interruption))) + + (defun sb!kernel:signal-cold-init-or-reinit () + #!+sb-doc + "Enable all the default signals that Lisp knows how to deal with." + (unblock-deferrable-signals) + (values))) diff --git a/src/code/target-thread.lisp b/src/code/target-thread.lisp index 5f61722..773fe9c 100644 --- a/src/code/target-thread.lisp +++ b/src/code/target-thread.lisp @@ -1605,12 +1605,12 @@ the state of a thread: (interrupt-thread thread #'break) Short version: be careful out there." - #!+win32 + #!+(and (not sb-thread) win32) + #!+(and (not sb-thread) win32) (declare (ignore thread)) - #!+win32 (with-interrupt-bindings (with-interrupts (funcall function))) - #!-win32 + #!-(and (not sb-thread) win32) (let ((os-thread (thread-os-thread thread))) (cond ((not os-thread) (error 'interrupt-thread-error :thread thread)) diff --git a/src/code/toplevel.lisp b/src/code/toplevel.lisp index f3f226b..a72e064 100644 --- a/src/code/toplevel.lisp +++ b/src/code/toplevel.lisp @@ -202,7 +202,7 @@ any non-negative real number." :format-arguments (list seconds) :datum seconds :expected-type '(real 0))) - #!-win32 + #!-(and win32 (not sb-thread)) (multiple-value-bind (sec nsec) (if (integerp seconds) (values seconds 0) @@ -216,7 +216,7 @@ any non-negative real number." 
do (decf sec (expt 10 8)) (sb!unix:nanosleep (expt 10 8) 0)) (sb!unix:nanosleep sec nsec)) - #!+win32 + #!+(and win32 (not sb-thread)) (sb!win32:millisleep (truncate (* seconds 1000))) nil) diff --git a/src/code/win32.lisp b/src/code/win32.lisp index 25b00ad..1f8e7ed 100644 --- a/src/code/win32.lisp +++ b/src/code/win32.lisp @@ -154,10 +154,21 @@ ;;;; System Functions -;;; Sleep for MILLISECONDS milliseconds. +#!-sb-thread (define-alien-routine ("Sleep@4" millisleep) void (milliseconds dword)) +#!+sb-thread +(defun sb!unix:nanosleep (sec nsec) + (let ((*allow-with-interrupts* *interrupts-enabled*)) + (without-interrupts + (let ((timer (sb!impl::os-create-wtimer))) + (sb!impl::os-set-wtimer timer sec nsec) + (unwind-protect + (do () ((with-local-interrupts + (zerop (sb!impl::os-wait-for-wtimer timer))))) + (sb!impl::os-close-wtimer timer)))))) + #!+sb-unicode (progn (defvar *ansi-codepage* nil) diff --git a/src/compiler/generic/objdef.lisp b/src/compiler/generic/objdef.lisp index bfc0281..35e7cb5 100644 --- a/src/compiler/generic/objdef.lisp +++ b/src/compiler/generic/objdef.lisp @@ -398,6 +398,7 @@ (control-stack-guard-page-protected) (alien-stack-start :c-type "lispobj *" :length #!+alpha 2 #!-alpha 1) (alien-stack-pointer :c-type "lispobj *" :length #!+alpha 2 #!-alpha 1) + #!+win32 (private-events :c-type "struct private_events" :length 2) (this :c-type "struct thread *" :length #!+alpha 2 #!-alpha 1) (prev :c-type "struct thread *" :length #!+alpha 2 #!-alpha 1) (next :c-type "struct thread *" :length #!+alpha 2 #!-alpha 1) diff --git a/src/runtime/Config.x86-win32 b/src/runtime/Config.x86-win32 index f77b20a..a047e63 100644 --- a/src/runtime/Config.x86-win32 +++ b/src/runtime/Config.x86-win32 @@ -14,7 +14,8 @@ TARGET=sbcl.exe ASSEM_SRC = x86-assem.S ARCH_SRC = x86-arch.c -OS_SRC = win32-os.c x86-win32-os.c os-common.c +OS_SRC = win32-os.c x86-win32-os.c os-common.c pthreads_win32.c + # The "--Wl,--export-dynamic" flags are here to help people # experimenting 
with callbacks from C to SBCL, by allowing linkage to # SBCL src/runtime/*.c symbols from C. Work on this is good, but it's @@ -35,7 +36,7 @@ endif GC_SRC = gencgc.c -CFLAGS = -g -Wall -O3 -fno-omit-frame-pointer +CFLAGS = -g -Wall -O3 -fno-omit-frame-pointer -mno-cygwin -march=i686 -DWINVER=0x0501 ASFLAGS = $(CFLAGS) CPP = cpp diff --git a/src/runtime/gencgc.c b/src/runtime/gencgc.c index 823410c..a89d59c 100644 --- a/src/runtime/gencgc.c +++ b/src/runtime/gencgc.c @@ -26,10 +26,14 @@ #include <stdlib.h> #include <stdio.h> -#include <signal.h> #include <errno.h> #include <string.h> #include "sbcl.h" +#if defined(LISP_FEATURE_WIN32) && defined(LISP_FEATURE_SB_THREAD) +#include "pthreads_win32.h" +#else +#include <signal.h> +#endif #include "runtime.h" #include "os.h" #include "interr.h" @@ -3321,7 +3325,7 @@ preserve_context_registers (os_context_t *c) /* On Darwin the signal context isn't a contiguous block of memory, * so just preserve_pointering its contents won't be sufficient. */ -#if defined(LISP_FEATURE_DARWIN) +#if defined(LISP_FEATURE_DARWIN)||defined(LISP_FEATURE_WIN32) #if defined LISP_FEATURE_X86 preserve_pointer((void*)*os_context_register_addr(c,reg_EAX)); preserve_pointer((void*)*os_context_register_addr(c,reg_ECX)); @@ -3350,9 +3354,11 @@ preserve_context_registers (os_context_t *c) #error "preserve_context_registers needs to be tweaked for non-x86 Darwin" #endif #endif +#if !defined(LISP_FEATURE_WIN32) for(ptr = ((void **)(c+1))-1; ptr>=(void **)c; ptr--) { preserve_pointer(*ptr); } +#endif } #endif diff --git a/src/runtime/interrupt.c b/src/runtime/interrupt.c index fe09ec2..9b82a58 100644 --- a/src/runtime/interrupt.c +++ b/src/runtime/interrupt.c @@ -102,7 +102,7 @@ union interrupt_handler interrupt_handlers[NSIG]; * work for SIGSEGV and similar. It is good enough for timers, and * maybe all deferrables. 
*/ -#ifdef LISP_FEATURE_SB_THREAD +#if defined(LISP_FEATURE_SB_THREAD) && !defined(LISP_FEATURE_WIN32) static void add_handled_signals(sigset_t *sigset) { @@ -121,7 +121,7 @@ void block_signals(sigset_t *what, sigset_t *where, sigset_t *old); static boolean maybe_resignal_to_lisp_thread(int signal, os_context_t *context) { -#ifdef LISP_FEATURE_SB_THREAD +#if defined(LISP_FEATURE_SB_THREAD) && !defined(LISP_FEATURE_WIN32) if (!pthread_getspecific(lisp_thread)) { if (!(sigismember(&deferrable_sigset,signal))) { corruption_warning_and_maybe_lose @@ -175,7 +175,7 @@ maybe_resignal_to_lisp_thread(int signal, os_context_t *context) static void run_deferred_handler(struct interrupt_data *data, os_context_t *context); -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) static void store_signal_data_for_later (struct interrupt_data *data, void *handler, int signal, siginfo_t *info, @@ -240,7 +240,7 @@ boolean all_signals_blocked_p(sigset_t *sigset, sigset_t *sigset2, const char *name) { -#if !defined(LISP_FEATURE_WIN32) +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) int i; boolean has_blocked = 0, has_unblocked = 0; sigset_t current; @@ -314,7 +314,7 @@ sigset_t gc_sigset; #endif -#if !defined(LISP_FEATURE_WIN32) +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) boolean deferrables_blocked_p(sigset_t *sigset) { @@ -325,7 +325,7 @@ deferrables_blocked_p(sigset_t *sigset) void check_deferrables_unblocked_or_lose(sigset_t *sigset) { -#if !defined(LISP_FEATURE_WIN32) +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) if (deferrables_blocked_p(sigset)) lose("deferrables blocked\n"); #endif @@ -334,13 +334,13 @@ check_deferrables_unblocked_or_lose(sigset_t *sigset) void check_deferrables_blocked_or_lose(sigset_t *sigset) { -#if !defined(LISP_FEATURE_WIN32) +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) if (!deferrables_blocked_p(sigset)) lose("deferrables 
unblocked\n"); #endif } -#if !defined(LISP_FEATURE_WIN32) +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) boolean blockables_blocked_p(sigset_t *sigset) { @@ -351,7 +351,7 @@ blockables_blocked_p(sigset_t *sigset) void check_blockables_unblocked_or_lose(sigset_t *sigset) { -#if !defined(LISP_FEATURE_WIN32) +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) if (blockables_blocked_p(sigset)) lose("blockables blocked\n"); #endif @@ -361,6 +361,24 @@ void check_blockables_blocked_or_lose(sigset_t *sigset) { #if !defined(LISP_FEATURE_WIN32) + /* On Windows, there are no actual signals, but since the win32 port + * tracks the sigmask and checks it explicitly, some functions are + * still required to keep the mask set up properly. (After all, the + * goal of the sigmask emulation is to not have to change all the + * call sites in the first place.) + * + * However, this does not hold for all signals equally: While + * deferrables matter ("is interrupt-thread okay?"), it is not worth + * having to set up blockables properly (which include the + * non-existing GC signals). + * + * Yet, as the original comment explains it: + * Adjusting FREE-INTERRUPT-CONTEXT-INDEX* and other aspecs of + * fake_foreign_function_call machinery are sometimes useful here[...]. + * + * So we merely skip this assertion. + * -- DFL, trying to expand on a comment by AK. 
+ */ if (!blockables_blocked_p(sigset)) lose("blockables unblocked\n"); #endif @@ -397,7 +415,7 @@ check_gc_signals_blocked_or_lose(sigset_t *sigset) void block_deferrable_signals(sigset_t *where, sigset_t *old) { -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) block_signals(&deferrable_sigset, where, old); #endif } @@ -405,7 +423,7 @@ block_deferrable_signals(sigset_t *where, sigset_t *old) void block_blockable_signals(sigset_t *where, sigset_t *old) { -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) block_signals(&blockable_sigset, where, old); #endif } @@ -414,7 +432,7 @@ block_blockable_signals(sigset_t *where, sigset_t *old) void block_gc_signals(sigset_t *where, sigset_t *old) { -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) block_signals(&gc_sigset, where, old); #endif } @@ -423,7 +441,7 @@ block_gc_signals(sigset_t *where, sigset_t *old) void unblock_deferrable_signals(sigset_t *where, sigset_t *old) { -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) if (interrupt_handler_pending_p()) lose("unblock_deferrable_signals: losing proposition\n"); #ifndef LISP_FEATURE_SB_SAFEPOINT @@ -436,7 +454,7 @@ unblock_deferrable_signals(sigset_t *where, sigset_t *old) void unblock_blockable_signals(sigset_t *where, sigset_t *old) { -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) unblock_signals(&blockable_sigset, where, old); #endif } @@ -454,7 +472,7 @@ unblock_gc_signals(sigset_t *where, sigset_t *old) void unblock_signals_in_context_and_maybe_warn(os_context_t *context) { -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) sigset_t *sigset = os_context_sigmask_addr(context); #ifndef LISP_FEATURE_SB_SAFEPOINT if (all_signals_blocked_p(sigset, &gc_sigset, "gc")) { @@ -548,7 +566,7 @@ 
in_leaving_without_gcing_race_p(struct thread *thread) void check_interrupt_context_or_lose(os_context_t *context) { -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) struct thread *thread = arch_os_get_current_thread(); struct interrupt_data *data = thread->interrupt_data; int interrupt_deferred_p = (data->pending_handler != 0); @@ -793,7 +811,7 @@ interrupt_internal_error(os_context_t *context, boolean continuable) #endif context_sap = alloc_sap(context); -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) thread_sigmask(SIG_SETMASK, os_context_sigmask_addr(context), 0); #endif @@ -1048,7 +1066,7 @@ interrupt_handle_now(int signal, siginfo_t *info, os_context_t *context) check_blockables_blocked_or_lose(0); -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) if (sigismember(&deferrable_sigset,signal)) check_interrupts_enabled_or_lose(context); #endif @@ -1115,11 +1133,11 @@ interrupt_handle_now(int signal, siginfo_t *info, os_context_t *context) FSHOW_SIGNAL((stderr,"/calling C-level handler\n")); -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) /* Allow signals again. 
*/ thread_sigmask(SIG_SETMASK, os_context_sigmask_addr(context), 0); -#endif (*handler.c)(signal, info, context); +#endif } if (were_in_lisp) @@ -1928,17 +1946,21 @@ sigabrt_handler(int signal, siginfo_t *info, os_context_t *context) void interrupt_init(void) { -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) int i; SHOW("entering interrupt_init()"); +#ifndef LISP_FEATURE_WIN32 see_if_sigaction_nodefer_works(); +#endif sigemptyset(&deferrable_sigset); sigemptyset(&blockable_sigset); sigemptyset(&gc_sigset); sigaddset_deferrable(&deferrable_sigset); sigaddset_blockable(&blockable_sigset); sigaddset_gc(&gc_sigset); +#endif +#ifndef LISP_FEATURE_WIN32 /* Set up high level handler information. */ for (i = 0; i < NSIG; i++) { interrupt_handlers[i].c = @@ -1950,8 +1972,8 @@ interrupt_init(void) (void (*)(int, siginfo_t*, os_context_t*))SIG_DFL; } undoably_install_low_level_interrupt_handler(SIGABRT, sigabrt_handler); +#endif SHOW("returning from interrupt_init()"); -#endif } #ifndef LISP_FEATURE_WIN32 @@ -2000,7 +2022,7 @@ unhandled_trap_error(os_context_t *context) unblock_gc_signals(0, 0); #endif context_sap = alloc_sap(context); -#ifndef LISP_FEATURE_WIN32 +#if !defined(LISP_FEATURE_WIN32) || defined(LISP_FEATURE_SB_THREAD) thread_sigmask(SIG_SETMASK, os_context_sigmask_addr(context), 0); #endif funcall1(StaticSymbolFunction(UNHANDLED_TRAP_ERROR), context_sap); @@ -2014,11 +2036,13 @@ void handle_trap(os_context_t *context, int trap) { switch(trap) { +#if !(defined(LISP_FEATURE_WIN32) && defined(LISP_FEATURE_SB_THREAD)) case trap_PendingInterrupt: FSHOW((stderr, "/<trap pending interrupt>\n")); arch_skip_instruction(context); interrupt_handle_pending(context); break; +#endif case trap_Error: case trap_Cerror: FSHOW((stderr, "/<trap error/cerror %d>\n", trap)); diff --git a/src/runtime/interrupt.h b/src/runtime/interrupt.h index 3a6a51b..83514d7 100644 --- a/src/runtime/interrupt.h +++ b/src/runtime/interrupt.h @@ -12,7 
+12,7 @@ #if !defined(_INCLUDE_INTERRUPT_H_) #define _INCLUDE_INTERRUPT_H_ -#include <signal.h> +#include "runtime.h" #include <string.h> /* @@ -24,7 +24,12 @@ * stack by the kernel, so copying a libc-sized sigset_t into it will * overflow and cause other data on the stack to be corrupted */ /* FIXME: do not rely on NSIG being a multiple of 8 */ -#define REAL_SIGSET_SIZE_BYTES ((NSIG/8)) + +#ifdef LISP_FEATURE_WIN32 +# define REAL_SIGSET_SIZE_BYTES (4) +#else +# define REAL_SIGSET_SIZE_BYTES ((NSIG/8)) +#endif static inline void sigcopyset(sigset_t *new, sigset_t *old) diff --git a/src/runtime/os-common.c b/src/runtime/os-common.c index fa845bf..698d0c9 100644 --- a/src/runtime/os-common.c +++ b/src/runtime/os-common.c @@ -75,7 +75,7 @@ os_get_errno(void) } -#if defined(LISP_FEATURE_SB_THREAD) && !defined(CANNOT_USE_POSIX_SEM_T) +#if defined(LISP_FEATURE_SB_THREAD) && (!defined(CANNOT_USE_POSIX_SEM_T) || defined(LISP_FEATURE_WIN32)) void os_sem_init(os_sem_t *sem, unsigned int value) diff --git a/src/runtime/parse.c b/src/runtime/parse.c index beedc29..66292af 100644 --- a/src/runtime/parse.c +++ b/src/runtime/parse.c @@ -14,9 +14,13 @@ #include <stdio.h> #include <stdlib.h> #include <ctype.h> -#include <signal.h> #include "sbcl.h" +#if defined(LISP_FEATURE_WIN32) && defined(LISP_FEATURE_SB_THREAD) +#include "pthreads_win32.h" +#else +#include <signal.h> +#endif #include "runtime.h" #if defined(LISP_FEATURE_SB_LDB) diff --git a/src/runtime/print.c b/src/runtime/print.c index da8744e..67a7c20 100644 --- a/src/runtime/print.c +++ b/src/runtime/print.c @@ -215,6 +215,9 @@ fshow_fun(void __attribute__((__unused__)) *ignored, #ifdef LISP_FEATURE_GENCGC #include "gencgc-alloc-region.h" /* genesis/thread.h needs this */ #endif +#if defined(LISP_FEATURE_WIN32) +# include "win32-thread-private-events.h" /* genesis/thread.h needs this */ +#endif #include "genesis/static-symbols.h" #include "genesis/primitive-objects.h" #include "genesis/static-symbols.h" diff --git 
a/src/runtime/pthreads_win32.c b/src/runtime/pthreads_win32.c new file mode 100644 index 0000000..c307da2 --- /dev/null +++ b/src/runtime/pthreads_win32.c @@ -0,0 +1,1582 @@ +#include "sbcl.h" +#ifdef LISP_FEATURE_SB_THREAD /* entire file */ + +#define PTHREAD_INTERNALS +#include "pthreads_win32.h" +#include <stdlib.h> +#include <stdio.h> +#include <time.h> +#include <sys/time.h> + +#ifdef PTHREAD_DEBUG_OUTPUT +#define pthshow(fmt,...) \ + do { \ + fprintf(stderr,fmt "\n", __VA_ARGS__); \ + fflush(stderr); \ + } while (0) + +#define DEBUG_OWN(cs) do {(cs)->owner=pthread_self(); } while(0) +#define DEBUG_RELEASE(cs) do {(cs)->owner=0;} while(0) + +#else +#define pthshow(fmt,...) do {} while (0) +#define DEBUG_OWN(cs) do {} while(0) +#define DEBUG_RELEASE(cs) do {} while(0) +#endif + + +struct freelist_cell { + struct freelist_cell * next; + void* data; +}; + +struct freelist { + void* (*create_fn)(); + pthread_mutex_t lock; + struct freelist_cell * empty; + struct freelist_cell * full; + unsigned int count; +}; + +#define FREELIST_INITIALIZER(create_fn) \ + { \ + event_create, PTHREAD_MUTEX_INITIALIZER, \ + NULL, NULL, 0 \ + } \ + + +static void* freelist_get(struct freelist *fl) +{ + void* result = NULL; + if (fl->full) { + pthread_mutex_lock(&fl->lock); + if (fl->full) { + struct freelist_cell *cell = fl->full; + fl->full = cell->next; + result = cell->data; + cell->next = fl->empty; + fl->empty = cell; + } + pthread_mutex_unlock(&fl->lock); + } + if (!result) { + result = fl->create_fn(); + } + return result; +} + +static void freelist_return(struct freelist *fl, void*data) +{ + struct freelist_cell* cell = NULL; + if (fl->empty) { + pthread_mutex_lock(&fl->lock); + if (fl->empty) { + cell = fl->empty; + fl->empty = cell->next; + goto add_locked; + } + pthread_mutex_unlock(&fl->lock); + } + if (!cell) { + int i,n=32; + cell = malloc(sizeof(*cell)*n); + for (i=0; i<(n-1); ++i) + cell[i].next = &cell[i+1]; + cell[i].next = NULL; + } + + 
pthread_mutex_lock(&fl->lock); + ++fl->count; + add_locked: + cell->data = data; + cell->next = fl->full; + fl->full = cell; + pthread_mutex_unlock(&fl->lock); +} + +int pthread_attr_init(pthread_attr_t *attr) +{ + attr->stack_size = 0; + return 0; +} + +int pthread_attr_destroy(pthread_attr_t *attr) +{ + return 0; +} + +int pthread_attr_setstack(pthread_attr_t *attr, void *stackaddr, size_t stacksize) +{ + fprintf(stderr, "pthread_attr_setstack called\n"); + ExitProcess(1); + return 0; +} + +int pthread_attr_setstacksize(pthread_attr_t *attr, size_t stacksize) +{ + attr->stack_size = stacksize; + return 0; +} + + +typedef unsigned char boolean; + +/* TLS management internals */ + +static DWORD thread_self_tls_index; + +static void (*tls_destructors[PTHREAD_KEYS_MAX])(void*); +static boolean tls_used[PTHREAD_KEYS_MAX]; +static pthread_key_t tls_max_used_key; +static pthread_mutex_t thread_key_lock = PTHREAD_MUTEX_INITIALIZER; +static void tls_call_destructors(); +static pthread_t tls_impersonate(pthread_t other) { + pthread_t old = pthread_self(); + TlsSetValue(thread_self_tls_index,other); + return old; +} + +static void do_nothing() {} +/* Fiber context hooks */ +void (*pthread_save_context_hook)() = do_nothing; +void (*pthread_restore_context_hook)() = do_nothing; + +/* Some parts of pthread_np API provide access to Windows NT Fibers + (cooperatively scheduled coroutines). Each fiber is wrapped in its + own pthread. + + Fibers may be entered by different threads during their lifetime, + i.e. they are orthogonal to threads. + + Contrary to the raw NT Fibers API, we will distinguish two kinds of + objects: fibers-created-as-fibers and any other thing (thread that + is not a fiber, thread converted to fiber, system thread + noticed). Consequently, though there is no "main fiber" in NT, + there _is_ a main pthread for each (wrapped) system thread, living + or dying with this system thread. 
It may be converted to fiber, but + its "fiberness" is incidental, only to be able to switch into + another fibers or create them. + + Any fiber that is currently running belongs to some thread + (fiber-created-as-thread, to be exact). Call it FCAT group. + + [1] Entrance lock: prevent double entry. + + [2] Suspend for fibers -> "try locking entrance lock; if failed, do + real thread suspend" + + [3] Resume for fibers -> two strategies depending on what [2] done. + + [4] Exit/death for fibers -> switch to its FCAT group. + + [2],[3],[4] doesn't apply to threads-converted-to-fibers: full + stop/resume is done on them if there is no cooperatively-accessed + published context (of which see below). +*/ +void pthread_np_suspend(pthread_t thread) +{ + pthread_mutex_lock(&thread->fiber_lock); + if (thread->fiber_group) { + CONTEXT context; + SuspendThread(thread->fiber_group->handle); + context.ContextFlags = CONTEXT_FULL; + GetThreadContext(thread->fiber_group->handle, &context); + } +} + +/* Momentary suspend/getcontext/resume without locking or preventing + fiber reentrance. This call is for asymmetric synchronization, + ensuring that the thread sees global state before doing any + globally visible stores. +*/ +void pthread_np_serialize(pthread_t thread) +{ + CONTEXT winctx; + winctx.ContextFlags = CONTEXT_INTEGER; + if (!thread->created_as_fiber) { + SuspendThread(thread->handle); + GetThreadContext(thread->handle,&winctx); + ResumeThread(thread->handle); + } +} + +int pthread_np_get_thread_context(pthread_t thread, CONTEXT* context) +{ + context->ContextFlags = CONTEXT_FULL; + return thread->fiber_group && + GetThreadContext(thread->fiber_group->handle, context) != 0; +} + +void pthread_np_resume(pthread_t thread) +{ + HANDLE host_thread = thread->fiber_group ? thread->fiber_group->handle : NULL; + /* Unlock first, _then_ resume, or we may end up accessing freed + pthread structure (e.g. 
at startup with CREATE_SUSPENDED) */ + pthread_mutex_unlock(&thread->fiber_lock); + if (host_thread) { + ResumeThread(host_thread); + } +} + +/* FIXME shouldn't be used. */ +void pthread_np_request_interruption(pthread_t thread) +{ + if (thread->waiting_cond) { + pthread_cond_broadcast(thread->waiting_cond); + } +} + +/* Thread identity, as much as pthreads are concerned, is determined + by pthread_t structure that is stored in TLS slot + (thread_self_tls_index). This slot is reassigned when fibers are + switched with pthread_np API. + + Two reasons for not using fiber-local storage for this purpose: (1) + Fls is too young: all other things work with Win2000, it requires + WinXP; (2) this implementation works also with threads that aren't + fibers, and it's a good thing. + + There is one more case, besides fiber switching, when pthread_self + identity migrates between system threads: for non-main system + thread that is not [pthread_create]d, thread-specific data + destructors run in a thread from a system thread pool, after the + original thread dies. In order to provide compatibility with + classic pthread TSD, the system pool thread acquires dead thread's + identity for the duration of destructor calls. +*/ +pthread_t pthread_self() +{ + return (pthread_t)TlsGetValue(thread_self_tls_index); +} + +const char * state_to_str(pthread_thread_state state) +{ + switch (state) { + case pthread_state_running: return "running"; + case pthread_state_finished: return "finished"; + case pthread_state_joined: return "joined"; + default: return "unknown"; + } +} + +/* Two kinds of threads (or fibers) are supported: (1) created by + pthread_create, (2) created independently and noticed by + pthread_np_notice_thread. The first kind is running a predefined + thread function or fiber function; thread_or_fiber_function + incorporates whatever they have in common. 
+*/ +static void thread_or_fiber_function(pthread_t self) +{ + pthread_t prev = tls_impersonate(self); + void* arg = self->arg; + pthread_fn fn = self->start_routine; + + if (prev) { + pthread_mutex_lock(&prev->fiber_lock); + prev->fiber_group = NULL; + /* Previous fiber, that started us, had assigned our + fiber_group. Now we clear its fiber_group. */ + pthread_mutex_unlock(&prev->fiber_lock); + } + self->retval = fn(arg); + pthread_mutex_lock(&self->lock); + self->state = pthread_state_finished; + pthread_cond_broadcast(&self->cond); + while (!self->detached && self->state != pthread_state_joined) { + if (self->created_as_fiber) { + pthread_mutex_unlock(&self->lock); + pthread_np_switch_to_fiber(self->fiber_group); + pthread_mutex_lock(&self->lock); + } else { + pthread_cond_wait(&self->cond, &self->lock); + } + } + pthread_mutex_unlock(&self->lock); + pthread_mutex_destroy(&self->lock); + pthread_mutex_destroy(&self->fiber_lock); + pthread_cond_destroy(&self->cond); + tls_call_destructors(); +} + +/* Thread function for [pthread_create]d threads. Thread may become a + fiber later, but (as stated above) it isn't supposed to be + reattached to other system thread, even after it happens. +*/ +DWORD WINAPI Thread_Function(LPVOID param) +{ + pthread_t self = (pthread_t) param; + + self->teb = NtCurrentTeb(); + thread_or_fiber_function(param); + CloseHandle(self->handle); + { + void* fiber = self->fiber; + free(self); + if (fiber) { + /* If thread was converted to fiber, deleting the fiber from + itself exits the thread. There are some rumors on possible + memory leaks if we just ExitThread or return here, hence the + statement below. However, no memory leaks on bare ExitThread + were observed yet. */ + DeleteFiber(GetCurrentFiber()); + } + } + return 0; +} + +/* Fiber can't delete itself without exiting the current thread + simultaneously. We arrange for some other fiber calling + fiber_destructor when fiber dies but doesn't want to terminate its + thread. 
*/ +static void fiber_destructor(void* fiber) { DeleteFiber(fiber); } + +VOID CALLBACK Fiber_Function(LPVOID param) +{ + pthread_t self = (pthread_t) param; + thread_or_fiber_function(param); + { + /* fiber_group is a main thread into which we are to call */ + pthread_t group = self->fiber_group; + free(self); + /* pthread_np_run_in_fiber (see below) normally switches back to + caller. Nullify our identity, so it knows there is nothing to + switch to, and continues running instead. */ + tls_impersonate(NULL); + if (group) { + /* Every running [pthread_create]d fiber runs in some thread + that has its own pthread_self identity (that was created as + thread and later converted to fiber). `group' field of + running fiber always points to that other pthread. + + Now switch to our group ("current master fiber created as + thread"), asking it to delete our (OS) fiber data with + fiber_destructor. */ + pthread_np_run_in_fiber(group, fiber_destructor, GetCurrentFiber()); + } + /* Within current pthread API we never end up here. + + BTW, if fibers are ever pooled, to avoid stack space reallocation + etc, jumping to the beginning of Fiber_Function should be the + thing to do here. */ + DeleteFiber(GetCurrentFiber()); /* Exits. See Thread_Function for + explanation -- why not + ExitThread. */ + } +} + +/* Signals */ +struct sigaction signal_handlers[NSIG]; + +/* Never called for now */ +int sigaction(int signum, const struct sigaction* act, struct sigaction* oldact) +{ + struct sigaction newact = *act; + if (oldact) + *oldact = signal_handlers[signum]; + if (!(newact.sa_flags & SA_SIGINFO)) { + newact.sa_sigaction = (typeof(newact.sa_sigaction))newact.sa_handler; + } + signal_handlers[signum] = newact; + return 0; +} + +/* Create thread or fiber, depending on current thread's "fiber + factory mode". In the latter case, switch into newly-created fiber + immediately. 
+*/ +int pthread_create(pthread_t *thread, const pthread_attr_t *attr, + void *(*start_routine) (void *), void *arg) +{ + pthread_t pth = (pthread_t)calloc(sizeof(pthread_thread),1); + pthread_t self = pthread_self(); + int i; + HANDLE createdThread = NULL; + + if (self && self->fiber_factory) { + pth->fiber = CreateFiber (attr ? attr->stack_size : 0, Fiber_Function, pth); + if (!pth->fiber) return 1; + pth->created_as_fiber = 1; + /* Has no fiber-group until someone enters it (we will) */ + } else { + createdThread = CreateThread(NULL, attr ? attr->stack_size : 0, + Thread_Function, pth, CREATE_SUSPENDED, NULL); + if (!createdThread) return 1; + /* FCAT is its own fiber-group [initially] */ + pth->fiber_group = pth; + pth->handle = createdThread; + } + pth->start_routine = start_routine; + pth->arg = arg; + if (self) { + pth->blocked_signal_set = self->blocked_signal_set; + } else { + sigemptyset(&pth->blocked_signal_set); + } + pth->state = pthread_state_running; + pthread_mutex_init(&pth->lock, NULL); + pthread_mutex_init(&pth->fiber_lock, NULL); + pthread_cond_init(&pth->cond, NULL); + pth->detached = 0; + if (thread) *thread = pth; + if (pth->fiber) { + pthread_np_switch_to_fiber(pth); + } else { + /* Resume will unlock, so we lock here */ + pthread_mutex_lock(&pth->fiber_lock); + pthread_np_resume(pth); + } + return 0; +} + +int pthread_equal(pthread_t thread1, pthread_t thread2) +{ + return thread1 == thread2; +} + +int pthread_detach(pthread_t thread) +{ + int retval = 0; + pthread_mutex_lock(&thread->lock); + thread->detached = 1; + pthread_cond_broadcast(&thread->cond); + pthread_mutex_unlock(&thread->lock); + return retval; +} + +int pthread_join(pthread_t thread, void **retval) +{ + int fiberp = thread->created_as_fiber; + pthread_mutex_lock(&thread->lock); + while (thread->state != pthread_state_finished) { + if (fiberp) { + /* just trying */ + pthread_mutex_unlock(&thread->lock); + pthread_np_switch_to_fiber(thread); + 
pthread_mutex_lock(&thread->lock); + } else { + pthread_cond_wait(&thread->cond, &thread->lock); + } + } + thread->state = pthread_state_joined; + pthread_cond_broadcast(&thread->cond); + if (retval) + *retval = thread->retval; + pthread_mutex_unlock(&thread->lock); + if (fiberp) + pthread_np_switch_to_fiber(thread); + return 0; +} + +/* We manage our own TSD instead of relying on system TLS for anything + other than pthread identity itself. Reasons: (1) Windows NT TLS + slots are expensive, (2) pthread identity migration requires only + one TLS slot assignment, instead of massive copying. */ +int pthread_key_create(pthread_key_t *key, void (*destructor)(void*)) +{ + pthread_key_t index; + boolean success = 0; + pthread_mutex_lock(&thread_key_lock); + for (index = 0; index < PTHREAD_KEYS_MAX; ++index) { + if (!tls_used[index]) { + if (tls_max_used_key<index) + tls_max_used_key = index; + tls_destructors[index] = destructor; + tls_used[index] = 1; + success = 1; + break; + } + } + pthread_mutex_unlock(&thread_key_lock); + + if (success) { + *key = index; + return 0; + } else { + return 1; + } +} + +int pthread_key_delete(pthread_key_t key) +{ + /* tls_used flag is not a machine word. Let's lock, as there is no + atomic guarantee even on x86. */ + pthread_mutex_lock(&thread_key_lock); + tls_destructors[key] = 0; + /* No memory barrier here: application is responsible for proper + call sequence, and having the key around at this point is an + official UB. 
*/ + tls_used[key] = 0; + pthread_mutex_unlock(&thread_key_lock); + return 0; +} + +void __attribute__((sysv_abi)) *pthread_getspecific(pthread_key_t key) +{ + return pthread_self()->specifics[key]; +} + +/* Internal function calling destructors for current pthread */ +static void tls_call_destructors() +{ + pthread_key_t key; + int i; + int called; + + for (i = 0; i<PTHREAD_DESTRUCTOR_ITERATIONS; ++i) { + called = 0; + for (key = 0; key<=tls_max_used_key; ++key) { + void *cell = pthread_getspecific(key); + pthread_setspecific(key,NULL); + if (cell && tls_destructors[key]) { + (tls_destructors[key])(cell); + called = 1; + } + } + if (!called) + break; + } +} + +pthread_mutex_t once_mutex = PTHREAD_MUTEX_INITIALIZER; + +int pthread_once(pthread_once_t *once_control, void (*init_routine)(void)) +{ + if (PTHREAD_ONCE_INIT == *once_control) { + pthread_mutex_lock(&once_mutex); + if (PTHREAD_ONCE_INIT == *once_control) { + init_routine(); + *once_control = 42; + } + pthread_mutex_unlock(&once_mutex); + } + return 0; +} + +/* TODO call signal handlers */ +int pthread_sigmask(int how, const sigset_t *set, sigset_t *oldset) +{ + pthread_t self = pthread_self(); + if (oldset) + *oldset = self->blocked_signal_set; + if (set) { + switch (how) { + case SIG_BLOCK: + self->blocked_signal_set |= *set; + break; + case SIG_UNBLOCK: + self->blocked_signal_set &= ~(*set); + break; + case SIG_SETMASK: + self->blocked_signal_set = *set; + break; + } + } + return 0; +} + +pthread_mutex_t mutex_init_lock; + +int pthread_mutex_init(pthread_mutex_t * mutex, const pthread_mutexattr_t * attr) +{ + *mutex = (struct _pthread_mutex_info*)malloc(sizeof(struct _pthread_mutex_info)); + InitializeCriticalSection(&(*mutex)->cs); + (*mutex)->file = " (free) "; + return 0; +} + +int pthread_mutexattr_init(pthread_mutexattr_t* attr) +{ + return 0; +} +int pthread_mutexattr_destroy(pthread_mutexattr_t* attr) +{ + return 0; +} + +int pthread_mutexattr_settype(pthread_mutexattr_t* attr,int mutex_type) +{ 
+ return 0; +} + +int pthread_mutex_destroy(pthread_mutex_t *mutex) +{ + if (*mutex != PTHREAD_MUTEX_INITIALIZER) { + pthread_np_assert_live_mutex(mutex,"destroy"); + DeleteCriticalSection(&(*mutex)->cs); + free(*mutex); + *mutex = &DEAD_MUTEX; + } + return 0; +} + +/* Add pending signal to (other) thread */ +void pthread_np_add_pending_signal(pthread_t thread, int signum) +{ + /* See __sync_fetch_and_or() for gcc 4.4, at least. As some + people are still using gcc 3.x, I prefer to do this in asm. + + For win64 we'll HAVE to rewrite it. __sync_fetch_and_or() seems + to be a rational choice -- there are plenty of GCCisms in SBCL + anyway. + */ + sigset_t to_add = 1<<signum; + asm("lock orl %1,%0":"=m"(thread->pending_signal_set):"r"(to_add)); +} + +static void futex_interrupt(pthread_t thread); + +/* This pthread_kill doesn't do anything to notify target pthread of a + * new pending signal. + * + * DFL: ... or so the original comment claimed, but that was before + * futexes. Now that we wake up futexes, it's not entirely accurate + * anymore, is it? */ +int pthread_kill(pthread_t thread, int signum) +{ + pthread_np_add_pending_signal(thread,signum); + futex_interrupt(thread); + return 0; +} + +void pthread_np_remove_pending_signal(pthread_t thread, int signum) +{ + sigset_t to_and = ~(1<<signum); + asm("lock andl %1,%0":"=m"(thread->pending_signal_set):"r"(to_and)); +} + +sigset_t pthread_np_other_thread_sigpending(pthread_t thread) +{ + return + InterlockedCompareExchange((volatile LONG*)&thread->pending_signal_set, + 0, 0); +} + +/* Mutex implementation uses CRITICAL_SECTIONs. Somethings to keep in + mind: (1) uncontested locking is cheap; (2) long wait on a busy + lock causes exception, so it should never be attempted; (3) those + mutexes are recursive; (4) one thread locks, the other unlocks -> + the next one hangs. 
*/ +int pthread_mutex_lock(pthread_mutex_t *mutex) +{ + pthread_np_assert_live_mutex(mutex,"lock"); + if (*mutex == PTHREAD_MUTEX_INITIALIZER) { + pthread_mutex_lock(&mutex_init_lock); + if (*mutex == PTHREAD_MUTEX_INITIALIZER) { + pthread_mutex_init(mutex, NULL); + } + pthread_mutex_unlock(&mutex_init_lock); + } + EnterCriticalSection(&(*mutex)->cs); + DEBUG_OWN(*mutex); + return 0; +} + +int pthread_mutex_trylock(pthread_mutex_t *mutex) +{ + pthread_np_assert_live_mutex(mutex,"trylock"); + if (*mutex == PTHREAD_MUTEX_INITIALIZER) { + pthread_mutex_lock(&mutex_init_lock); + if (*mutex == PTHREAD_MUTEX_INITIALIZER) { + pthread_mutex_init(mutex, NULL); + } + pthread_mutex_unlock(&mutex_init_lock); + } + if (TryEnterCriticalSection(&(*mutex)->cs)) { + DEBUG_OWN(*mutex); + return 0; + } + else + return EBUSY; +} + +/* Versions of lock/trylock useful for debugging. Our header file + conditionally redefines lock/trylock to call them. */ + +int pthread_mutex_lock_annotate_np(pthread_mutex_t *mutex, const char* file, int line) +{ + int contention = 0; + pthread_np_assert_live_mutex(mutex,"lock"); + if (*mutex == PTHREAD_MUTEX_INITIALIZER) { + pthread_mutex_lock(&mutex_init_lock); + if (*mutex == PTHREAD_MUTEX_INITIALIZER) { + pthread_mutex_init(mutex, NULL); + pthshow("Mutex #x%p: automatic initialization; #x%p %s +%d", + mutex, *mutex, + file, line); + } + pthread_mutex_unlock(&mutex_init_lock); + } + if ((*mutex)->owner) { + pthshow("Mutex #x%p -> #x%p: contention; owned by #x%p, wanted by #x%p", + mutex, *mutex, + (*mutex)->owner, + pthread_self()); + pthshow("Mutex #x%p -> #x%p: contention notes: old %s +%d, new %s +%d", + mutex, *mutex, + (*mutex)->file,(*mutex)->line, file, line); + contention = 1; + } + EnterCriticalSection(&(*mutex)->cs); + if (contention) { + pthshow("Mutex #x%p -> #x%p: contention end; left by #x%p, taken by #x%p", + mutex, *mutex, + (*mutex)->owner, + pthread_self()); + pthshow("Mutex #x%p -> #x%p: contention notes: old %s +%d, new %s +%d", + 
mutex, *mutex, + (*mutex)->file,(*mutex)->line, file, line); + } + (*mutex)->owner = pthread_self(); + (*mutex)->file = file; + (*mutex)->line = line; + return 0; +} + +int pthread_mutex_trylock_annotate_np(pthread_mutex_t *mutex, const char* file, int line) +{ + int contention = 0; + pthread_np_assert_live_mutex(mutex,"trylock"); + if (*mutex == PTHREAD_MUTEX_INITIALIZER) { + pthread_mutex_lock(&mutex_init_lock); + if (*mutex == PTHREAD_MUTEX_INITIALIZER) { + pthread_mutex_init(mutex, NULL); + } + pthread_mutex_unlock(&mutex_init_lock); + } + if ((*mutex)->owner) { + pthshow("Mutex #x%p -> #x%p: tried contention; owned by #x%p, wanted by #x%p", + mutex, *mutex, + (*mutex)->owner, + pthread_self()); + pthshow("Mutex #x%p -> #x%p: contention notes: old %s +%d, new %s +%d", + mutex, *mutex, + (*mutex)->file,(*mutex)->line, file, line); + contention = 1; + } + if (TryEnterCriticalSection(&(*mutex)->cs)) { + if (contention) { + pthshow("Mutex #x%p -> #x%p: contention end; left by #x%p, taken by #x%p", + mutex, *mutex, + (*mutex)->owner, + pthread_self()); + pthshow("Mutex #x%p -> #x%p: contention notes: old %s +%d, new %s +%d", + mutex, *mutex, + (*mutex)->file,(*mutex)->line, file, line); + } + (*mutex)->owner = pthread_self(); + (*mutex)->file = file; + (*mutex)->line = line; + return 0; + } + else + return EBUSY; +} + +int pthread_mutex_unlock(pthread_mutex_t *mutex) +{ + /* Owner is for debugging only; NB if mutex is used recursively, + owner field will lie. */ + pthread_np_assert_live_mutex(mutex,"unlock"); + DEBUG_RELEASE(*mutex); + LeaveCriticalSection(&(*mutex)->cs); + return 0; +} + +/* Condition variables implemented with events and wakeup queues. */ + +/* Thread-local wakeup events are kept in TSD to avoid kernel object + creation on each call to pthread_cond_[timed]wait */ +static pthread_key_t cv_event_key; + +/* .info field in wakeup record is an "opportunistic" indicator that + wakeup has happened. 
On timeout from WaitForSingleObject, thread + doesn't know (1) whether to reset event, (2) whether to (try) to + find and unlink wakeup record. Let's let it know (of course, + it will know for sure only under cv_wakeup_lock). */ + +#define WAKEUP_WAITING_NOTIMEOUT 0 +#define WAKEUP_WAITING_TIMEOUT 4 + +#define WAKEUP_HAPPENED 1 +#define WAKEUP_BY_INTERRUPT 2 + +static void* event_create() +{ + return (void*)CreateEvent(NULL,FALSE,FALSE,NULL); +} + +static struct freelist event_freelist = FREELIST_INITIALIZER(event_create); + + +unsigned int pthread_free_event_pool_size() +{ + return event_freelist.count; +} + +static HANDLE fe_get_event() +{ + return (HANDLE)freelist_get(&event_freelist); +} + +static void fe_return_event(HANDLE handle) +{ + freelist_return(&event_freelist, (void*)handle); +} + +static void cv_event_destroy(void* event) +{ + CloseHandle((HANDLE)event); +} + +static HANDLE cv_default_event_get_fn() +{ + HANDLE event = pthread_getspecific(cv_event_key); + if (!event) { + event = CreateEvent(NULL, FALSE, FALSE, NULL); + pthread_setspecific(cv_event_key, event); + } else { + /* ResetEvent(event); used to be here. Let's try without. It's + safe in pthread_cond_wait: if WaitForSingleObjectEx ever + returns, event is reset automatically, and the wakeup queue item + is removed by the signaller under wakeup_lock. + + pthread_cond_timedwait should reset the event if + cv_wakeup_remove failed to find its wakeup record, otherwise + it's safe too. */ + } + return event; +} + +static void cv_default_event_return_fn(HANDLE event) +{ + /* ResetEvent(event); could be here as well (and used to be). + Avoiding syscalls makes sense, however. 
*/ +} + +static pthread_condattr_t cv_default_attr = { + 0, /* alertable */ + fe_get_event, + fe_return_event, + /* cv_default_event_get_fn, /\* get_fn *\/ */ + /* cv_default_event_return_fn /\* return_fn *\/ */ +}; + +int pthread_cond_init(pthread_cond_t * cv, const pthread_condattr_t * attr) +{ + if (!attr) + attr = &cv_default_attr; + pthread_mutex_init(&cv->wakeup_lock, NULL); + cv->first_wakeup = NULL; + cv->last_wakeup = NULL; + cv->alertable = attr->alertable; + cv->get_fn = attr->get_fn; + cv->return_fn = attr->return_fn; + return 0; +} + +int pthread_condattr_init(pthread_condattr_t *attr) +{ + *attr = cv_default_attr; + return 0; +} + +int pthread_condattr_destroy(pthread_condattr_t *attr) +{ + return 0; +} +int pthread_condattr_setevent_np(pthread_condattr_t *attr, + cv_event_get_fn get_fn, cv_event_return_fn ret_fn) +{ + attr->get_fn = get_fn ? get_fn : fe_get_event;// cv_default_event_get_fn; + attr->return_fn = ret_fn ? ret_fn : fe_return_event; // cv_default_event_return_fn; + return 0; +} + +int pthread_cond_destroy(pthread_cond_t *cv) +{ + pthread_mutex_destroy(&cv->wakeup_lock); + return 0; +} + +int pthread_cond_broadcast(pthread_cond_t *cv) +{ + int count = 0; + + HANDLE postponed[128]; + int npostponed = 0,i; + + /* No strict requirements to memory visibility model, because of + mutex unlock around waiting. 
*/ + if (!cv->first_wakeup) + return 0; + pthread_mutex_lock(&cv->wakeup_lock); + while (cv->first_wakeup) + { + struct thread_wakeup * w = cv->first_wakeup; + HANDLE waitevent = w->event; + cv->first_wakeup = w->next; + w->info = WAKEUP_HAPPENED; + postponed[npostponed++] = waitevent; + if (/* w->info == WAKEUP_WAITING_TIMEOUT || */ npostponed == + sizeof(postponed)/sizeof(postponed[0])) { + for (i=0; i<npostponed; ++i) + SetEvent(postponed[i]); + npostponed = 0; + } + ++count; + } + cv->last_wakeup = NULL; + pthread_mutex_unlock(&cv->wakeup_lock); + for (i=0; i<npostponed; ++i) + SetEvent(postponed[i]); + return 0; +} + +int pthread_cond_signal(pthread_cond_t *cv) +{ + struct thread_wakeup * w; + /* No strict requirements to memory visibility model, because of + mutex unlock around waiting. */ + if (!cv->first_wakeup) + return 0; + pthread_mutex_lock(&cv->wakeup_lock); + w = cv->first_wakeup; + if (w) { + HANDLE waitevent = w->event; + cv->first_wakeup = w->next; + if (!cv->first_wakeup) + cv->last_wakeup = NULL; + w->info = WAKEUP_HAPPENED; + SetEvent(waitevent); + } + pthread_mutex_unlock(&cv->wakeup_lock); + return 0; +} + +/* Return value is used for futexes: 0=ok, 1 on unexpected word change. 
*/ +int cv_wakeup_add(struct pthread_cond_t* cv, struct thread_wakeup* w) +{ + HANDLE event; + w->next = NULL; + pthread_mutex_lock(&cv->wakeup_lock); + if (w->uaddr) { + if (w->uval != *w->uaddr) { + pthread_mutex_unlock(&cv->wakeup_lock); + return 1; + } + pthread_self()->futex_wakeup = w; + } + event = cv->get_fn(); + w->event = event; + if (cv->last_wakeup == w) { + fprintf(stderr, "cv->last_wakeup == w\n"); + fflush(stderr); + ExitProcess(0); + } + if (cv->last_wakeup != NULL) + { + cv->last_wakeup->next = w; + cv->last_wakeup = w; + } + else + { + cv->first_wakeup = w; + cv->last_wakeup = w; + } + pthread_mutex_unlock(&cv->wakeup_lock); + return 0; +} + +/* Return true if wakeup found, false if missing */ +int cv_wakeup_remove(struct pthread_cond_t* cv, struct thread_wakeup* w) +{ + int result = 0; + if (w->info == WAKEUP_HAPPENED || w->info == WAKEUP_BY_INTERRUPT) + goto finish; + pthread_mutex_lock(&cv->wakeup_lock); + { + if (w->info == WAKEUP_HAPPENED || w->info == WAKEUP_BY_INTERRUPT) + goto unlock; + if (cv->first_wakeup == w) { + cv->first_wakeup = w->next; + if (cv->last_wakeup == w) + cv->last_wakeup = NULL; + result = 1; + } else { + struct thread_wakeup * prev = cv->first_wakeup; + while (prev && prev->next != w) + prev = prev->next; + if (!prev) { + goto unlock; + } + prev->next = w->next; + if (cv->last_wakeup == w) + cv->last_wakeup = prev; + result = 1; + } + } + unlock: + pthread_mutex_unlock(&cv->wakeup_lock); + finish: + return result; +} + + +int pthread_cond_wait(pthread_cond_t * cv, pthread_mutex_t * cs) +{ + struct thread_wakeup w; + w.uaddr = 0; + w.info = WAKEUP_WAITING_NOTIMEOUT; + cv_wakeup_add(cv, &w); + if (cv->last_wakeup->next == cv->last_wakeup) { + pthread_np_lose(5,"cv->last_wakeup->next == cv->last_wakeup\n"); + } + if (cv->last_wakeup->next != NULL) { + pthread_np_lose(5,"cv->last_wakeup->next == cv->last_wakeup\n"); + } + pthread_self()->waiting_cond = cv; + DEBUG_RELEASE(*cs); + pthread_mutex_unlock(cs); + do { + if 
(cv->alertable) { + while (WaitForSingleObjectEx(w.event, INFINITE, TRUE) == WAIT_IO_COMPLETION); + } else { + WaitForSingleObject(w.event, INFINITE); + } + } while (w.info == WAKEUP_WAITING_NOTIMEOUT); + pthread_self()->waiting_cond = NULL; + /* Event is signalled once, wakeup is dequeued by signaller. */ + cv->return_fn(w.event); + pthread_mutex_lock(cs); + DEBUG_OWN(*cs); + return 0; +} + +int pthread_cond_timedwait(pthread_cond_t * cv, pthread_mutex_t * cs, + const struct timespec * abstime) +{ + DWORD rv; + struct thread_wakeup w; + pthread_t self = pthread_self(); + + w.info = WAKEUP_WAITING_TIMEOUT; + w.uaddr = 0; + cv_wakeup_add(cv, &w); + if (cv->last_wakeup->next == cv->last_wakeup) { + fprintf(stderr, "cv->last_wakeup->next == cv->last_wakeup\n"); + ExitProcess(0); + } + self->waiting_cond = cv; + DEBUG_RELEASE(*cs); + /* barrier (release); waiting_cond globally visible */ + pthread_mutex_unlock(cs); + { + struct timeval cur_tm; + long sec, msec; + gettimeofday(&cur_tm, NULL); + sec = abstime->tv_sec - cur_tm.tv_sec; + msec = sec * 1000 + abstime->tv_nsec / 1000000 - cur_tm.tv_usec / 1000; + if (msec < 0) + msec = 0; + do { + if (cv->alertable) { + while ((rv = WaitForSingleObjectEx(w.event, msec, TRUE)) + == WAIT_IO_COMPLETION); + } else { + rv = WaitForSingleObject(w.event, msec); + } + } while (rv == WAIT_OBJECT_0 && w.info == WAKEUP_WAITING_TIMEOUT); + } + self->waiting_cond = NULL; + + if (rv == WAIT_TIMEOUT) { + if (!cv_wakeup_remove(cv, &w)) { + /* Someone removed our wakeup record: though we got a timeout, + event was (will be) signalled before we are here. + Consume this wakeup. */ + WaitForSingleObject(w.event, INFINITE); + } + } + cv->return_fn(w.event); + pthread_mutex_lock(cs); + DEBUG_OWN(*cs); + if (rv == WAIT_TIMEOUT) + return ETIMEDOUT; + else + return 0; +} + +int sched_yield() +{ + /* http://stackoverflow.com/questions/1383943/switchtothread-vs-sleep1 + SwitchToThread(); was here. Unsure what's better for us, just trying.. 
*/ + + if(!SwitchToThread()) + Sleep(0); + return 0; +} + +void pthread_lock_structures() +{ + pthread_mutex_lock(&mutex_init_lock); +} + +void pthread_unlock_structures() +{ + pthread_mutex_unlock(&mutex_init_lock); +} + +static int pthread_initialized = 0; + +static pthread_cond_t futex_pseudo_cond; + +void pthreads_win32_init() +{ + if (!pthread_initialized) { + thread_self_tls_index = TlsAlloc(); + pthread_mutex_init(&mutex_init_lock, NULL); + pthread_np_notice_thread(); + pthread_key_create(&cv_event_key,cv_event_destroy); + pthread_cond_init(&futex_pseudo_cond, NULL); + pthread_initialized = 1; + } +}... [truncated message content] |