;;; Unix waitt & process objects for scsh ;;; Copyright (c) 1993, 1994, 1995 by Olin Shivers. ;;; This is a GC'd abstraction for Unix process id's. ; ;; The problem with Unix pids is (a) they clutter up the kernel ;;; process table until you wait(2) them, and (b) you can only ;;; wait(2) them once. Scsh's process objects are similar, but ;;; allow the storage to be allocated in the scsh address space, ;;; and out of the kernel process table, and they can be waited on ;;; multiple times. ;;; Process objects ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; (define-record proc ; A process object pid ; Proc's pid. (finished? #f) ; Running, stopped, done (status (make-placeholder)) ; The cached exit status of the process (zombie #t) ; Misnomer. Whether or not the process has ; (not) been waited on. ;; Make proc objects print like #{proc 2318}. ((disclose p) (list "proc" (proc:pid p) (proc:finished? p)))) ;; Unfortunately there is no way to specify the name of the constructor- ;; function in Olins define-record macro, so I had to do this... (define (make-procobj pid) (let ((procobj (make-proc pid))) (add-finalizer! procobj procobj-finalizer) procobj)) ;; Weak pointer tables. Much more efficient than populations. ;; Maps pids to processes. Unexited processes are strong pointers, exited ;; procs are weak pointers (to allow gc'ing). ;; ;; JMG: why ever unexited processes were strong pointer, this won't work ;; with (autoreap-policy 'late), since then gc waits for the strong pointer ;; until it wait(2)s and the strong pointer waits for wait(2) which is ;; nothing but a deadlock (define process-table (make-integer-table)) (make-reinitializer (lambda () (set! process-table (make-integer-table)))) (define process-table-lock (make-lock)) (define (process-table-ref n) (with-lock process-table-lock (lambda () (weak-table-ref process-table n)))) (define (process-table-set! n val) (with-lock process-table-lock (lambda () (weak-table-set! process-table n val)))) (define (process-table-delete-procobj! procobj) (with-lock process-table-lock (lambda () (if (eq? (weak-table-ref process-table (proc:pid procobj)) procobj) (weak-table-set! process-table (proc:pid procobj) #f))))) (define (maybe-pid->proc pid) (process-table-ref pid)) (define (pid->proc pid . maybe-probe?) (let ((probe? (:optional maybe-probe? #f))) (or (maybe-pid->proc pid) (case probe? ((#f) (error "Pid has no corresponding process object" pid)) ((create) (new-child-proc pid)) (else #f))))) ;;; Coerce pids and procs to procs. (define (->proc proc/pid) (cond ((proc? proc/pid) proc/pid) ((and (integer? proc/pid) (>= proc/pid 0)) (pid->proc proc/pid 'create)) (else (error "Illegal parameter" ->proc proc/pid)))) ;;; Is X a pid or a proc? (define (pid/proc? x) (or (proc? x) (and (integer? x) (>= x 0)))) ;;; Process reaping ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; ;;; "Reaping" a process means using wait(2) to move its exit status from the ;;; kernel's process table into scsh, thus cleaning up the kernel's process ;;; table and saving the value in a gc'd data structure, where it can be ;;; referenced multiple times. ;;; ;;; - Stopped processes are never reaped, only dead ones. (May change -df) ;;; ;;; - Stopped process status codes are never cached in proc objects, ;;; only status codes for dead processes. So you can wait for a ;;; dead process multiple times, but only once per process-stop. ;;; (May change -df) ;;; ;;; - Unfortunately, reaping a process loses the information specifying its ;;; process group, so if a process is reaped into scsh, it cannot be ;;; waited for by WAIT-PROCESS-GROUP. Notice that only dead processes are ;;; reaped, not suspended ones. Programs almost never use WAIT-PROCESS-GROUP ;;; to wait for dead processes, so this is not likely to be a problem. If ;;; it is, turn autoreaping off with (autoreap-policy #f). ;;; (This never worked right, and it might be wiped out completely -fd) ;;; ;;; - Reaping can be encouraged by calling (REAP-ZOMBIES). ;;; (autoreap-policy [new-policy]) ;;; Watch this area ;;; I'm really tired of opening everything (i.e. events) in scsh-level-0 ;;; this is here until someone (Olin !!!) cleans up the scsh modules (define next-sigevent (structure-ref sigevents next-sigevent)) (define most-recent-sigevent (structure-ref sigevents most-recent-sigevent)) (define *autoreap-policy* #f) ; Not exported from this module. (define (autoreap-policy . maybe-policy) (let ((old-policy *autoreap-policy*)) (if (pair? maybe-policy) (let ((new-policy (car maybe-policy))) (cond ((pair? (cdr maybe-policy)) (error "Too many args to autoreap-policy" maybe-policy)) ((not (memq new-policy '(early late #f))) (error "Illegal autoreap policy." new-policy)) (else (set! *autoreap-policy* new-policy) (cond ((eq? new-policy 'early) (set-sigchld-handler! early-sigchld-handler) (set-post/gc-handler! reap-need-reaping)) ((eq? new-policy 'late) (set-sigchld-handler! late-sigchld-handler) (set-post/gc-handler! reap-need-reaping)) (else (set-sigchld-handler! noauto-sigchld-handler) (set-post/gc-handler! (lambda () #f)))))))) old-policy)) ;;; we don't register the post/gc-handler until the first police change ;;; --- this made sense, but why? (define *post/gc-handler* (lambda () (error "*post/gc-handler* was not defined"))) (define (really-set-post/gc-handler! handler) (set! *post/gc-handler* handler)) (define (start-set-post/gc-handler! handler) (set! set-post/gc-handler! really-set-post/gc-handler!) (set-post/gc-handler! handler) (spawn (lambda () (let lp ((event (most-recent-sigevent))) (let ((next-event (next-sigevent event interrupt/post-gc))) (*post/gc-handler*) (lp next-event)))) '*post/gc-handler*-thread)) (define set-post/gc-handler! start-set-post/gc-handler!) (define (*sigchld-handler*) (early-sigchld-handler)) (define (set-sigchld-handler! handler) (set! *sigchld-handler* handler)) (define (with-autoreaping thunk) (set! *autoreap-policy* 'early) ((structure-ref threads-internal spawn-on-root) (lambda () (let lp ((event (most-recent-sigevent))) (let ((next-event (next-sigevent event interrupt/chld))) (*sigchld-handler*) (lp next-event)))) 'auto-reaping) (thunk)) ;;; This list contains pids whose proc-obj were gc'd before they died ;;; We try to reap them after every gc and maybe on every SIGCHLD (define need-reaping '()) (define need-reaping-lock (make-lock)) (define (need-reaping-add! pid) (obtain-lock need-reaping-lock) (set! need-reaping (cons pid need-reaping)) (release-lock need-reaping-lock)) (define (need-reaping-remove! pid) (obtain-lock need-reaping-lock) (set! need-reaping (del pid need-reaping)) (release-lock need-reaping-lock)) (define (reap-need-reaping) (obtain-lock need-reaping-lock) (set! need-reaping (filter (lambda (pid) (not (reap-pid pid))) need-reaping)) (release-lock need-reaping-lock)) ;;; reap this special pid ;;; return status or #f (define (reap-pid pid) (with-lock wait-lock (lambda () (let ((status (atomic-wait pid wait/poll))) (if status (waited-by-reap pid status)) status)))) ;;; Handler for SIGCHLD according policy (define (late-sigchld-handler) #f) (define (early-sigchld-handler) (reap-zombies)) (define (noauto-sigchld-handler) #f) ;;; Finalizer for procobjs ;;; (define (procobj-finalizer procobj) (process-table-delete-procobj! procobj) (if (not (proc:finished? procobj)) (need-reaping-add! (proc:pid procobj)))) ;;; (reap-zombies) => bool ;;; Move any zombies from the kernel process table into scsh. ;;; Return true if no more outstanding children; #f if some still live. (define (reap-zombies) (let lp () (obtain-lock wait-lock) (receive (pid status) (%wait-any (bitwise-ior wait/poll wait/stopped-children)) (if (and pid (not (status:stop-sig status))) (begin (waited-by-reap pid status) (release-lock wait-lock) ; (format (current-error-port) ; "Reaping ~d[~d]~%" pid status) (lp)) (begin (release-lock wait-lock) status))))) (define (new-child-proc pid) (let ((proc (make-procobj pid))) (process-table-set! pid proc) proc)) ;;; (WAIT proc/pid [flags]) ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; ;;; (wait proc/pid [flags]) => status or #f ;;; ;;; FLAGS (default 0) is the exclusive or of the following: ;;; wait/poll ;;; Return #f immediately if there are no ;;; unwaited children available. ;;; wait/stopped-children ;;; Report on suspended children as well. ;;; ;;; If the process hasn't terminated (or suspended, if wait/stopped ;;; is set) and wait/poll is set, return #f. ;;; (I'm working on the flags -df) ;;; JMG: We have to be careful about wait/poll and autoreap-policy: ;;; If it was 'late at anytime, we may missed the exit of pid/proc ;;; So we cannot just block and hope reap-zombies will give us the status ;;; With this lock, we ensure that only one thread may call ;;; really-wait for a given pid and manipulates the associated process object (define wait-lock (make-lock)) (define (wait pid/proc . maybe-flags) (let* ((flags (:optional maybe-flags 0)) (proc (->proc pid/proc)) (win (lambda (status) (waited-by-wait proc status) status))) ;; save the event before we check for finished (let ((pre-event (most-recent-sigevent))) (with-lock wait-lock (lambda () (cond ((atomic-wait proc (bitwise-ior flags wait/poll)) => win) ((zero? (bitwise-and flags wait/poll)) ;; we have to block and hence use the event system (let lp ((pre-event pre-event)) (cond ((atomic-wait proc (bitwise-ior flags wait/poll)) => win) (else (release-lock wait-lock) (let ((next-event (next-sigevent pre-event interrupt/chld))) (obtain-lock wait-lock) (lp next-event)))))) (else #f))))))) ;;; -> process-object proc status/#f (define (atomic-wait proc flags) (cond ((proc:finished? proc) (placeholder-value (proc:status proc))) (else (really-wait (proc:pid proc) (bitwise-ior flags wait/poll))))) ;;; This one is used, to wait on a positive pid ;;; We NEVER do a blocking wait syscall (define (really-wait pid flags) (if (zero? (bitwise-and flags wait/poll)) (error "really-wait without wait/poll")) (if (< pid 1) (error "really-wait on nonpos pid" pid)) (receive (return_pid status) (%wait-pid pid flags) (cond ((zero? return_pid) #f) ; failed wait/poll ((= pid return_pid) status) ; made it (else (error "mismatch in really-wait" return_pid pid))))) ;;; All you have to do, if pid was reaped ;;; proc_obj is maybe no longer alive (define (waited-by-reap pid status) (cond ((maybe-pid->proc pid) => (lambda (proc) (obituary proc status) (push-reaped-proc proc) )))) ;;; All you have to do, if a wait on proc was successful (define (waited-by-wait proc status) (obituary proc status) (mark-proc-waited! proc)) ;;; we know from somewhere that proc is dead (define (obituary proc status) (if (not (proc? proc)) (error "obituary: proc was not a procobj" proc)) (need-reaping-remove! (proc:pid proc)) ; in case it started during 'late (placeholder-set! (proc:status proc) status) (set-proc:finished? proc #t)) ;;; (wait-any [flags]) => [proc status] ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; ;;; [#f #f] => non-blocking, none ready. ;;; [#f #t] => no more. (define (wait-any . maybe-flags) (let ((flags (:optional maybe-flags 0))) (if (zero? (bitwise-and flags wait/poll)) (begin (receive (pid status) ;; before we maybe block via placeholder-value ;; do a really-wait-any for the ones, missed by 'late (really-wait-any (bitwise-ior flags wait/poll)) (if (not pid) (let ((win (get-reaped-proc!))) (values win (placeholder-value (proc:status win)))) (values pid status)))) ;; The rest of this is quite crude and can be safely ignored. -df ;; JMG: wait-any is crude and so its implementation ;; It got even worse, now that we have this fu*$#%g 'late (if (maybe-obtain-lock reaped-proc-pop-lock) (if (eq? reaped-proc-head reaped-proc-tail) ;;; due to 'late we cannot be sure, that they all have been ;;; reaped (begin (release-lock reaped-proc-pop-lock) (really-wait-any flags)) (let* ((retnode (placeholder-value reaped-proc-head)) (retval (weak-pointer-ref (reaped-proc:proc retnode)))) (set! reaped-proc-head (reaped-proc:next retnode)) (release-lock reaped-proc-pop-lock) (if retval (values retval (placeholder-value (proc:status retval))) (values #f #f)))) (values #f #f))))) (define (really-wait-any flags) (if (zero? (bitwise-and flags wait/poll)) (error "real-wait-any without wait/poll" flags)) (with-lock wait-lock (lambda () (receive (pid status) (%wait-any flags) (if pid (let ((proc (new-child-proc pid))) (waited-by-wait proc status) (values proc status)) (values #f #f)))))) ;;; (wait-process-group [proc-group flags]) => [proc status] ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; ;;; [#f #f] => non-blocking, none ready. ;;; [#f #t] => no more. ;;; ;;; ;;; If you are doing process-group waits, you do *not* want to use ;;; early autoreaping, since the reaper loses process-group information. ;;; (I'm working on it -df) (define (wait-process-group . args) (let-optionals args ((proc-group 0) (flags 0)) (let ((proc-group (cond ((integer? proc-group) proc-group) ((proc? proc-group) (proc:pid proc-group)) (else (error "Illegal argument" wait-process-group proc-group)))) (win (lambda (pid status) (let ((proc (pid->proc pid 'create))) (if proc (waited-by-wait proc status)) (values proc status))))) ;; save the event before we check for finished (let ((pre-event (most-recent-sigevent))) (receive (pid status) (%wait-process-group proc-group (bitwise-ior flags wait/poll)) (cond (pid (win pid status)) ((zero? (bitwise-and flags wait/poll)) ;; we have to block and hence use the event system (let lp ((pre-event pre-event)) (receive (pid status) (%wait-process-group proc-group (bitwise-ior flags wait/poll)) (if pid (win pid status) (lp (next-sigevent pre-event interrupt/chld)))))) (else (values #f status)))))))) ;;; (%wait-any flags) (%wait-pid pid flags) (%wait-process-group pgrp flags) ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; ;;; Direct interfaces to waitpid(2) call. As opposed to %wait-pid this ;;; waits on any child (using -1) and gets along if no child is alive ;;; at all (i.e. catches errno/child). ;;; [#f #f] means no processes ready on a non-blocking wait. ;;; [#f #t] means no waitable process on wait-any. (define (%wait-any flags) (with-errno-handler ((errno packet) ((errno/child) (values #f #t))) (receive (pid status) (%wait-pid -1 flags) (if (zero? pid) (values #f #f) ; None ready. (values pid status))))) (define (%wait-process-group pgrp flags) (if (zero? (bitwise-and flags wait/poll)) (error "really-wait without wait/poll")) (with-errno-handler ((errno packet) ((errno/child) (values #f #t))) (receive (pid status) (%wait-pid (- pgrp) flags) (if (zero? pid) (values #f #f) ; None ready. (values pid status))))) ;;; Reaped process table ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; ;;; We keep track of procs that have been reaped but not yet waited on by ;;; the user's code. These proces are eligible for return by WAIT-ANY. ;;; We keep track of these so that WAIT-ANY will hand them out exactly once. ;;; What this code needs is traditional condition variables. ;;; This is (so far) reliable in the following ways: ;;; 1. No process will be returned twice by wait-any, ever. Even two different ;;; wait-anys. ;;; 2. Being un-reaped will not prevent garbage collection. ;;; (actually, there seems to be a problem with this -df) ;;; 3. If a process is waited on, or is gc'ed, wait-any will do the Right ;;; Thing. ;;; And UNreliable in the following ways: ;;; 1. If a wait and a wait-any are blocking simultaneously, the wait will ;;; always return the object. However, whether the wait-any will or not ;;; is based on racing semaphores. ;;; 2. While processes can still be garbage collected, the nodes on the ;;; wait-any list will not, and if the program never wait-any's, the queue ;;; will snake around, eating up memory like pac-man with the munchies. ;;; 3. The process may be garbage collected before wait-any gets to it, and ;;; that's just tough. ;;; -df (define-record reaped-proc proc (next (make-placeholder)) prev) (define reaped-proc-tail (make-reaped-proc (make-weak-pointer #f) 'head)) (define reaped-proc-head reaped-proc-tail) (define reaped-proc-push-lock (make-lock)) (define reaped-proc-pop-lock (make-lock)) ;;; Zippy sez: pop lock! (define (push-reaped-proc proc) (obtain-lock reaped-proc-push-lock) (let ((push-me (make-reaped-proc (make-weak-pointer proc) reaped-proc-tail))) (placeholder-set! (reaped-proc:next reaped-proc-tail) push-me) (add-finalizer! proc (make-reaped-proc-finalizer push-me)) (set! reaped-proc-tail push-me)) (release-lock reaped-proc-push-lock)) (define (make-reaped-proc-finalizer push-me) (lambda ignore (remove-reaped-proc push-me))) (define (remove-reaped-proc reaped-proc) (spawn (lambda () ;This is blocking, so should run by itself (set-reaped-proc:prev (placeholder-value (reaped-proc:next reaped-proc)) (reaped-proc:prev reaped-proc)) (set-reaped-proc:next (reaped-proc:prev reaped-proc) (reaped-proc:next reaped-proc))) "reaped-proc-removing-thread")) (define (pop-reaped-proc) (obtain-lock reaped-proc-pop-lock) ;;; pop lock pop lock pop lock! (let ((pop-me (placeholder-value (reaped-proc:next reaped-proc-head)))) (set! reaped-proc-head pop-me) (release-lock reaped-proc-pop-lock) (weak-pointer-ref (reaped-proc:proc pop-me)))) ;;; Pop one off the list. (define (get-reaped-proc!) (let loop ((try (pop-reaped-proc))) (if (and try (proc:zombie try)) try (loop (pop-reaped-proc))))) ;;; PROC no longer eligible to be in the list. Delete it. (define (mark-proc-waited! proc) (set-proc:zombie proc #f))