From dae01f4eb75f7bc8abe6e3c0a7029185469e137e Mon Sep 17 00:00:00 2001
From: olin-shivers <olin-shivers>
Date: Sun, 11 Mar 2001 18:52:59 +0000
Subject: [PATCH] - Folding the branch that packages up the SRFI 13 & 14
 integration changes   into the main trunk.

- Changing EXEC-PATH-LIST from a global var to a fluid. (scsh.scm &
  scsh-package.scm). This sort of snuck into this commit.
---
 Makefile.in                 |    9 +-
 scsh/fr.scm                 |    4 +-
 scsh/glob.scm               |   15 +-
 scsh/lib/ccp-pack.scm       |    2 +-
 scsh/lib/ccp.scm            |   20 +-
 scsh/lib/char-package.scm   |   59 +
 scsh/lib/cset-lib.html      | 2016 +++++++++++++++++++++++++++++++++
 scsh/lib/cset-lib.scm       |  804 +++++++++++++
 scsh/lib/cset-lib.txt       | 1271 +++++++++++++++++++++
 scsh/lib/cset-obsolete.scm  |   52 +
 scsh/lib/cset-package.scm   |  151 +++
 scsh/lib/cset-tests.scm     |  200 ++++
 scsh/lib/list-lib.scm       |    9 +-
 scsh/lib/srfi-1.html        |   78 +-
 scsh/lib/string-lib.scm     | 2129 +++++++++++++++++++++++------------
 scsh/lib/string-package.scm |  350 ++++++
 scsh/meta-arg.scm           |    2 +-
 scsh/rx/packages.scm        |    6 +-
 scsh/rx/parse.scm           |   49 +-
 scsh/rx/posixstr.scm        |    4 +-
 scsh/rx/re.scm              |    6 +-
 scsh/rx/rx-lib.scm          |    2 +-
 scsh/rx/simp.scm            |    4 +-
 scsh/rx/spencer.scm         |    2 +-
 scsh/scsh-interfaces.scm    |   76 +-
 scsh/scsh-package.scm       |   29 +-
 scsh/scsh.scm               |   16 +-
 27 files changed, 6418 insertions(+), 947 deletions(-)
 create mode 100644 scsh/lib/char-package.scm
 create mode 100644 scsh/lib/cset-lib.html
 create mode 100644 scsh/lib/cset-lib.scm
 create mode 100644 scsh/lib/cset-lib.txt
 create mode 100644 scsh/lib/cset-obsolete.scm
 create mode 100644 scsh/lib/cset-package.scm
 create mode 100644 scsh/lib/cset-tests.scm
 create mode 100644 scsh/lib/string-package.scm
diff --git a/Makefile.in b/Makefile.in
index d34a2ce..f2947fa 100644
--- a/Makefile.in
+++ b/Makefile.in
@@ -592,7 +592,6 @@ $(CIG).image: $(IMAGE) $(VM) $(srcdir)/cig/cig.scm $(srcdir)/cig/libcig.scm
 scsh: cig scsh/scsh scsh/scsh.image
 
 SCHEME =scsh/awk.scm \
-	scsh/char-set.scm \
 	scsh/defrec.scm \
 	scsh/endian.scm \
 	scsh/enumconst.scm \
@@ -672,10 +671,12 @@ loads = $(srcdir)/scsh/let-opt.scm $(srcdir)/scsh/scsh-interfaces.scm \
 	 $(srcdir)/scsh/rx/packages.scm \
 	 $(srcdir)/scsh/rx/cond-package.scm \
 	 $(srcdir)/scsh/scsh-package.scm \
-	 $(srcdir)/scsh/lib/string-pack.scm \
+	 $(srcdir)/scsh/lib/cset-package.scm \
+	 $(srcdir)/scsh/lib/string-package.scm \
 	 $(srcdir)/scsh/lib/list-pack.scm \
-	 $(srcdir)/scsh/lib/ccp-pack.scm
-
+	 $(srcdir)/scsh/lib/ccp-pack.scm \
+	 $(srcdir)/scsh/lib/char-package.scm \
+	 $(srcdir)/scsh/lib/cset-obsolete.scm
 
 scsh/scsh.image: $(VM) $(SCHEME) $(CIG).image
 	(echo ",translate =scheme48/ $(srcdir)/"; \
diff --git a/scsh/fr.scm b/scsh/fr.scm
index d98ceaf..a50782f 100644
--- a/scsh/fr.scm
+++ b/scsh/fr.scm
@@ -318,7 +318,7 @@
 	     s)))
 
 	((concat)		; CONCAT-delimiter reader.
-	 (let ((not-delims (char-set-invert delims)))
+	 (let ((not-delims (char-set-complement delims)))
 	   (lambda maybe-port
 	     (let* ((p (:optional maybe-port (current-input-port)))
 		    (s (read-delimited delims p 'concat)))
@@ -328,7 +328,7 @@
 			 (string-append s extra-delims))))))))
 
 	((split)		; SPLIT-delimiter reader.
-	 (let ((not-delims (char-set-invert delims)))
+	 (let ((not-delims (char-set-complement delims)))
 	   (lambda maybe-port
 	     (let ((p (:optional maybe-port (current-input-port))))
 	       (receive (s delim) (read-delimited delims p 'split)
diff --git a/scsh/glob.scm b/scsh/glob.scm
index 5f73ce1..900cb5b 100644
--- a/scsh/glob.scm
+++ b/scsh/glob.scm
@@ -151,16 +151,15 @@
 	      (case c
 		((#\])
 		 (let ((cset (fold (lambda (elt cset)
-				     (char-set-union
-				      cset
-				      (if (char? elt)
-					  (char-set elt)
-					  (ascii-range->char-set (char->ascii (car elt))
-								 (+ 1 (char->ascii (cdr elt)))))))
-				   char-set:empty
+				     (if (char? elt)
+					 (char-set-adjoin! cset elt)
+					 (ucs-range->char-set! (char->ascii (car elt))
+							       (+ 1 (char->ascii (cdr elt)))
+							       #f cset)))
+				   (char-set-copy char-set:empty)
 				   elts)))
 		   (values (re-char-set (if negate?
-					    (char-set-invert cset)
+					    (char-set-complement! cset)
 					    cset))
 			   i)))
 
diff --git a/scsh/lib/ccp-pack.scm b/scsh/lib/ccp-pack.scm
index b5095a1..50f4d1c 100644
--- a/scsh/lib/ccp-pack.scm
+++ b/scsh/lib/ccp-pack.scm
@@ -93,7 +93,7 @@
    ))
 
 (define-structure ccp-lib ccp-lib-interface
-  (open char-set-package
+  (open char-set-lib
 	ascii
 	defrec-package
 	string-lib
diff --git a/scsh/lib/ccp.scm b/scsh/lib/ccp.scm
index 16dcece..9f17cab 100644
--- a/scsh/lib/ccp.scm
+++ b/scsh/lib/ccp.scm
@@ -95,11 +95,11 @@
     (every (lambda (ccp2)
 	     (and (char-set= domain (ccp:domain ccp2))
 		  (let ((cmap2 (ccp:map ccp2)))
-		    (char-set-every? (lambda (c)
-				       (let ((i (char->ascii c)))
-					 (char=? (string-ref cmap  i)
-						 (string-ref cmap2 i))))
-				     domain))))
+		    (char-set-every (lambda (c)
+				      (let ((i (char->ascii c)))
+					(char=? (string-ref cmap  i)
+						(string-ref cmap2 i))))
+				    domain))))
 	   rest)))
 
 
@@ -116,11 +116,11 @@
 	       (rest (cdr rest)))
 	  (and (char-set<= domain1 domain2)
 	       (let ((cmap2 (ccp:map ccp2)))
-		 (char-set-every? (lambda (c)
-				    (let ((i (char->ascii c)))
-				      (char=? (string-ref cmap1 i)
-					      (string-ref cmap2 i))))
-				  domain1))
+		 (char-set-every (lambda (c)
+				   (let ((i (char->ascii c)))
+				     (char=? (string-ref cmap1 i)
+					     (string-ref cmap2 i))))
+				 domain1))
 	       (lp domain2 cmap2 rest))))))
 
 
diff --git a/scsh/lib/char-package.scm b/scsh/lib/char-package.scm
new file mode 100644
index 0000000..1d535c1
--- /dev/null
+++ b/scsh/lib/char-package.scm
@@ -0,0 +1,59 @@
+;;; Character predicates that are *not* part of SRFIs 13 & 14.
+;;; Also redefines some R5RS predicates that native S48 gets wrong for Latin-1.
+
+(define-interface char-set-predicates-interface
+  (export
+   ((char-lower-case?		; R5RS
+     char-upper-case?		; R5RS
+     char-alphabetic?		; R5RS
+     char-numeric?		; R5RS
+     char-whitespace?		; R5RS
+
+     char-alphanumeric?		; Deprecated name, kept for compatibility w/old code
+
+     char-letter?		; Scsh extensions, from here through CHAR-ASCII?
+     char-digit?
+     char-letter+digit?
+     char-graphic?
+     char-printing?
+     char-blank?
+     char-iso-control?
+     char-punctuation?
+     char-symbol?
+     char-hex-digit?
+     char-ascii?)		(proc (:char) :boolean))))	; all exports: char -> boolean
+
+
+(define-structure char-set-predicates-lib char-set-predicates-interface
+  (open error-package	; ERROR
+	scsh-utilities	; DEPRECATED-PROC
+	char-set-lib	; CHAR-SET-CONTAINS? and the CHAR-SET:* sets
+	scheme)
+
+  (begin
+    ;; R5RS predicates, redefined here as char-set membership tests because
+    ;; the native S48 versions don't handle full Latin-1.
+    (define (char-lower-case? c) (char-set-contains? char-set:lower-case c))
+    (define (char-upper-case? c) (char-set-contains? char-set:upper-case c))
+    (define (char-alphabetic? c) (char-set-contains? char-set:letter c))
+    (define (char-numeric?    c) (char-set-contains? char-set:digit    c))
+    (define (char-whitespace? c) (char-set-contains? char-set:whitespace c))
+
+    ;; Scsh extensions to R5RS: each tests membership in the like-named char-set.
+    (define (char-letter?       c) (char-set-contains? char-set:letter       c))
+    (define (char-digit?        c) (char-set-contains? char-set:digit        c))
+    (define (char-letter+digit? c) (char-set-contains? char-set:letter+digit c))
+    (define (char-graphic?      c) (char-set-contains? char-set:graphic      c))
+    (define (char-printing?     c) (char-set-contains? char-set:printing     c))
+    (define (char-blank?        c) (char-set-contains? char-set:blank        c))
+    (define (char-iso-control?  c) (char-set-contains? char-set:iso-control  c))
+    (define (char-punctuation?  c) (char-set-contains? char-set:punctuation  c))
+    (define (char-symbol?       c) (char-set-contains? char-set:symbol       c))
+    (define (char-hex-digit?    c) (char-set-contains? char-set:hex-digit    c))
+    (define (char-ascii?        c) (char-set-contains? char-set:ascii        c))
+
+    ;; Obsolete scsh name: CHAR-LETTER+DIGIT? wrapped by DEPRECATED-PROC.
+    (define char-alphanumeric?
+      (deprecated-proc char-letter+digit? 'char-alphanumeric?
+		       "Use CHAR-LETTER+DIGIT? instead.")))
+  (optimize auto-integrate))
diff --git a/scsh/lib/cset-lib.html b/scsh/lib/cset-lib.html
new file mode 100644
index 0000000..b7eb80f
--- /dev/null
+++ b/scsh/lib/cset-lib.html
@@ -0,0 +1,2016 @@
+<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN"
+            "http://www.w3.org/TR/html4/loose.dtd">
+<!-- 
+ - Do a paragraph check <p>
+ - The Unicode char tables are messed up, but it can't be fixed w/o CSS2
+   support, which I do not currently find in web browsers.
+ - Can I have bangs, plusses, or slashes in #tags? Spaces?
+        Yes: plus, bang, star   No: space  Yes: slash, question, ampersand
+        You can't put sharp in a path, so anything goes, really.
+        Nonetheless, some of these confuse Netscape, so I'll avoid them.
+ -->
+
+<!--========================================================================-->
+<html lang=en-US>
+  <head>
+    <meta name="keywords" content="Scheme, programming language, list processing, SRFI">
+    <link rev=made href="mailto:shivers@ai.mit.edu">
+    <title>SRFI 14: Character-set Library</title>
+
+    <!-- Should have a media=all to get, for example, printing to work.
+      == But my Netscape will completely ignore the tag if I do that.
+      -->
+    <style type="text/css">
+           /* A little general layout hackery for headers & the title. */
+           body { margin-left: +7%;
+                  font-family: "Helvetica", sans-serif;
+                  }
+           /* Netscape workaround: */
+           td, th { font-family: "Helvetica", sans-serif; }
+
+           code, pre { font-family: "courier new", "courier"; }
+
+           div.inset { margin-left: +5%; }
+
+           h1 { margin-left: -5%; }
+           h1, h2 { clear: both; }
+           h1, h2, h3, h4, h5, h6 { color: blue }
+           div.title-text { font-size: large; font-weight: bold; }
+	   h3 { margin-top: 2em; margin-bottom: 0em }
+
+           div.indent { margin-left: 2em; }       /* General indentation */
+           pre.code-example { margin-left: 2em; } /* Indent code examples. */
+
+	   /* "Continue" class marks text that isn't really the start
+	   ** of a new paragraph -- e.g., continuing a para after a 
+	   ** code sample.
+	   */
+	   p.continue { text-indent: 0em; margin-top: 0em}
+
+           /* This stuff is for definition lists of defined procedures.
+           ** A proc-def1 is used when you want a stack of procs to go
+           ** with one dd body. In this case, make the first
+           ** proc a proc-def1, following ones proc-defi's, and the last one
+           ** a proc-defn.
+           **
+           ** Unfortunately, Netscape has huge bugs with respect to style
+           ** sheets and dl list rendering. We have to set truly random
+           ** values here to get the rendering to come out. The proper values
+           ** are in the following style sheet, for Internet Explorer.
+           ** In the following settings, the *comments* say what the 
+           ** setting *really* causes Netscape to do.
+           **
+           ** Ugh. Professional coders sacrifice their self-respect,
+           ** that others may live.
+           */
+           /* m-t ignored; m-b sets top margin space. */
+           dt.proc-def1 { margin-top: 0ex; margin-bottom: 3ex; }
+           dt.proc-defi { margin-top: 0ex; margin-bottom: 0ex; }
+           dt.proc-defn { margin-top: 0ex; margin-bottom: 0ex; }
+
+           /* m-t works weird depending on whether or not the last line
+           ** of the previous entry was a pre. Set to zero.
+           */
+           dt.proc-def  { margin-top: 0ex; margin-bottom: 3ex; }
+
+           /* m-b sets space between dd & dt; m-t ignored. */
+           dd.proc-def { margin-bottom: 0.5ex; margin-top: 0ex; } 
+
+
+           /* Boldface the name of a procedure when it's being defined. */
+           code.proc-def { font-weight: bold; font-size: 110%}
+
+           /* For the index of procedures. 
+           ** Same hackery as for dt.proc-def, above.
+           */
+           /* m-b sets space between dd & dt; m-t ignored. */
+           dd.proc-index  { margin-bottom: 0ex; margin-top: 0ex; } 
+           /* What the fuck? */
+           pre.proc-index { margin-top: -2ex; }
+
+           /* Pull the table of contents back flush with the margin.
+           ** Both NS & IE screw this up in different ways.
+           */
+           #toc-table { margin-top: -2ex; margin-left: -5%; }
+
+           /* R5RS proc names are in boldface; extended R5RS names
+           ** in italic boldface.
+           */
+           span.r5rs-proc { font-weight: bold; }
+           span.r5rs-procx { font-style: italic; font-weight: bold; }
+
+           /* Spread out bibliographic lists. */
+           /* More Netscape-specific lossage; see the following stylesheet
+           ** for the proper values (used by IE).
+           */
+           dt.biblio { margin-bottom: 3ex; }
+
+           /* Links to draft copies (e.g., not at the official SRFI site)
+           ** are colored in red, so people will use them during the 
+           ** development process and kill them when the document's done.
+           */
+           a.draft { color: red; }
+
+    </style>
+
+    <style type="text/css" media=all>
+           /* Nastiness: Here, I'm using a bug to work around a bug.
+           ** Netscape rendering bugs mean you need bogus <dt> and <dd>
+           ** margin settings -- settings which screw up IE's proper rendering.
+           ** Fortunately, Netscape has *another* bug: it will ignore this
+           ** media=all style sheet. So I am placing the (proper) IE values
+           ** here. Perhaps, one day, when these rendering bugs are fixed,
+           ** this gross hackery can be removed.
+           */
+           dt.proc-def1 { margin-top: 3ex; margin-bottom: 0ex; }
+           dt.proc-defi { margin-top: 0ex; margin-bottom: 0ex; }
+           dt.proc-defn { margin-top: 0ex; margin-bottom: 0.5ex; }
+           dt.proc-def  { margin-top: 3ex; margin-bottom: 0.5ex; }
+
+           pre { margin-top: 1ex; }
+
+           dd.proc-def { margin-bottom: 2ex; margin-top: 0.5ex; } 
+
+           /* For the index of procedures. 
+           ** Same hackery as for dt.proc-def, above.
+           */
+           dd.proc-index { margin-top: 0ex; } 
+           pre.proc-index { margin-top: 0ex; }
+
+           /* Spread out bibliographic lists. */
+           dt.biblio { margin-top: 3ex; margin-bottom: 0ex; }
+           dd.biblio { margin-bottom: 1ex; }
+    </style>
+  </head>
+
+<body>
+
+<!--========================================================================-->
+<h1>Title</h1>
+<div class=title-text>
+Character-set Library
+</div>
+
+<!--========================================================================-->
+<h1>Author</H1>
+    <address>
+       <a href="http://www.ai.mit.edu/~shivers/">Olin Shivers</A> /
+       <a href="mailto:shivers@ai.mit.edu">shivers@ai.mit.edu</A>
+    </address>
+
+<!--========================================================================-->
+<h1>Table of contents</H1>
+
+<!-- A bug in netscape (?) keeps the first link in this UL from being active.
+==== So the Abstract link may be dead. 99/8/22 -Olin
+-->
+<ul id=toc-table>
+<li><a href="#Abstract">Abstract</a>
+<li><a href="#VariableIndex">Variable index</a>
+<li><a href="#Rationale">Rationale</a>
+  <ul>
+  <li><a href="#LinearUpdateOperations">"Linear-update" operations</a>
+  <li><a href="#ExtraSRFI">Extra-SRFI recommendations</a>
+  </ul>
+
+<li><a href="#Specification">Specification</a>
+  <ul>
+  <li><a href="#GeneralProcs">General procedures</a>
+  <li><a href="#Iterating">Iterating over character sets</a>
+  <li><a href="#Creating">Creating character sets</a>
+  <li><a href="#Querying">Querying character sets</a>
+  <li><a href="#Algebra">Character set algebra</a>
+  <li><a href="#StandardCharsets">Standard character sets</a>
+  </ul>
+
+<li><a href="#StandardCharsetDefs">Unicode, Latin-1 and ASCII definitions of the standard character sets</a>
+<li><a href="#ReferenceImp">Reference implementation</a>
+<li><a href="#Acknowledgements">Acknowledgements</a>
+<li><a href="#Links">References &amp; Links</a>
+<li><a href="#Copyright">Copyright</a>
+</ul>
+
+<!--========================================================================-->
+<h1><a name="Abstract">Abstract</a></H1>
+<p>
+
+The ability to efficiently represent and manipulate sets of characters is an
+unglamorous but very useful capability for text-processing code -- one that
+tends to pop up in the definitions of other libraries.  Hence it is useful to
+specify a general substrate for this functionality early.  This SRFI defines a
+general library that provides this functionality. 
+<p>
+It is accompanied by a reference implementation for the spec. The reference
+implementation is fairly efficient, straightforwardly portable, and has a
+"free software" copyright. The implementation is tuned for "small" 7 or 8
+bit character types, such as ASCII or Latin-1; the data structures and
+algorithms would have to be altered for larger 16 or 32 bit character types
+such as Unicode -- however, the specs have been carefully designed with these
+larger character types in mind.
+<p>
+Several forthcoming SRFIs can be defined in terms of this one:
+<ul>
+    <li> string library
+    <li> delimited input procedures (<em>e.g.</em>, <code>read-line</code>)
+    <li> regular expressions
+</ul>
+
+
+<!--========================================================================-->
+<h1><a name="VariableIndex">Variable Index</a></h1>
+<p>
+Here is the complete set of bindings -- procedural and otherwise --
+exported by this library. In a Scheme system that has a module or package 
+system, these procedures should be contained in a module named "char-set-lib".
+
+<div class=indent>
+<dl>
+<dt class=proc-index> Predicates &amp; comparison
+<dd class=proc-index>
+<pre class=proc-index>
+<a href="#char-set-p">char-set?</a> <a href="#char-set=">char-set=</a> <a href="#char-set<=">char-set&lt;=</a> <a href="#char-set-hash">char-set-hash</a>
+</pre>
+
+<dt class=proc-index> Iterating over character sets
+<dd class=proc-index>
+<pre class=proc-index>
+<a href="#char-set-cursor">char-set-cursor</a> <a href="#char-set-ref">char-set-ref</a> <a href="#char-set-cursor-next">char-set-cursor-next</a> <a href="#end-of-char-set-p">end-of-char-set?</a> 
+<a href="#char-set-fold">char-set-fold</a> <a href="#char-set-unfold">char-set-unfold</a> <a href="#char-set-unfold!">char-set-unfold!</a>
+<a href="#char-set-for-each">char-set-for-each</a> <a href="#char-set-map">char-set-map</a>
+</pre>
+
+<dt class=proc-index> Creating character sets
+<dd class=proc-index>
+<pre class=proc-index>
+<a href="#char-set-copy">char-set-copy</a> <a href="#char-set">char-set</a>
+
+<a href="#list->char-set">list->char-set</a>  <a href="#string->char-set">string->char-set</a>
+<a href="#list->char-set!">list->char-set!</a> <a href="#string->char-set!">string->char-set!</a>
+    
+<a href="#char-set-filter">char-set-filter</a>  <a href="#ucs-range->char-set">ucs-range->char-set</a><br><a href="#char-set-filter!">char-set-filter!</a> <a href="#ucs-range->char-set!">ucs-range->char-set!</a>
+
+<a href="#->char-set">->char-set</a>
+</pre>
+
+<dt class=proc-index> Querying character sets
+<dd class=proc-index>
+<pre class=proc-index>
+<a href="#char-set->list">char-set->list</a> <a href="#char-set->string">char-set->string</a>
+<a href="#char-set-size">char-set-size</a> <a href="#char-set-count">char-set-count</a> <a href="#char-set-contains-p">char-set-contains?</a>
+<a href="#char-set-every">char-set-every</a> <a href="#char-set-any">char-set-any</a>
+</pre>
+
+<dt class=proc-index> Character-set algebra
+<dd class=proc-index>
+<pre class=proc-index>
+<a href="#char-set-adjoin">char-set-adjoin</a>  <a href="#char-set-delete">char-set-delete</a>
+<a href="#char-set-adjoin!">char-set-adjoin!</a> <a href="#char-set-delete!">char-set-delete!</a>
+
+<a href="#char-set-complement">char-set-complement</a>  <a href="#char-set-union">char-set-union</a>  <a href="#char-set-intersection">char-set-intersection</a>
+<a href="#char-set-complement!">char-set-complement!</a> <a href="#char-set-union!">char-set-union!</a> <a href="#char-set-intersection!">char-set-intersection!</a>
+
+<a href="#char-set-difference">char-set-difference</a>  <a href="#char-set-xor">char-set-xor</a>  <a href="#char-set-diff+intersection">char-set-diff+intersection</a>
+<a href="#char-set-difference!">char-set-difference!</a> <a href="#char-set-xor!">char-set-xor!</a> <a href="#char-set-diff+intersection!">char-set-diff+intersection!</a>
+</pre>
+
+<dt class=proc-index> Standard character sets
+<dd class=proc-index>
+<pre class=proc-index>
+<a href="#char-set:lower-case">char-set:lower-case</a>  <a href="#char-set:upper-case">char-set:upper-case</a>  <a href="#char-set:title-case">char-set:title-case</a>
+<a href="#char-set:letter">char-set:letter</a>      <a href="#char-set:digit">char-set:digit</a>       <a href="#char-set:letter+digit">char-set:letter+digit</a>
+<a href="#char-set:graphic">char-set:graphic</a>     <a href="#char-set:printing">char-set:printing</a>    <a href="#char-set:whitespace">char-set:whitespace</a>
+<a href="#char-set:iso-control">char-set:iso-control</a> <a href="#char-set:punctuation">char-set:punctuation</a> <a href="#char-set:symbol">char-set:symbol</a>
+<a href="#char-set:hex-digit">char-set:hex-digit</a>   <a href="#char-set:blank">char-set:blank</a>       <a href="#char-set:ascii">char-set:ascii</a>
+<a href="#char-set:empty">char-set:empty</a>       <a href="#char-set:full">char-set:full</a>
+</pre>
+
+</dl>
+</div>
+
+<!--========================================================================-->
+<h1><a name="Rationale">Rationale</a></h1>
+
+<p>
+The ability to efficiently manipulate sets of characters is quite
+useful for text-processing code. Encapsulating this functionality in
+a general, efficiently implemented library can assist all such code.
+This library defines a new data structure to represent these sets, called
+a "char-set." The char-set type is distinct from all other types.
+
+<p>
+This library is designed to be portable across implementations that use
+different character types and representations, especially ASCII, Latin-1
+and Unicode. Some effort has been made to preserve compatibility with Java
+in the Unicode case (see the definition of <code>char-set:whitespace</code> for the
+single real deviation).
+
+<!--========================================================================-->
+<h2><a name="LinearUpdateOperations">Linear-update operations</a></h2>
+
+<p>
+The procedures of this SRFI, by default, are "pure functional" -- they do not
+alter their parameters. However, this SRFI defines a set of "linear-update"
+procedures which have a hybrid pure-functional/side-effecting semantics: they
+are allowed, but not required, to side-effect one of their parameters in order
+to construct their result. An implementation may legally implement these
+procedures as pure, side-effect-free functions, or it may implement them using
+side effects, depending upon the details of what is the most efficient or
+simple to implement in terms of the underlying representation.
+
+<p>
+The linear-update routines all have names ending with "!".
+
+<p>
+Clients of these procedures <em>may not</em> rely upon these procedures working by
+side effect. For example, this is not guaranteed to work:
+<pre class=code-example>
+(let* ((cs1 (char-set #\a #\b #\c))      ; cs1 = {a,b,c}.
+       (cs2 (char-set-adjoin! cs1 #\d))) ; Add d to {a,b,c}.
+  cs1) ; Could be either {a,b,c} or {a,b,c,d}.
+</pre>
+<p class=continue>
+However, this is well-defined:
+<pre class=code-example>
+(let ((cs (char-set #\a #\b #\c)))
+  (char-set-adjoin! cs #\d)) ; Add d to {a,b,c}.
+</pre>
+
+<p>
+So clients of these procedures write in a functional style, but must
+additionally be sure that, when the procedure is called, there are no other
+live pointers to the potentially-modified character set (hence the term
+"linear update").
+
+<p>
+There are two benefits to this convention:
+<ul>
+  <li> Implementations are free to provide the most efficient possible
+    implementation, either functional or side-effecting.
+  <li> Programmers may nonetheless continue to assume that character sets
+    are purely functional data structures: they may be reliably shared
+    without needing to be copied, uniquified, and so forth.
+</ul>
+
+<p>
+Note that pure functional representations are the right thing for
+ASCII- or Latin-1-based Scheme implementations, since a char-set can
+be represented in an ASCII Scheme with 4 32-bit words. Pure set-algebra
+operations on such a representation are very fast and efficient. Programmers
+who code using linear-update operations are guaranteed the system will
+provide the best implementation across multiple platforms.
+
+<p>
+In practice, these procedures are most useful for efficiently constructing
+character sets in a side-effecting manner, in some limited local context, 
+before passing the character set outside the local construction scope to be
+used in a functional manner.
+
+<p>
+Scheme provides no assistance in checking the linearity of the potentially
+side-effected parameters passed to these functions --- there's no linear
+type checker or run-time mechanism for detecting violations. (But
+sophisticated programming environments, such as DrScheme, might help.)
+
+<!--========================================================================-->
+<h2><a name="ExtraSRFI">Extra-SRFI recommendations</a></h2>
+<p>
+Users are cautioned that the R5RS predicates 
+<div class=inset><code>
+char-alphabetic? <br>
+char-numeric? <br>
+char-whitespace? <br>
+char-upper-case? <br>
+char-lower-case? <br>
+</code>
+</div>
+<p class=continue>
+may or may not be in agreement with the SRFI 14 base character sets
+<div class=inset>
+<code>
+char-set:letter<br>
+char-set:digit<br>
+char-set:whitespace<br>
+char-set:upper-case<br>
+char-set:lower-case<br>
+</code>
+</div>
+<p class=continue>
+Implementors are strongly encouraged to bring these predicates into
+agreement with the base character sets of this SRFI; not to do so risks
+major confusion.
+
+
+<!--========================================================================-->
+<h1><a name="Specification">Specification</a></h1>
+<p>
+In the following procedure specifications:
+<ul>
+    <li> A <var>cs</var> parameter is a character set.
+
+    <li> An <var>s</var> parameter is a string.
+
+    <li> A <var>char</var> parameter is a character.
+
+    <li> A <var>char-list</var> parameter is a list of characters.
+
+    <li> A <var>pred</var> parameter is a unary character predicate procedure, returning 
+      a true/false value when applied to a character.
+
+    <li> An <var>obj</var> parameter may be any value at all.
+</ul>
+
+<p>
+Passing values to procedures with these parameters that do not satisfy these
+types is an error.
+
+<p>
+Unless otherwise noted in the specification of a procedure, procedures
+always return character sets that are distinct (from the point of view
+of the linear-update operations) from the parameter character sets. For
+example, <code>char-set-adjoin</code> is guaranteed to provide a fresh character set,
+even if it is not given any character parameters.
+
+<p>
+Parameters given in square brackets are optional. Unless otherwise noted in the
+text describing the procedure, any prefix of these optional parameters may
+be supplied, from zero arguments to the full list. When a procedure returns
+multiple values, this is shown by listing the return values in square
+brackets, as well. So, for example, the procedure with signature
+<pre class=code-example>
+halts? <var>f [x init-store]</var> -> <var>[boolean integer]</var>
+</pre>
+would take one (<var>f</var>), two (<var>f</var>, <var>x</var>) 
+or three (<var>f</var>, <var>x</var>, <var>init-store</var>) input parameters, 
+and return two values, a boolean and an integer.
+
+<p>
+A parameter followed by "<code>...</code>" means zero-or-more elements. 
+So the procedure with the signature
+<pre class=code-example>
+sum-squares <var>x ... </var> -> <var>number</var>
+</pre>
+takes zero or more arguments (<var>x ...</var>), 
+while the procedure with signature
+<pre class=code-example>
+spell-check <var>doc dict<sub>1</sub> dict<sub>2</sub> ...</var> -> <var>string-list</var>
+</pre>
+takes two required parameters 
+(<var>doc</var> and <var>dict<sub>1</sub></var>) 
+and zero or more optional parameters (<var>dict<sub>2</sub> ...</var>).
+
+
+<!--========================================================================-->
+<h2><a name="GeneralProcs">General procedures</a></h2>
+<dl>
+
+<!--
+==== char-set?
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set-p"></a>
+<code class=proc-def>char-set?</code><var> obj -> boolean</var>
+<dd class=proc-def>
+
+    Is the object <var>obj</var> a character set?
+
+<!--
+==== char-set=
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set="></a>
+<code class=proc-def>char-set=</code><var> cs<sub>1</sub> ... -> boolean</var>
+<dd class=proc-def>
+    Are the character sets equal?
+<p>
+    Boundary cases:
+<pre class=code-example>
+(char-set=) => <var>true</var>
+(char-set= cs) => <var>true</var>
+</pre>
+
+<p>
+    Rationale: transitive binary relations are generally extended to n-ary
+    relations in Scheme, which enables clearer, more concise code to be
+    written. While the zero-argument and one-argument cases will almost
+    certainly not arise in first-order uses of such relations, they may well
+    arise in higher-order cases or macro-generated code. 
+    <em>E.g.,</em> consider
+<pre class=code-example>
+(apply char-set= cset-list)
+</pre>
+<p class=continue>
+    This is well-defined if the list is empty or a singleton list. Hence
+    we extend these relations to any number of arguments. Implementors
+    have reported actual uses of n-ary relations in higher-order cases
+    allowing for fewer than two arguments. The way of Scheme is to handle the
+    general case; we provide the fully general extension.
+<p>
+    A counter-argument to this extension is that 
+    <abbr title="Revised^5 Report on Scheme"><a href="#R5RS">R5RS</a></abbr>'s
+    transitive binary arithmetic relations 
+    (<code>=</code>, <code>&lt;</code>, <em>etc.</em>) 
+    require at least two arguments, hence
+    this decision is a break with the prior convention -- although it is
+    at least one that is backwards-compatible.
+
+<!--
+==== char-set<=
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set<="></a>
+<code class=proc-def>char-set&lt;=</code><var> cs<sub>1</sub> ... -> boolean</var>
+<dd class=proc-def>
+    Returns true if every character set <var>cs<sub>i</sub></var> is 
+    a subset of character set <var>cs<sub>i+1</sub></var>.
+
+<p>
+Boundary cases:
+<pre class=code-example>
+(char-set&lt;=) => <var>true</var>
+(char-set&lt;= cs) => <var>true</var>
+</pre>
+<p>
+Rationale: See <code>char-set=</code> for discussion of zero- and one-argument
+applications. Consider testing a list of char-sets for monotonicity
+with 
+<pre class=code-example>
+(apply char-set&lt;= cset-list)
+</pre>
+
+<!--
+==== char-set-hash
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set-hash"></a>
+<code class=proc-def>char-set-hash</code><var> cs [bound] -> integer</var>
+<dd class=proc-def>
+    Compute a hash value for the character set <var>cs</var>. 
+    <var>Bound</var> is a non-negative
+    exact integer specifying the range of the hash function. A positive
+    value restricts the return value to the range [0,<var>bound</var>).
+
+    <p>
+    If <var>bound</var> is either zero or not given, the implementation may use
+    an implementation-specific default value, chosen to be as large as
+    is efficiently practical. For instance, the default range might be chosen
+    for a given implementation to map all character sets into the range of
+    integers that can be represented with a single machine word.
+
+
+    <p>
+    Invariant:
+<pre class=code-example>
+(char-set= cs<sub>1</sub> cs<sub>2</sub>) => (= (char-set-hash cs<sub>1</sub> b) (char-set-hash cs<sub>2</sub> b))
+</pre>
+
+    <p>
+    A legal but nonetheless discouraged implementation:
+<pre class=code-example>
+(define (char-set-hash cs . maybe-bound) 1)
+</pre>
+
+<p>
+    Rationale: allowing the user to specify an explicit bound simplifies user
+    code by removing the mod operation that typically accompanies every hash
+    computation, and also may allow the implementation of the hash function to
+    exploit a reduced range to efficiently compute the hash value. 
+    <em>E.g.</em>, for
+    small bounds, the hash function may be computed in a fashion such that
+    intermediate values never overflow into bignum integers, allowing the
+    implementor to provide a fixnum-specific "fast path" for computing the
+    common cases very rapidly.
+
+</dl>
+
+<!--========================================================================-->
+<h2><a name="Iterating">Iterating over character sets</a></h2>
+
+<dl>
+<!--
+==== char-set-cursor char-set-ref char-set-cursor-next end-of-char-set?
+============================================================================-->
+<dt class=proc-def1>
+<a name="char-set-cursor"></a>
+<a name="char-set-ref"></a>
+<a name="char-set-cursor-next"></a>
+<a name="end-of-char-set-p"></a>
+<code class=proc-def>char-set-cursor</code><var> cset -> cursor</var>
+<dt class=proc-defi>
+<code class=proc-def>char-set-ref</code><var> cset cursor -> char</var>
+<dt class=proc-defi>
+<code class=proc-def>char-set-cursor-next</code><var> cset cursor -> cursor</var>
+<dt class=proc-defn>
+<code class=proc-def>end-of-char-set?</code><var> cursor -> boolean</var>
+<dd class=proc-def>
+    Cursors are a low-level facility for iterating over the characters in a
+    set. A cursor is a value that indexes a character in a char set.
+    <code>char-set-cursor</code> produces a new cursor for a given char set. 
+    The set element indexed by the cursor is fetched with 
+    <code>char-set-ref</code>. 
+    A cursor index is incremented with <code>char-set-cursor-next</code>; 
+    in this way, code can step through every character in a char set. 
+    Stepping a cursor "past the end" of a char set produces a cursor that 
+    answers true to <code>end-of-char-set?</code>. 
+    It is an error to pass such a cursor to <code>char-set-ref</code> or to
+    <code>char-set-cursor-next</code>.
+
+<p>
+    A cursor value may not be used in conjunction with a different character
+    set; if it is passed to <code>char-set-ref</code> or 
+    <code>char-set-cursor-next</code> with
+    a character set other than the one used to create it, the results and
+    effects are undefined.
+
+<p>
+    Cursor values are <em>not</em> necessarily distinct from other types. 
+    They may be
+    integers, linked lists, records, procedures or other values. This license
+    is granted to allow cursors to be very "lightweight" values suitable for
+    tight iteration, even in fairly simple implementations.
+
+<p>
+    Note that these primitives are necessary to export an iteration facility
+    for char sets to loop macros.
+
+<p>
+    Example:
+<pre class=code-example>
+(define cs (char-set #\G #\a #\T #\e #\c #\h))
+
+;; Collect elts of CS into a list.
+(let lp ((cur (char-set-cursor cs)) (ans '()))
+  (if (end-of-char-set? cur) ans
+      (lp (char-set-cursor-next cs cur)
+          (cons (char-set-ref cs cur) ans))))
+  => (#\G #\T #\a #\c #\e #\h)
+
+;; Equivalently, using a list unfold (from SRFI 1):
+(unfold-right end-of-char-set? 
+              (curry char-set-ref cs)
+	      (curry char-set-cursor-next cs)
+	      (char-set-cursor cs))
+  => (#\G #\T #\a #\c #\e #\h)
+</pre>
+
+<p>
+    Rationale: Note that the cursor API's four functions "fit" the functional
+    protocol used by the unfolders provided by the list, string and char-set
+    SRFIs (see the example above). By way of contrast, here is a simpler, 
+    two-function API that was rejected for failing this criterion. Besides 
+    <code>char-set-cursor</code>, it provided a single
+    function that mapped a cursor and a character set to two values, the
+    indexed character and the next cursor. If the cursor had exhausted the
+    character set, then this function returned false instead of the character
+    value, and another end-of-char-set cursor. In this way, the other three
+    functions of the current API were combined together.
+
+<!--
+==== char-set-fold
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set-fold"></a>
+<code class=proc-def>char-set-fold</code><var> kons knil cs -> object</var>
+<dd class=proc-def>
+    This is the fundamental iterator for character sets.  Applies the function
+    <var>kons</var> across the character set <var>cs</var> using initial state value <var>knil</var>.  That is,
+    if <var>cs</var> is the empty set, the procedure returns <var>knil</var>.  Otherwise, some
+    element <var>c</var> of <var>cs</var> is chosen; 
+    let <var>cs'</var> be the remaining, unchosen characters.
+    The procedure returns
+<pre class=code-example>
+(char-set-fold <var>kons</var> (<var>kons</var> <var>c</var> <var>knil</var>) <var>cs'</var>)
+</pre>
+    <p>
+    Examples:
+<pre class=code-example>
+;; CHAR-SET-MEMBERS
+(lambda (cs) (char-set-fold cons '() cs))
+
+;; CHAR-SET-SIZE
+(lambda (cs) (char-set-fold (lambda (c i) (+ i 1)) 0 cs))
+
+;; How many vowels in the char set?
+(lambda (cs) 
+  (char-set-fold (lambda (c i) (if (vowel? c) (+ i 1) i))
+                 0 cs))
+</pre>
+
+<!--
+==== char-set-unfold char-set-unfold!
+============================================================================-->
+<dt class=proc-def1>
+<a name="char-set-unfold"></a>
+<a name="char-set-unfold!"></a>
+<code class=proc-def>char-set-unfold&nbsp;</code><var> p f g seed [base-cs] -> char-set</var>
+<dt class=proc-defn><code class=proc-def>char-set-unfold!</code><var> p f g seed base-cs -> char-set</var>
+<dd class=proc-def>
+    This is a fundamental constructor for char-sets. 
+<ul>
+    <li> <var>G</var> is used to generate a series of "seed" values from the initial seed:
+        <var>seed</var>, (<var>g</var> <var>seed</var>), (<var>g<sup>2</sup></var> <var>seed</var>), (<var>g<sup>3</sup></var> <var>seed</var>), ...
+    <li> <var>P</var> tells us when to stop -- when it returns true when applied to one 
+      of these seed values.
+    <li> <var>F</var> maps each seed value to a character. These characters are added
+      to the base character set <var>base-cs</var> to form the result; <var>base-cs</var> defaults to
+      the empty set. <code>char-set-unfold!</code> adds the characters to <var>base-cs</var> in a 
+      linear-update fashion -- it is allowed, but not required, to side-effect
+      and use <var>base-cs</var>'s storage to construct the result.
+</ul>
+
+    <p>
+    More precisely, the following definitions hold, ignoring the
+    optional-argument issues:
+
+<pre class=code-example>
+(define (char-set-unfold p f g seed base-cs) 
+  (char-set-unfold! p f g seed (char-set-copy base-cs)))
+
+(define (char-set-unfold! p f g seed base-cs)
+  (let lp ((seed seed) (cs base-cs))
+        (if (p seed) cs                                 ; P says we are done.
+            (lp (g seed)                                ; Loop on (G SEED).
+                (char-set-adjoin! cs (f seed))))))      ; Add (F SEED) to set.
+</pre>
+
+    (Note that the actual implementation may be more efficient.)
+
+    <p>
+    Examples:
+<pre class=code-example>                         
+(port->char-set p) = (char-set-unfold eof-object? values
+                                      (lambda (x) (read-char p))
+                                      (read-char p))
+
+(list->char-set lis) = (char-set-unfold null? car cdr lis)
+</pre>
+<!--
+==== char-set-for-each
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set-for-each"></a>
+<code class=proc-def>char-set-for-each</code><var> proc cs -> unspecified</var>
+<dd class=proc-def>
+    Apply procedure <var>proc</var> to each character in the character set <var>cs</var>.
+    Note that the order in which <var>proc</var> is applied to the characters in the
+    set is not specified, and may even change from one procedure application
+    to another.
+
+    <p>
+    Nothing at all is specified about the value returned by this procedure; it
+    is not even required to be consistent from call to call. It is simply
+    required to be a value (or values) that may be passed to a command
+    continuation, <em>e.g.</em> as the value of an expression appearing as a
+    non-terminal subform of a <code>begin</code> expression. 
+    Note that in 
+    <abbr title="Revised^5 Report on Scheme"><a href="#R5RS">R5RS</a></abbr>,
+    this restricts the procedure to returning a single value; 
+    non-R5RS systems may not even provide this restriction.
+
+<!--
+==== char-set-map
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set-map"></a>
+<code class=proc-def>char-set-map</code><var> proc cs -> char-set</var>
+<dd class=proc-def>
+    <var>proc</var> is a char->char procedure. Apply it to all the characters in
+    the char-set <var>cs</var>, and collect the results into a new character set.
+
+    <p>
+    Essentially lifts <var>proc</var> from a char->char procedure to a char-set ->
+    char-set procedure.
+
+    <p>
+    Example:
+<pre class=code-example>
+(char-set-map char-downcase cset)
+</pre>
+</dl>
+
+
+<!--========================================================================-->
+<h2><a name="Creating">Creating character sets</a></h2>
+<dl>
+
+<!--
+==== char-set-copy
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set-copy"></a>
+<code class=proc-def>char-set-copy</code><var> cs -> char-set</var>
+<dd class=proc-def>
+    Returns a copy of the character set <var>cs</var>.  "Copy" means that if either the
+    input parameter or the result value of this procedure is passed to one of
+    the linear-update procedures described below, the other character set is
+    guaranteed not to be altered.  
+
+    <p>
+    A system that provides pure-functional implementations of the
+    linear-operator suite could implement this procedure as the identity
+    function -- so copies are <em>not</em> guaranteed to be distinct by <code>eq?</code>.
+
+<!--
+==== char-set
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set"></a>
+<code class=proc-def>char-set</code><var> char<sub>1</sub> ... -> char-set</var>
+<dd class=proc-def>
+    Return a character set containing the given characters.
+
+<!--
+==== list->char-set list->char-set!
+============================================================================-->
+<dt class=proc-def1>
+<a name="list->char-set"></a>
+<a name="list->char-set!"></a>
+<code class=proc-def>list->char-set&nbsp;</code><var> char-list [base-cs] -> char-set</var>
+<dt class=proc-defn><code class=proc-def>list->char-set!</code><var> char-list base-cs -> char-set</var>
+<dd class=proc-def>
+    Return a character set containing the characters in the list of
+    characters <var>char-list</var>.
+
+    <p>
+    If character set <var>base-cs</var> is provided, the characters from <var>char-list</var>
+    are added to it. <code>list->char-set!</code> is allowed, but not required,
+    to side-effect and reuse the storage in <var>base-cs</var>; 
+    <code>list->char-set</code> produces a fresh character set.
+
+<!--
+==== string->char-set string->char-set!
+============================================================================-->
+<dt class=proc-def1>
+<a name="string->char-set"></a>
+<a name="string->char-set!"></a>
+<code class=proc-def>string->char-set&nbsp;</code><var> s [base-cs] -> char-set</var>
+<dt class=proc-defn><code class=proc-def>string->char-set!</code><var> s base-cs -> char-set</var>
+<dd class=proc-def>
+
+    Return a character set containing the characters in the string <var>s</var>.
+
+    <p>
+    If character set <var>base-cs</var> is provided, the characters from <var>s</var> are added to
+    it. <code>string->char-set!</code> is allowed, but not required, to side-effect and
+    reuse the storage in <var>base-cs</var>; <code>string->char-set</code> produces a fresh character
+    set.
+
+<!--
+==== char-set-filter char-set-filter!
+============================================================================-->
+<dt class=proc-def1>
+<a name="char-set-filter"></a>
+<a name="char-set-filter!"></a>
+<code class=proc-def>char-set-filter&nbsp;</code><var> pred cs [base-cs] -> char-set</var>
+<dt class=proc-defn><code class=proc-def>char-set-filter!</code><var> pred cs base-cs -> char-set</var>
+<dd class=proc-def>
+
+    Returns a character set containing every character <var>c</var> 
+    in <var>cs</var> such that <code>(<var>pred</var> <var>c</var>)</code> 
+    returns true.
+
+<p>
+    If character set <var>base-cs</var> is provided, the characters specified 
+    by <var>pred</var> are added to it. 
+    <code>char-set-filter!</code> is allowed, but not required,
+    to side-effect and reuse the storage in <var>base-cs</var>; 
+    <code>char-set-filter</code> produces a fresh character set.
+
+<p>
+    An implementation may not save away a reference to <var>pred</var> and
+    invoke it after <code>char-set-filter</code> or 
+    <code>char-set-filter!</code> returns -- that is, "lazy,"
+    on-demand implementations are not allowed, as <var>pred</var> may have
+    external dependencies on mutable data or have other side-effects.
+
+<p>
+    Rationale: This procedure provides a means of converting a character
+    predicate into its equivalent character set; the <var>cs</var> parameter
+    allows the programmer to bound the predicate's domain. Programmers should
+    be aware that filtering a character set such as <code>char-set:full</code>
+    could be a very expensive operation in an implementation that provided an
+    extremely large character type, such as 32-bit Unicode. An earlier draft
+    of this library provided a simple <code>predicate->char-set</code>
+    procedure, which was rejected in favor of <code>char-set-filter</code> for
+    this reason.
+
+
+<!--
+==== ucs-range->char-set ucs-range->char-set!
+============================================================================-->
+<dt class=proc-def1>
+<a name="ucs-range->char-set"></a>
+<a name="ucs-range->char-set!"></a>
+<code class=proc-def>ucs-range->char-set&nbsp;</code><var> lower upper [error? base-cs] -> char-set</var>
+<dt class=proc-defn><code class=proc-def>ucs-range->char-set!</code><var> lower upper error? base-cs -> char-set</var>
+<dd class=proc-def>
+    <var>Lower</var> and <var>upper</var> are exact non-negative integers; 
+    <var>lower</var> &lt;= <var>upper</var>.
+
+    <p>
+    Returns a character set containing every character whose ISO/IEC 10646
+    UCS-4 code lies in the half-open range [<var>lower</var>,<var>upper</var>).
+
+<ul>
+    <li> If the requested range includes unassigned UCS values, these are
+      silently ignored (the current UCS specification has "holes" in the
+      space of assigned codes).
+    
+    <li> If the requested range includes "private" or "user space" codes, these
+      are handled in an implementation-specific manner; however, a UCS- or
+      Unicode-based Scheme implementation should pass them through
+      transparently.
+    
+    <li> If any code from the requested range specifies a valid, assigned
+      UCS character that has no corresponding representative in the
+      implementation's character type, then (1) an error is raised if <var>error?</var>
+      is true, and (2) the code is ignored if <var>error?</var> is false (the default).
+      This might happen, for example, if the implementation uses ASCII
+      characters, and the requested range includes non-ASCII characters.
+</ul>
+
+    <p>
+    If character set <var>base-cs</var> is provided, the characters specified by the
+    range are added to it. <code>ucs-range->char-set!</code> is allowed, but not required,
+    to side-effect and reuse the storage in <var>base-cs</var>; 
+    <code>ucs-range->char-set</code> produces a fresh character set.
+
+    <p>
+    Note that ASCII codes are a subset of the Latin-1 codes, which are in turn
+    a subset of the 16-bit Unicode codes, which are themselves a subset of the
+    32-bit UCS-4 codes. We commit to a specific encoding in this routine,
+    regardless of the underlying representation of characters, so that client
+    code using this library will be portable. <em>I.e.</em>, a conformant Scheme
+    implementation may use EBCDIC or SHIFT-JIS to encode characters; it must
+    simply map the UCS characters from the given range into the native
+    representation when possible, and report errors when not possible.
+
+<!--
+==== ->char-set
+============================================================================-->
+<dt class=proc-def>
+<a name="->char-set"></a>
+<code class=proc-def>->char-set</code><var> x -> char-set</var>
+<dd class=proc-def>
+    Coerces <var>x</var> into a char-set. 
+    <var>X</var> may be a string, character or
+    char-set. A string is converted to the set of its constituent characters;
+    a character is converted to a singleton set; a char-set is returned
+    as-is.
+    This procedure is intended for use by other procedures that want to 
+    provide "user-friendly," wide-spectrum interfaces to their clients.
+
+</dl>
+
+<!--========================================================================-->
+<h2><a name="Querying">Querying character sets</a></h2>
+<dl>
+
+<!--
+==== char-set-size
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set-size"></a>
+<code class=proc-def>char-set-size</code><var> cs -> integer</var>
+<dd class=proc-def>
+    Returns the number of elements in character set <var>cs</var>.
+
+<!--
+==== char-set-count
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set-count"></a>
+<code class=proc-def>char-set-count</code><var> pred cs -> integer</var>
+<dd class=proc-def>
+    Apply <var>pred</var> to the chars of character set <var>cs</var>, and return the number
+    of chars that caused the predicate to return true.
+
+<!--
+==== char-set->list
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set->list"></a>
+<code class=proc-def>char-set->list</code><var> cs -> character-list</var>
+<dd class=proc-def>
+    This procedure returns a list of the members of character set <var>cs</var>.
+    The order in which <var>cs</var>'s characters appear in the list is not defined,
+    and may be different from one call to another.
+
+<!--
+==== char-set->string
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set->string"></a>
+<code class=proc-def>char-set->string</code><var> cs -> string</var>
+<dd class=proc-def>
+    This procedure returns a string containing the members of character set <var>cs</var>.
+    The order in which <var>cs</var>'s characters appear in the string is not defined,
+    and may be different from one call to another.
+
+<!--
+==== char-set-contains?
+============================================================================-->
+<dt class=proc-def>
+<a name="char-set-contains-p"></a>
+<code class=proc-def>char-set-contains?</code><var> cs char -> boolean</var>
+<dd class=proc-def>
+    This procedure tests <var>char</var> for membership in character set <var>cs</var>.
+
+    <p>
+    The MIT Scheme character-set package called this procedure
+    <code>char-set-member?</code>, but the argument order isn't consistent with the name.
+
+<!--
+==== char-set-every char-set-any
+============================================================================-->
+<dt class=proc-def1>
+<a name="char-set-every"></a>
+<a name="char-set-any"></a>
+<code class=proc-def>char-set-every</code><var> pred cs -> boolean</var>
+<dt class=proc-defn><code class=proc-def>char-set-any&nbsp;&nbsp;</code><var> pred cs -> boolean</var>
+<dd class=proc-def>
+    The <code>char-set-every</code> procedure returns true if predicate <var>pred</var>
+    returns true of every character in the character set <var>cs</var>.
+    Likewise, <code>char-set-any</code> applies <var>pred</var> to every character in
+    character set <var>cs</var>, and returns the first true value it finds.
+    If no character produces a true value, it returns false.
+    The order in which these procedures sequence through the elements of
+    <var>cs</var> is not specified.
+
+    <p>
+    Note that if you need to determine the actual character on which a 
+    predicate returns true, use <code>char-set-any</code> and arrange for the predicate 
+    to return the character parameter as its true value, <em>e.g.</em>
+<pre class=code-example>
+(char-set-any (lambda (c) (and (char-upper-case? c) c)) 
+              cs)
+</pre>
+</dl>
+
+<!--========================================================================-->
+<h2><a name="Algebra">Character-set algebra</a></h2>
+<dl>
+
+<!--
+==== char-set-adjoin char-set-delete
+============================================================================-->
+<dt class=proc-def1>
+<a name="char-set-adjoin"></a>
+<a name="char-set-delete"></a>
+<code class=proc-def>char-set-adjoin</code><var> cs char<sub>1</sub> ... -> char-set</var>
+<dt class=proc-defn><code class=proc-def>char-set-delete</code><var> cs char<sub>1</sub> ... -> char-set</var>
+<dd class=proc-def>
+    Add/delete the <var>char<sub>i</sub></var> characters to/from character set <var>cs</var>.
+
+<!--
+==== char-set-adjoin! char-set-delete!
+============================================================================-->
+<dt class=proc-def1>
+<a name="char-set-adjoin!"></a>
+<a name="char-set-delete!"></a>
+<code class=proc-def>char-set-adjoin!</code><var> cs char<sub>1</sub> ... -> char-set</var>
+<dt class=proc-defn><code class=proc-def>char-set-delete!</code><var> cs char<sub>1</sub> ... -> char-set</var>
+<dd class=proc-def>
+
+    Linear-update variants. These procedures are allowed, but not
+    required, to side-effect their first parameter.
+
+<!--
+==== char-set-complement char-set-union char-set-intersection 
+==== char-set-difference char-set-xor char-set-diff+intersection
+============================================================================-->
+<dt class=proc-def1>
+<a name="char-set-complement"></a>
+<a name="char-set-union"></a>
+<a name="char-set-intersection"></a>
+<a name="char-set-difference"></a>
+<a name="char-set-xor"></a>
+<a name="char-set-diff+intersection"></a>
+<code class=proc-def>char-set-complement</code><var> cs                     -> char-set</var>
+<dt class=proc-defi><code class=proc-def>char-set-union</code><var> cs<sub>1</sub> ...                 -> char-set</var>
+<dt class=proc-defi><code class=proc-def>char-set-intersection</code><var> cs<sub>1</sub> ...          -> char-set</var>
+<dt class=proc-defi><code class=proc-def>char-set-difference</code><var> cs<sub>1</sub> cs<sub>2</sub> ...        -> char-set</var>
+<dt class=proc-defi><code class=proc-def>char-set-xor</code><var> cs<sub>1</sub> ...                   -> char-set</var>
+<dt class=proc-defn><code class=proc-def>char-set-diff+intersection</code><var> cs<sub>1</sub> cs<sub>2</sub> ... -> [char-set char-set]</var>
+<dd class=proc-def>
+    These procedures implement set complement, union, intersection,
+    difference, and exclusive-or for character sets. The union, intersection
+    and xor operations are n-ary. The difference function is also n-ary,
+    associates to the left (that is, it computes the difference between
+    its first argument and the union of all the other arguments),
+    and requires at least one argument.
+
+    <p>
+    Boundary cases:
+<pre class=code-example>
+(char-set-union) => char-set:empty
+(char-set-intersection) => char-set:full
+(char-set-xor) => char-set:empty
+(char-set-difference <var>cs</var>) => <var>cs</var>
+</pre>
+
+    <p>
+    <code>char-set-diff+intersection</code> returns both the difference and the
+    intersection of the arguments -- it partitions its first parameter.
+    It is equivalent to 
+<pre class=code-example>
+(values (char-set-difference <var>cs<sub>1</sub></var> <var>cs<sub>2</sub></var> ...)
+        (char-set-intersection <var>cs<sub>1</sub></var> (char-set-union <var>cs<sub>2</sub></var> ...)))
+</pre>
+    but can be implemented more efficiently.
+
+<p>
+    Programmers should be aware that <code>char-set-complement</code> could potentially
+    be a very expensive operation in Scheme implementations that provide
+    a very large character type, such as 32-bit Unicode. If this is a
+    possibility, sets can be complemented with respect to a smaller
+    universe using <code>char-set-difference</code>.
+
+
+<!--
+==== char-set-complement! char-set-union! char-set-intersection! 
+==== char-set-difference! char-set-xor! char-set-diff+intersection!
+============================================================================-->
+<dt class=proc-def1>
+<a name="char-set-complement!"></a>
+<a name="char-set-union!"></a>
+<a name="char-set-intersection!"></a>
+<a name="char-set-difference!"></a>
+<a name="char-set-xor!"></a>
+<a name="char-set-diff+intersection!"></a>
+<code class=proc-def>char-set-complement!</code><var> cs                     -> char-set</var>
+<dt class=proc-defi><code class=proc-def>char-set-union!</code><var>  cs<sub>1</sub> cs<sub>2</sub> ...                   -> char-set</var>
+<dt class=proc-defi><code class=proc-def>char-set-intersection!</code><var>  cs<sub>1</sub> cs<sub>2</sub> ...          -> char-set</var>
+<dt class=proc-defi><code class=proc-def>char-set-difference!</code><var>  cs<sub>1</sub> cs<sub>2</sub> ...            -> char-set</var>
+<dt class=proc-defi><code class=proc-def>char-set-xor!</code><var>  cs<sub>1</sub> cs<sub>2</sub> ...                   -> char-set</var>
+<dt class=proc-defn><code class=proc-def>char-set-diff+intersection!</code><var>  cs<sub>1</sub> cs<sub>2</sub> cs<sub>3</sub> ... -> [char-set char-set]</var>
+<dd class=proc-def>
+    These are linear-update variants of the set-algebra functions.
+    They are allowed, but not required, to side-effect their first (required)
+    parameter.
+
+    <p>
+    <code>char-set-diff+intersection!</code> is allowed to side-effect both
+    of its two required parameters, <var>cs<sub>1</sub></var>
+    and <var>cs<sub>2</sub></var>.
+</dl>
+
+<!--========================================================================-->
+<h2><a name="StandardCharsets">Standard character sets</a></h2>
+<p>
+Several character sets are predefined for convenience:
+<a name="char-set:lower-case"></a>
+<a name="char-set:lower-case"></a>
+<a name="char-set:upper-case"></a>
+<a name="char-set:title-case"></a>
+<a name="char-set:letter"></a>
+<a name="char-set:digit"></a>
+<a name="char-set:letter+digit"></a>
+<a name="char-set:graphic"></a>
+<a name="char-set:printing"></a>
+<a name="char-set:whitespace"></a>
+<a name="char-set:iso-control"></a>
+<a name="char-set:punctuation"></a>
+<a name="char-set:symbol"></a>
+<a name="char-set:hex-digit"></a>
+<a name="char-set:blank"></a>
+<a name="char-set:ascii"></a>
+<a name="char-set:empty"></a>
+<a name="char-set:full"></a>
+<div class=inset>
+<table cellpadding=0 cellspacing=0>
+<tr><td><code>char-set:lower-case</code> </td><td>Lower-case letters</td></tr>
+<tr><td><code>char-set:upper-case</code> </td><td>Upper-case letters</td></tr>
+<tr><td><code>char-set:title-case</code> </td><td>Title-case letters</td></tr>
+<tr><td><code>char-set:letter</code> </td><td>Letters</td></tr>
+<tr><td><code>char-set:digit</code> </td><td>Digits</td></tr>
+<tr><td><code>char-set:letter+digit</code> </td><td>Letters and digits</td></tr>
+<tr><td><code>char-set:graphic</code> </td><td>Printing characters except spaces</td></tr>
+<tr><td><code>char-set:printing</code> </td><td>Printing characters including spaces</td></tr>
+<tr><td><code>char-set:whitespace</code> </td><td>Whitespace characters </td></tr>
+<tr><td><code>char-set:iso-control</code> </td><td>The ISO control characters </td></tr>
+<tr><td><code>char-set:punctuation</code> </td><td>Punctuation characters</td></tr>
+<tr><td><code>char-set:symbol</code> </td><td>Symbol characters</td></tr>
+<tr><td><code>char-set:hex-digit</code> </td><td>A hexadecimal digit: 0-9, A-F, a-f </td></tr>
+<tr><td><code>char-set:blank</code> </td><td>Blank characters -- horizontal whitespace</td></tr>
+<tr><td><code>char-set:ascii</code> </td><td>All characters in the ASCII set. </td></tr>
+<tr><td><code>char-set:empty</code> </td><td>Empty set </td></tr>
+<tr><td><code>char-set:full</code> </td><td>All characters </td></tr>
+</table>
+</div>
+
+<p>
+Note that there may be characters in <code>char-set:letter</code> that are neither upper nor
+lower case---this might occur in implementations that use a character type
+richer than ASCII, such as Unicode. A "graphic character" is one that would
+put ink on your page. While the exact composition of these sets may vary
+depending upon the character type provided by the underlying Scheme system,
+here are the definitions for some of the sets in an ASCII implementation:
+<div class=inset>
+<table cellpadding=0 cellspacing=0>
+<tr><td><code>char-set:lower-case</code> </td><td>a-z </td></tr>
+<tr><td><code>char-set:upper-case</code> </td><td>A-Z </td></tr>
+<tr><td><code>char-set:letter</code> </td><td>A-Z and a-z </td></tr>
+<tr><td><code>char-set:digit</code> </td><td>0123456789</td></tr>
+<tr><td><code>char-set:punctuation</code> </td><td><code>!"#%&amp;'()*,-./:;?@[\]_{}</code></td></tr>
+<tr><td><code>char-set:symbol</code> </td><td><code>$+&lt;=&gt;^`|~</code></td></tr>
+<tr><td><code>char-set:whitespace</code> </td><td>Space, newline, tab, form feed, </td></tr>
+<tr><td></td><td>                               vertical tab, carriage return </td></tr>
+<tr><td><code>char-set:blank</code> </td><td>Space and tab </td></tr>
+<tr><td><code>char-set:graphic</code> </td><td>letter + digit + punctuation + symbol</td></tr>
+<tr><td><code>char-set:printing</code> </td><td>graphic + whitespace</td></tr>
+<tr><td><code>char-set:iso-control</code> </td><td>ASCII 0-31 and 127 </td></tr>
+</table>
+</div>
+
+<p>
+Note that the existence of the <code>char-set:ascii</code> set implies that the underlying
+character set is required to be at least as rich as ASCII (including
+ASCII's control characters).
+
+<p>
+Rationale: The name choices reflect a shift from the older "alphabetic/numeric"
+terms found in 
+<abbr title="Revised^5 Report on Scheme"><a href="#R5RS">R5RS</a></abbr>
+and Posix to newer, Unicode-influenced "letter/digit" lexemes.
+
+<!--========================================================================-->
+<h1><a name="StandardCharsetDefs">
+    Unicode, Latin-1 and ASCII definitions of the standard character sets</a>
+</h1>
+<p>
+In Unicode Scheme implementations, the base character sets are compatible with
+Java's Unicode specifications. For ASCII or Latin-1, we simply restrict the
+Unicode set specifications to their first 128 or 256 codes, respectively.
+Scheme implementations that are not based on ASCII, Latin-1 or Unicode should
+attempt to preserve the sense or spirit of these definitions.
+
+<p>
+The following descriptions frequently make reference to the "Unicode character
+database." This is a file, available at URL
+<div class=inset>
+<a href="ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.txt">
+ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.txt</a>
+</div>
+<p class=continue>
+Each line contains a description of a Unicode character. The first
+semicolon-delimited field of the line gives the hex value of the character's
+code; the second field gives the name of the character, and the third field
+gives a two-letter category. Other fields give simple 1-1 case-mappings for
+the character and other information; see
+<div class=inset>
+<a href="ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.html">
+ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.html</a>
+</div>
+<p class=continue>
+for further description of the file's format. Note in particular the
+two-letter category specified in the third field, which is referenced
+frequently in the descriptions below.
+
+<!--========================================================================-->
+<h2><a name="lower-case-def">char-set:lower-case</a></h2>
+<p>
+For Unicode, we follow Java's specification: a character is lowercase if
+<ul>
+<li> it is not in the range [U+2000,U+2FFF], and
+<li> the Unicode attribute table does not give a lowercase mapping for it, and
+<li> at least one of the following is true:
+  <ul>
+  <li> the Unicode attribute table gives a mapping to uppercase 
+    for the character, or
+  <li> the name for the character in the Unicode attribute table contains
+    the words "SMALL LETTER" or "SMALL LIGATURE".
+  </ul>
+</ul>
+
+<p>
+The lower-case ASCII characters are 
+<div class=inset>
+    abcdefghijklmnopqrstuvwxyz
+</div>
+<p class=continue>
+Latin-1 adds another 33 lower-case characters to the ASCII set:
+<div class=inset>
+<table cellpadding=0 cellspacing=0>
+<tr><td>00B5</td> <td>MICRO SIGN</td></tr>
+<tr><td>00DF</td> <td>LATIN SMALL LETTER SHARP S</td></tr>
+<tr><td>00E0</td> <td>LATIN SMALL LETTER A WITH GRAVE</td></tr>
+<tr><td>00E1</td> <td>LATIN SMALL LETTER A WITH ACUTE</td></tr>
+<tr><td>00E2</td> <td>LATIN SMALL LETTER A WITH CIRCUMFLEX</td></tr>
+<tr><td>00E3</td> <td>LATIN SMALL LETTER A WITH TILDE</td></tr>
+<tr><td>00E4</td> <td>LATIN SMALL LETTER A WITH DIAERESIS</td></tr>
+<tr><td>00E5</td> <td>LATIN SMALL LETTER A WITH RING ABOVE</td></tr>
+<tr><td>00E6</td> <td>LATIN SMALL LETTER AE</td></tr>
+<tr><td>00E7</td> <td>LATIN SMALL LETTER C WITH CEDILLA</td></tr>
+<tr><td>00E8</td> <td>LATIN SMALL LETTER E WITH GRAVE</td></tr>
+<tr><td>00E9</td> <td>LATIN SMALL LETTER E WITH ACUTE</td></tr>
+<tr><td>00EA</td> <td>LATIN SMALL LETTER E WITH CIRCUMFLEX</td></tr>
+<tr><td>00EB</td> <td>LATIN SMALL LETTER E WITH DIAERESIS</td></tr>
+<tr><td>00EC</td> <td>LATIN SMALL LETTER I WITH GRAVE</td></tr>
+<tr><td>00ED</td> <td>LATIN SMALL LETTER I WITH ACUTE</td></tr>
+<tr><td>00EE</td> <td>LATIN SMALL LETTER I WITH CIRCUMFLEX</td></tr>
+<tr><td>00EF</td> <td>LATIN SMALL LETTER I WITH DIAERESIS</td></tr>
+<tr><td>00F0</td> <td>LATIN SMALL LETTER ETH</td></tr>
+<tr><td>00F1</td> <td>LATIN SMALL LETTER N WITH TILDE</td></tr>
+<tr><td>00F2</td> <td>LATIN SMALL LETTER O WITH GRAVE</td></tr>
+<tr><td>00F3</td> <td>LATIN SMALL LETTER O WITH ACUTE</td></tr>
+<tr><td>00F4</td> <td>LATIN SMALL LETTER O WITH CIRCUMFLEX</td></tr>
+<tr><td>00F5</td> <td>LATIN SMALL LETTER O WITH TILDE</td></tr>
+<tr><td>00F6</td> <td>LATIN SMALL LETTER O WITH DIAERESIS</td></tr>
+<tr><td>00F8</td> <td>LATIN SMALL LETTER O WITH STROKE</td></tr>
+<tr><td>00F9</td> <td>LATIN SMALL LETTER U WITH GRAVE</td></tr>
+<tr><td>00FA</td> <td>LATIN SMALL LETTER U WITH ACUTE</td></tr>
+<tr><td>00FB</td> <td>LATIN SMALL LETTER U WITH CIRCUMFLEX</td></tr>
+<tr><td>00FC</td> <td>LATIN SMALL LETTER U WITH DIAERESIS</td></tr>
+<tr><td>00FD</td> <td>LATIN SMALL LETTER Y WITH ACUTE</td></tr>
+<tr><td>00FE</td> <td>LATIN SMALL LETTER THORN</td></tr>
+<tr><td>00FF</td> <td>LATIN SMALL LETTER Y WITH DIAERESIS</td></tr>
+</table>
+</div>
+<p class=continue>
+Note that three of these have no corresponding Latin-1 upper-case character:
+<div class=inset>
+<table cellpadding=0 cellspacing=0>
+<tr><td>00B5</td> <td>MICRO SIGN</td></tr>
+<tr><td>00DF</td> <td>LATIN SMALL LETTER SHARP S</td></tr>
+<tr><td>00FF</td> <td>LATIN SMALL LETTER Y WITH DIAERESIS</td></tr>
+</table>
+</div>
+<p class=continue>
+(The compatibility micro character uppercases to the non-Latin-1 Greek capital
+mu; the German sharp s character uppercases to the pair of characters "SS,"
+and the capital y-with-diaeresis is non-Latin-1.)
+
+<p>
+(Note that the Java spec for lowercase characters given at
+<div class=inset>
+<a href="http://java.sun.com/docs/books/jls/html/javalang.doc4.html#14345">
+http://java.sun.com/docs/books/jls/html/javalang.doc4.html#14345</a>
+</div>
+<p class=continue>
+is inconsistent. U+00B5 MICRO SIGN fulfills the requirements for a lower-case
+character (as of Unicode 3.0), but is not given in the numeric list of
+lower-case character codes.)
+
+<p>
+(Note that the Java spec for <code>isLowerCase()</code> given at
+<div class=inset>
+<a href="http://java.sun.com/products/jdk/1.2/docs/api/java/lang/Character.html#isLowerCase(char)">
+http://java.sun.com/products/jdk/1.2/docs/api/java/lang/Character.html#isLowerCase(char)</a>
+</div>
+<p class=continue>
+gives three mutually inconsistent definitions of "lower case." The first is
+the definition used in this SRFI. Following text says "A character is
+considered to be lowercase if and only if it is specified to be lowercase by
+the Unicode 2.0 standard (category Ll in the Unicode specification data
+file)." The former spec excludes U+00AA FEMININE ORDINAL INDICATOR and
+U+00BA MASCULINE ORDINAL INDICATOR; the latter spec includes them. Finally,
+the spec enumerates a list of characters in the Latin-1 subset; this list
+excludes U+00B5 MICRO SIGN, which is included in both of the previous specs.) 
+
+<!--========================================================================-->
+<h2><a name="upper-case-def">char-set:upper-case</a></h2>
+<p>
+For Unicode, we follow Java's specification: a character is uppercase if
+<ul>
+<li> it is not in the range [U+2000,U+2FFF], and
+<li> the Unicode attribute table does not give an uppercase mapping for it
+(this excludes titlecase characters), and
+<li> at least one of the following is true:
+  <ul>
+  <li> the Unicode attribute table gives a mapping to lowercase 
+    for the character, or
+  <li> the name for the character in the Unicode attribute table contains
+    the words "CAPITAL LETTER" or "CAPITAL LIGATURE".
+  </ul>
+</ul>
+
+<p>
+The upper-case ASCII characters are 
+<div class=inset>
+ABCDEFGHIJKLMNOPQRSTUVWXYZ
+</div>
+<p class=continue>
+Latin-1 adds another 30 upper-case characters to the ASCII set:
+<div class=inset>
+<table cellspacing=0 cellpadding=0>
+<tr><td>00C0</td> <td>LATIN CAPITAL LETTER A WITH GRAVE</td></tr>
+<tr><td>00C1</td> <td>LATIN CAPITAL LETTER A WITH ACUTE</td></tr>
+<tr><td>00C2</td> <td>LATIN CAPITAL LETTER A WITH CIRCUMFLEX</td></tr>
+<tr><td>00C3</td> <td>LATIN CAPITAL LETTER A WITH TILDE</td></tr>
+<tr><td>00C4</td> <td>LATIN CAPITAL LETTER A WITH DIAERESIS</td></tr>
+<tr><td>00C5</td> <td>LATIN CAPITAL LETTER A WITH RING ABOVE</td></tr>
+<tr><td>00C6</td> <td>LATIN CAPITAL LETTER AE</td></tr>
+<tr><td>00C7</td> <td>LATIN CAPITAL LETTER C WITH CEDILLA</td></tr>
+<tr><td>00C8</td> <td>LATIN CAPITAL LETTER E WITH GRAVE</td></tr>
+<tr><td>00C9</td> <td>LATIN CAPITAL LETTER E WITH ACUTE</td></tr>
+<tr><td>00CA</td> <td>LATIN CAPITAL LETTER E WITH CIRCUMFLEX</td></tr>
+<tr><td>00CB</td> <td>LATIN CAPITAL LETTER E WITH DIAERESIS</td></tr>
+<tr><td>00CC</td> <td>LATIN CAPITAL LETTER I WITH GRAVE</td></tr>
+<tr><td>00CD</td> <td>LATIN CAPITAL LETTER I WITH ACUTE</td></tr>
+<tr><td>00CE</td> <td>LATIN CAPITAL LETTER I WITH CIRCUMFLEX</td></tr>
+<tr><td>00CF</td> <td>LATIN CAPITAL LETTER I WITH DIAERESIS</td></tr>
+<tr><td>00D0</td> <td>LATIN CAPITAL LETTER ETH</td></tr>
+<tr><td>00D1</td> <td>LATIN CAPITAL LETTER N WITH TILDE</td></tr>
+<tr><td>00D2</td> <td>LATIN CAPITAL LETTER O WITH GRAVE</td></tr>
+<tr><td>00D3</td> <td>LATIN CAPITAL LETTER O WITH ACUTE</td></tr>
+<tr><td>00D4</td> <td>LATIN CAPITAL LETTER O WITH CIRCUMFLEX</td></tr>
+<tr><td>00D5</td> <td>LATIN CAPITAL LETTER O WITH TILDE</td></tr>
+<tr><td>00D6</td> <td>LATIN CAPITAL LETTER O WITH DIAERESIS</td></tr>
+<tr><td>00D8</td> <td>LATIN CAPITAL LETTER O WITH STROKE</td></tr>
+<tr><td>00D9</td> <td>LATIN CAPITAL LETTER U WITH GRAVE</td></tr>
+<tr><td>00DA</td> <td>LATIN CAPITAL LETTER U WITH ACUTE</td></tr>
+<tr><td>00DB</td> <td>LATIN CAPITAL LETTER U WITH CIRCUMFLEX</td></tr>
+<tr><td>00DC</td> <td>LATIN CAPITAL LETTER U WITH DIAERESIS</td></tr>
+<tr><td>00DD</td> <td>LATIN CAPITAL LETTER Y WITH ACUTE</td></tr>
+<tr><td>00DE</td> <td>LATIN CAPITAL LETTER THORN</td></tr>
+</table>
+</div>
+<!--========================================================================-->
+<h2><a name="title-case-def">char-set:title-case</a></h2>
+<p>
+In Unicode, a character is titlecase if it has the category Lt in
+the character attribute database. There are very few of these characters;
+here is the entire 31-character list as of Unicode 3.0:
+<div class=inset>
+<table cellspacing=0 cellpadding=0>
+<tr><td>01C5 </td><td nowrap> LATIN CAPITAL LETTER D WITH SMALL LETTER Z WITH CARON
+</td></tr>
+<tr><td>01C8 </td><td nowrap> LATIN CAPITAL LETTER L WITH SMALL LETTER J
+</td></tr>
+<tr><td>01CB </td><td nowrap> LATIN CAPITAL LETTER N WITH SMALL LETTER J
+</td></tr>
+<tr><td>01F2 </td><td nowrap> LATIN CAPITAL LETTER D WITH SMALL LETTER Z
+</td></tr>
+<tr><td>1F88 </td><td nowrap> GREEK CAPITAL LETTER ALPHA WITH PSILI AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F89 </td><td nowrap> GREEK CAPITAL LETTER ALPHA WITH DASIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F8A </td><td nowrap> GREEK CAPITAL LETTER ALPHA WITH PSILI AND VARIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F8B </td><td nowrap> GREEK CAPITAL LETTER ALPHA WITH DASIA AND VARIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F8C </td><td nowrap> GREEK CAPITAL LETTER ALPHA WITH PSILI AND OXIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F8D </td><td nowrap> GREEK CAPITAL LETTER ALPHA WITH DASIA AND OXIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F8E </td><td nowrap> GREEK CAPITAL LETTER ALPHA WITH PSILI AND PERISPOMENI AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F8F </td><td nowrap> GREEK CAPITAL LETTER ALPHA WITH DASIA AND PERISPOMENI AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F98 </td><td nowrap> GREEK CAPITAL LETTER ETA WITH PSILI AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F99 </td><td nowrap> GREEK CAPITAL LETTER ETA WITH DASIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F9A </td><td nowrap> GREEK CAPITAL LETTER ETA WITH PSILI AND VARIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F9B </td><td nowrap> GREEK CAPITAL LETTER ETA WITH DASIA AND VARIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F9C </td><td nowrap> GREEK CAPITAL LETTER ETA WITH PSILI AND OXIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F9D </td><td nowrap> GREEK CAPITAL LETTER ETA WITH DASIA AND OXIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F9E </td><td nowrap> GREEK CAPITAL LETTER ETA WITH PSILI AND PERISPOMENI AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1F9F </td><td nowrap> GREEK CAPITAL LETTER ETA WITH DASIA AND PERISPOMENI AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1FA8 </td><td nowrap> GREEK CAPITAL LETTER OMEGA WITH PSILI AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1FA9 </td><td nowrap> GREEK CAPITAL LETTER OMEGA WITH DASIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1FAA </td><td nowrap> GREEK CAPITAL LETTER OMEGA WITH PSILI AND VARIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1FAB </td><td nowrap> GREEK CAPITAL LETTER OMEGA WITH DASIA AND VARIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1FAC </td><td nowrap> GREEK CAPITAL LETTER OMEGA WITH PSILI AND OXIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1FAD </td><td nowrap> GREEK CAPITAL LETTER OMEGA WITH DASIA AND OXIA AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1FAE </td><td nowrap> GREEK CAPITAL LETTER OMEGA WITH PSILI AND PERISPOMENI AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1FAF </td><td nowrap> GREEK CAPITAL LETTER OMEGA WITH DASIA AND PERISPOMENI AND PROSGEGRAMMENI
+</td></tr>
+<tr><td>1FBC </td><td nowrap> GREEK CAPITAL LETTER ALPHA WITH PROSGEGRAMMENI
+</td></tr>
+<tr><td>1FCC </td><td nowrap> GREEK CAPITAL LETTER ETA WITH PROSGEGRAMMENI
+</td></tr>
+<tr><td>1FFC </td><td nowrap> GREEK CAPITAL LETTER OMEGA WITH PROSGEGRAMMENI
+</td></tr>
+</table>
+</div>
+<p>
+There are no ASCII or Latin-1 titlecase characters.
+
+
+<!--========================================================================-->
+<h2><a name="letter-def">char-set:letter</a></h2>
+<p>
+In Unicode, a letter is any character with one of the letter categories
+(Lu, Ll, Lt, Lm, Lo) in the Unicode character database. 
+
+<p>
+There are 52 ASCII letters
+<div class=indent>
+    abcdefghijklmnopqrstuvwxyz <br>
+    ABCDEFGHIJKLMNOPQRSTUVWXYZ <br>
+</div>
+<p>
+There are 117 Latin-1 letters. These are the 115 characters that are
+members of the Latin-1 <code>char-set:lower-case</code> and <code>char-set:upper-case</code> sets, 
+plus
+<div class=inset>
+<table cellspacing=0 cellpadding=0>
+<tr><td>00AA</td> <td>FEMININE ORDINAL INDICATOR</td></tr>
+<tr><td>00BA</td> <td>MASCULINE ORDINAL INDICATOR</td></tr>
+</table>
+</div>
+<p class=continue>
+(These two letters are considered lower-case by Unicode, but not by
+Java or SRFI 14.)
+
+<!--========================================================================-->
+<h2><a name="digit-def">char-set:digit</a></h2>
+
+<p>
+In Unicode, a character is a digit if it has the category Nd in
+the character attribute database. In Latin-1 and ASCII, the only
+such characters are 0123456789. In Unicode, there are other digit
+characters in other code blocks, such as Gujarati digits and Tibetan
+digits.
+
+
+<!--========================================================================-->
+<h2><a name="hex-digit-def">char-set:hex-digit</a></h2>
+<p>
+The only hex digits are 0123456789abcdefABCDEF.
+
+
+<!--========================================================================-->
+<h2><a name="letter+digit-def">char-set:letter+digit</a></h2>
+<p>
+The union of <code>char-set:letter</code> and <code>char-set:digit.</code>
+
+<!--========================================================================-->
+<h2><a name="graphic-def">char-set:graphic</a></h2>
+<p>
+A graphic character is one that would put ink on paper. The ASCII and Latin-1
+graphic characters are the members of
+<div class=inset>
+<table cellspacing=0 cellpadding=0>
+<tr><td><code>char-set:letter</code></td></tr>
+<tr><td><code>char-set:digit</code></td></tr>
+<tr><td><code>char-set:punctuation</code></td></tr>
+<tr><td><code>char-set:symbol</code></td></tr>
+</table>
+</div>
+
+<!--========================================================================-->
+<h2><a name="printing-def">char-set:printing</a></h2>
+<p>
+A printing character is one that would occupy space when printed, <em>i.e.</em>,
+a graphic character or a space character. <code>char-set:printing</code> is the union
+of <code>char-set:whitespace</code> and <code>char-set:graphic.</code>
+
+<!--========================================================================-->
+<h2><a name="whitespace-def">char-set:whitespace</a></h2>
+<p>
+In Unicode, a whitespace character is either
+<ul>
+  <li> a character with one of the space, line, or paragraph separator categories
+    (Zs, Zl or Zp) of the Unicode character database.
+  <li> U+0009 Horizontal tabulation (\t control-I)
+  <li> U+000A Line feed (\n control-J)
+  <li> U+000B Vertical tabulation (\v control-K)
+  <li> U+000C Form feed (\f control-L)
+  <li> U+000D Carriage return (\r control-M)
+</ul>
+
+<p>
+There are 24 whitespace characters in Unicode 3.0:
+<div class=inset>
+<table cellspacing=0 cellpadding=0>
+<tr><td>0009</td> <td>HORIZONTAL TABULATION </td> <td>  \t control-I</td></tr>
+<tr><td>000A</td> <td>LINE FEED         </td> <td> \n control-J</td></tr>
+<tr><td>000B</td> <td>VERTICAL TABULATION       </td> <td> \v control-K</td></tr>
+<tr><td>000C</td> <td>FORM FEED         </td> <td> \f control-L</td></tr>
+<tr><td>000D</td> <td>CARRIAGE RETURN   </td> <td> \r control-M</td></tr>
+<tr><td>0020</td> <td>SPACE                     </td> <td> Zs</td></tr>
+<tr><td>00A0</td> <td>NO-BREAK SPACE    </td> <td> Zs</td></tr>
+<tr><td>1680</td> <td>OGHAM SPACE MARK  </td> <td> Zs</td></tr>
+<tr><td>2000</td> <td>EN QUAD           </td> <td> Zs</td></tr>
+<tr><td>2001</td> <td>EM QUAD           </td> <td> Zs</td></tr>
+<tr><td>2002</td> <td>EN SPACE          </td> <td> Zs</td></tr>
+<tr><td>2003</td> <td>EM SPACE          </td> <td> Zs</td></tr>
+<tr><td>2004</td> <td>THREE-PER-EM SPACE        </td> <td> Zs</td></tr>
+<tr><td>2005</td> <td>FOUR-PER-EM SPACE </td> <td> Zs</td></tr>
+<tr><td>2006</td> <td>SIX-PER-EM SPACE  </td> <td> Zs</td></tr>
+<tr><td>2007</td> <td>FIGURE SPACE              </td> <td> Zs</td></tr>
+<tr><td>2008</td> <td>PUNCTUATION SPACE </td> <td> Zs</td></tr>
+<tr><td>2009</td> <td>THIN SPACE                </td> <td> Zs</td></tr>
+<tr><td>200A</td> <td>HAIR SPACE                </td> <td> Zs</td></tr>
+<tr><td>200B</td> <td>ZERO WIDTH SPACE  </td> <td> Zs</td></tr>
+<tr><td>2028</td> <td>LINE SEPARATOR    </td> <td> Zl</td></tr>
+<tr><td>2029</td> <td>PARAGRAPH SEPARATOR       </td> <td> Zp</td></tr>
+<tr><td>202F</td> <td>NARROW NO-BREAK SPACE     </td> <td> Zs</td></tr>
+<tr><td>3000</td> <td>IDEOGRAPHIC SPACE </td> <td> Zs</td></tr>
+</table>
+</div>
+<p>
+The ASCII whitespace characters are the first six characters in the above list
+-- line feed, horizontal tabulation, vertical tabulation, form feed, carriage
+return, and space. These are also exactly the characters recognised by the
+Posix <code>isspace()</code> procedure. Latin-1 adds the no-break space.
+
+<p>
+Note: Java's <code>isWhitespace()</code> method is incompatible, including
+<div class=inset>
+<table cellspacing=0 cellpadding=0>
+<tr><td>0009</td> <td>HORIZONTAL TABULATION </td> <td>  (\t control-I)</td></tr>
+<tr><td>001C</td> <td>FILE SEPARATOR   </td> <td> (control-\)</td></tr>
+<tr><td>001D</td> <td>GROUP SEPARATOR  </td> <td>(control-])</td></tr>
+<tr><td>001E</td> <td>RECORD SEPARATOR </td> <td>(control-^)</td></tr>
+<tr><td>001F</td> <td>UNIT SEPARATOR   </td> <td>(control-_)</td></tr>
+</table>
+</div>
+<p class=continue>
+and excluding
+<div class=inset>
+<table cellspacing=0 cellpadding=0>
+<tr><td>00A0</td> <td>NO-BREAK SPACE</td></tr>
+</table>
+</div>
+<p>
+Java's excluding the no-break space means that tokenizers can simply break
+character streams at "whitespace" boundaries. However, the exclusion introduces
+exceptions in other places, <em>e.g.</em> <code>char-set:printing</code> is no longer simply the
+union of <code>char-set:graphic</code> and <code>char-set:whitespace.</code>
+
+
+<!--========================================================================-->
+<h2><a name="iso-control-def">char-set:iso-control</a></h2>
+<p>
+The ISO control characters are the Unicode/Latin-1 characters in the ranges
+[U+0000,U+001F] and [U+007F,U+009F].
+
+<p>
+ASCII restricts this set to the characters in the range [U+0000,U+001F] 
+plus the character U+007F.
+
+<p>
+Note that Unicode defines other control characters which do not belong to this
+set (hence the qualifying prefix "iso-" in the name). This restriction is
+compatible with the Java <code>isISOControl()</code> method.
+
+
+<!--========================================================================-->
+<h2><a name="punctuation-def">char-set:punctuation</a></h2>
+<p>
+In Unicode, a punctuation character is any character that has one of the
+punctuation categories in the Unicode character database (Pc, Pd, Ps,
+Pe, Pi, Pf, or Po).
+
+<p>
+ASCII has 23 punctuation characters:
+<pre class=code-example>
+!"#%&amp;'()*,-./:;?@[\]_{}
+</pre>
+<p>
+Latin-1 adds six more:
+<div class=inset>
+<table cellspacing=0 cellpadding=0>
+<tr><td>00A1 </td> <td> INVERTED EXCLAMATION MARK </td></tr>
+<tr><td>00AB </td> <td> LEFT-POINTING DOUBLE ANGLE QUOTATION MARK </td></tr>
+<tr><td>00AD </td> <td> SOFT HYPHEN </td></tr>
+<tr><td>00B7 </td> <td> MIDDLE DOT </td></tr>
+<tr><td>00BB </td> <td> RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK </td></tr>
+<tr><td>00BF </td> <td> INVERTED QUESTION MARK </td></tr>
+</table>
+</div>
+
+<p>
+Note that the nine ASCII characters <code>$+&lt;=&gt;^`|~</code> are <em>not</em>
+punctuation. They are "symbols."
+
+
+<!--========================================================================-->
+<h2><a name="symbol-def">char-set:symbol</a></h2>
+<p>
+In Unicode, a symbol is any character that has one of the symbol categories
+in the Unicode character database (Sm, Sc, Sk, or So). There
+are nine ASCII symbol characters:
+<pre class=code-example>
+$+&lt;=&gt;^`|~
+</pre>
+<p>
+Latin-1 adds 18 more:
+<div class=inset>
+<table cellspacing=0 cellpadding=0>
+<tr><td>00A2 </td> <td> CENT SIGN </td></tr>
+<tr><td>00A3 </td> <td> POUND SIGN </td></tr>
+<tr><td>00A4 </td> <td> CURRENCY SIGN </td></tr>
+<tr><td>00A5 </td> <td> YEN SIGN </td></tr>
+<tr><td>00A6 </td> <td> BROKEN BAR </td></tr>
+<tr><td>00A7 </td> <td> SECTION SIGN </td></tr>
+<tr><td>00A8 </td> <td> DIAERESIS </td></tr>
+<tr><td>00A9 </td> <td> COPYRIGHT SIGN </td></tr>
+<tr><td>00AC </td> <td> NOT SIGN </td></tr>
+<tr><td>00AE </td> <td> REGISTERED SIGN </td></tr>
+<tr><td>00AF </td> <td> MACRON </td></tr>
+<tr><td>00B0 </td> <td> DEGREE SIGN </td></tr>
+<tr><td>00B1 </td> <td> PLUS-MINUS SIGN </td></tr>
+<tr><td>00B4 </td> <td> ACUTE ACCENT </td></tr>
+<tr><td>00B6 </td> <td> PILCROW SIGN </td></tr>
+<tr><td>00B8 </td> <td> CEDILLA </td></tr>
+<tr><td>00D7 </td> <td> MULTIPLICATION SIGN </td></tr>
+<tr><td>00F7 </td> <td> DIVISION SIGN </td></tr>
+</table>
+</div>
+
+<!--========================================================================-->
+<h2><a name="blank-def">char-set:blank</a></h2>
+
+<p>
+Blank chars are horizontal whitespace. In Unicode, a blank character is either
+<ul>
+  <li> a character with the space separator category (Zs) in the Unicode 
+    character database.
+  <li> U+0009 Horizontal tabulation (\t control-I)
+</ul>
+
+<p>
+There are eighteen blank characters in Unicode 3.0:
+<div class=inset>
+<table cellspacing=0 cellpadding=0>
+<tr><td>0009 </td> <td> HORIZONTAL TABULATION   </td> <td> \t control-I </td></tr>
+<tr><td>0020 </td> <td> SPACE                   </td> <td> Zs </td></tr>
+<tr><td>00A0 </td> <td> NO-BREAK SPACE  </td> <td> Zs </td></tr>
+<tr><td>1680 </td> <td> OGHAM SPACE MARK        </td> <td> Zs </td></tr>
+<tr><td>2000 </td> <td> EN QUAD         </td> <td> Zs </td></tr>
+<tr><td>2001 </td> <td> EM QUAD         </td> <td> Zs </td></tr>
+<tr><td>2002 </td> <td> EN SPACE                </td> <td> Zs </td></tr>
+<tr><td>2003 </td> <td> EM SPACE                </td> <td> Zs </td></tr>
+<tr><td>2004 </td> <td> THREE-PER-EM SPACE      </td> <td> Zs </td></tr>
+<tr><td>2005 </td> <td> FOUR-PER-EM SPACE       </td> <td> Zs </td></tr>
+<tr><td>2006 </td> <td> SIX-PER-EM SPACE        </td> <td> Zs </td></tr>
+<tr><td>2007 </td> <td> FIGURE SPACE            </td> <td> Zs </td></tr>
+<tr><td>2008 </td> <td> PUNCTUATION SPACE       </td> <td> Zs </td></tr>
+<tr><td>2009 </td> <td> THIN SPACE              </td> <td> Zs </td></tr>
+<tr><td>200A </td> <td> HAIR SPACE              </td> <td> Zs </td></tr>
+<tr><td>200B </td> <td> ZERO WIDTH SPACE        </td> <td> Zs </td></tr>
+<tr><td>202F </td> <td> NARROW NO-BREAK SPACE   </td> <td> Zs </td></tr>
+<tr><td>3000 </td> <td> IDEOGRAPHIC SPACE       </td> <td> Zs </td></tr>
+</table>
+</div>
+<p>
+The ASCII blank characters are the first two characters above --
+horizontal tab and space. Latin-1 adds the no-break space.
+
+<p>
+Java doesn't have the concept of "blank" characters, so there are no
+compatibility issues.
+
+
+<!--========================================================================-->
+<h1><a name="ReferenceImp">Reference implementation</a></h1>
+<p>
+This SRFI comes with a reference implementation. It resides at:
+<div class=inset>
+    <a href="http://srfi.schemers.org/srfi-14/srfi-14.scm">
+http://srfi.schemers.org/srfi-14/srfi-14.scm</a>
+</div>
+<p class=continue>
+I have placed this source on the Net with an unencumbered, "open" copyright.
+Some of the code in the reference implementation bears a distant family
+relation to the MIT Scheme implementation, and being derived from that code,
+is covered by the MIT Scheme copyright (which is a generic BSD-style
+open-source copyright -- see the source file for details). The remainder of
+the code was written by myself for scsh or for this SRFI; I have placed this
+code under the scsh copyright, which is also a generic BSD-style open-source
+copyright.
+
+<p>
+The code is written for portability and should be simple to port to
+any Scheme. It has only the following deviations from R4RS, clearly
+discussed in the comments:
+<ul>
+  <li> an <code>error</code> procedure;
+  <li> the R5RS <code>values</code> procedure for producing multiple return values;
+  <li> a simple <code>check-arg</code> procedure for argument checking;
+  <li> <code>let-optionals*</code> and <code>:optional</code> macros for parsing, checking and defaulting
+    optional arguments from rest lists;
+  <li> The SRFI-9 <code>define-record-type</code> form;
+  <li> <code>bitwise-and</code> for the hash function;
+  <li> <code>%latin1->char</code> and <code>%char->latin1</code>.
+</ul>
+
+<p>
+The library is written for clarity and well-commented; the current source is
+about 375 lines of source code and 375 lines of comments and white space.
+It is also written for efficiency. Fast paths are provided for common cases.
+
+<p>
+This is not to say that the implementation can't be tuned up for
+a specific Scheme implementation. There are notes in comments addressing
+ways implementors can tune the reference implementation for performance.
+
+<p>
+In short, I've written the reference implementation to make it as painless
+as possible for an implementor -- or a regular programmer -- to adopt this
+library and get good results with it.
+
+<p>
+The code uses a rather simple-minded, inefficient representation for
+ASCII/Latin-1 char-sets -- a 256-character string. The character whose code is
+<var>i</var> is in the set if <var>s[i]</var> = ASCII 1 (soh, or ^a); 
+not in the set if <var>s[i]</var> = ASCII 0 (nul). 
+A much faster and denser representation would be 16 or 32 bytes worth
+of bit string. A portable implementation using bit sets awaits standards for
+bitwise logical-ops and byte vectors.
+
+<p>
+"Large" character types, such as Unicode, should use a sparse representation,
+taking care that the Latin-1 subset continues to be represented with a
+dense 32-byte bit set.
+
+
+<!--========================================================================-->
+<h1><a name="Acknowledgements">Acknowledgements</a></h1>
+<p>
+The design of this library benefited greatly from the feedback provided during
+the SRFI discussion phase. Among those contributing thoughtful commentary and
+suggestions, both on the mailing list and by private discussion, were Paolo
+Amoroso, Lars Arvestad, Alan Bawden, Jim Bender, Dan Bornstein, Per Bothner,
+Will Clinger, Brian Denheyer, Kent Dybvig, Sergei Egorov, Marc Feeley,
+Matthias Felleisen, Will Fitzgerald, Matthew Flatt, Arthur A. Gleckler, Ben
+Goetter, Sven Hartrumpf, Erik Hilsdale, Shiro Kawai, Richard Kelsey, Oleg
+Kiselyov, Bengt Kleberg, Donovan Kolbly, Bruce Korb, Shriram Krishnamurthi,
+Bruce Lewis, Tom Lord, Brad Lucier, Dave Mason, David Rush, Klaus Schilling,
+Jonathan Sobel, Mike Sperber, Mikael Staldal, Vladimir Tsyshevsky, Donald
+Welsh, and Mike Wilson. I am grateful to them for their assistance.
+
+<p>
+I am also grateful to the authors, implementors and documentors of all the
+systems mentioned in the introduction. Aubrey Jaffer should be noted for his
+work in producing Web-accessible versions of the R5RS spec, which was a
+tremendous aid.
+
+<p>
+This is not to imply that these individuals necessarily endorse the final
+results, of course. 
+
+<p>
+During this document's long development period, great patience was exhibited
+by Mike Sperber, who is the editor for the SRFI, and by Hillary Sullivan,
+who is not.
+
+<!--========================================================================-->
+<h1><a name="Links">References &amp; links</a></h1>
+
+<dl>
+<dt class=biblio><strong><a name="Java">[Java]</a></strong>
+<dd>
+    The following URLs provide documentation on relevant Java classes. <br>
+
+    <a href="http://java.sun.com/products/jdk/1.2/docs/api/java/lang/Character.html">http://java.sun.com/products/jdk/1.2/docs/api/java/lang/Character.html</a>
+    <br>
+    <a href="http://java.sun.com/products/jdk/1.2/docs/api/java/lang/String.html">http://java.sun.com/products/jdk/1.2/docs/api/java/lang/String.html</a>
+    <br>
+    <a href="http://java.sun.com/products/jdk/1.2/docs/api/java/lang/StringBuffer.html">http://java.sun.com/products/jdk/1.2/docs/api/java/lang/StringBuffer.html</a>
+    <br>
+    <a href="http://java.sun.com/products/jdk/1.2/docs/api/java/text/Collator.html">http://java.sun.com/products/jdk/1.2/docs/api/java/text/Collator.html</a>
+    <br>
+    <a href="http://java.sun.com/products/jdk/1.2/docs/api/java/text/package-summary.html">http://java.sun.com/products/jdk/1.2/docs/api/java/text/package-summary.html</a>
+
+<dt class=biblio><strong><a name="MIT-Scheme">[MIT-Scheme]</a></strong>
+<dd>
+    <a href="http://www.swiss.ai.mit.edu/projects/scheme/">http://www.swiss.ai.mit.edu/projects/scheme/</a>
+
+<dt class=biblio><strong><a name="R5RS">[R5RS]</a></strong></dt>
+<dd>Revised<sup>5</sup> report on the algorithmic language Scheme.<br>
+    R. Kelsey, W. Clinger, J. Rees (editors). <br>
+    Higher-Order and Symbolic Computation, Vol. 11, No. 1, September, 1998. <br>
+    and ACM SIGPLAN Notices, Vol. 33, No. 9, October, 1998. <br>
+    Available at <a href="http://www.schemers.org/Documents/Standards/">
+    http://www.schemers.org/Documents/Standards/</a>.
+
+<dt class=biblio><strong>[SRFI]</strong></dt>
+<dd>
+    The SRFI web site. <br>
+    <a href="http://srfi.schemers.org/">http://srfi.schemers.org/</a>
+
+<dt class=biblio><strong>[SRFI-14]</strong></dt>
+<dd>
+    SRFI-14: Character-set library. <br>
+    <a href="http://srfi.schemers.org/srfi-14/">http://srfi.schemers.org/srfi-14/</a>
+
+    <dl>    
+    <dt>
+      This document, in HTML:
+    <dd><a href="http://srfi.schemers.org/srfi-14/srfi-14.html">
+        http://srfi.schemers.org/srfi-14/srfi-14.html</a>
+
+    <dt>
+      This document, in plain text format:
+    <dd><a href="http://srfi.schemers.org/srfi-14/srfi-14.txt">
+        http://srfi.schemers.org/srfi-14/srfi-14.txt</a>
+
+    <dt> Source code for the reference implementation:
+    <dd>
+      <a href="http://srfi.schemers.org/srfi-14/srfi-14.scm">
+         http://srfi.schemers.org/srfi-14/srfi-14.scm</a>
+
+    <dt> Scheme 48 module specification, with typings:
+    <dd>
+      <a href="http://srfi.schemers.org/srfi-14/srfi-14-s48-module.scm">
+        http://srfi.schemers.org/srfi-14/srfi-14-s48-module.scm</a>
+
+    <dt> Regression-test suite:
+    <dd> <a href="http://srfi.schemers.org/srfi-14/srfi-14-tests.scm">
+         http://srfi.schemers.org/srfi-14/srfi-14-tests.scm</a>
+
+    </dl>
+</dd>
+
+<dt class=biblio><strong><a name="Unicode">[Unicode]</a></strong>
+<dd>
+    <a href="http://www.unicode.org/">http://www.unicode.org/</a>
+
+<dt class=biblio><strong><a name="UnicodeData">[UnicodeData]</a></strong>
+<dd>
+    The Unicode character database. <br>
+    <a href="ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.txt">ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.txt</a>
+    <br>
+    <a href="ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.html">ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.html</a>
+</dl>
+
+<!--========================================================================-->
+<h1><a name="Copyright">Copyright</a></h1>
+
+<p>
+Certain portions of this document -- the specific, marked segments of text
+describing the <abbr title="Revised^5 Report on Scheme"><a href="#R5RS">R5RS</a></abbr> procedures -- were adapted with permission from the R5RS
+report.
+    
+<p>
+All other text is copyright (C) Olin Shivers (1998, 1999, 2000). 
+All Rights Reserved. 
+
+<p>
+This document and translations of it may be copied and furnished to others,
+and derivative works that comment on or otherwise explain it or assist in its
+implementation may be prepared, copied, published and distributed, in whole or
+in part, without restriction of any kind, provided that the above copyright
+notice and this paragraph are included on all such copies and derivative
+works. However, this document itself may not be modified in any way, such as
+by removing the copyright notice or references to the Scheme Request For
+Implementation process or editors, except as needed for the purpose of
+developing SRFIs in which case the procedures for copyrights defined in the
+SRFI process must be followed, or as required to translate it into languages
+other than English.
+
+<p>
+The limited permissions granted above are perpetual and will not be revoked by
+the authors or their successors or assigns.
+
+<p>
+This document and the information contained herein is provided on an
+"<strong>as is</strong>" basis and <strong>the authors and the SRFI editors
+disclaim all warranties, express or implied, including but not limited to any
+warranty that the use of the information herein will not infringe any rights
+or any implied warranties of merchantability or fitness for a particular
+purpose.</strong>
+
+</body>
+</html>
+<!--
+  LocalWords:  SRFI refs HTML css hackery sans Netscape td pre div para
+  LocalWords:  proc def procs defi's defn dl dt defi dd NS RS rs procx
+  LocalWords:  stylesheet IE biblio IE's Internationalisation ascii doc
+  LocalWords:  normalisation lib ref ci ok titlecase upcase downcase
+  LocalWords:  xsubstring xcopy tokenize kmp slib RScheme MzScheme init
+  LocalWords:  Bigloo Chez APL SML Unicode API eszet SS dz downcases
+  LocalWords:  titlecasing normalised normalise underbar ss eq vs dict
+  LocalWords:  backquote parameterised denmark taiwan UnicodeData txt
+  LocalWords:  pred nchars obj len cBa epilog foo baz wrt subst tstart
+  LocalWords:  Szilagyi zilagyi cs abcdefgh ca cd cond eek ee tHIS com
+  LocalWords:  elba elbA ary consed XXXX ac bc kons knil ans plusses 
+  LocalWords:  catamorphism lp eof lis cdr knull kar kdr anamorphism
+  LocalWords:  abcdefg sfrom sto TCL perl slen rv exp initialisation
+  LocalWords:  plen SJ PJ si sj pj IPORT iport patlen DF buf Bevan
+  LocalWords:  Denheyer scsh Paolo Amoroso Arvestad Bawden Dybvig
+  LocalWords:  Bornstein Bothner Egorov Feeley Matthias Felleisen
+  LocalWords:  Flatt ucs Gleckler Goetter Sven Hartrumpf Hilsdale
+  LocalWords:  Kiselyov Bengt Korb Kleberg Kolbly Shriram  bignum
+  LocalWords:  Krishnamurthi Lucier Schilling Sobel Mikael Staldal
+  LocalWords:  Tsyshevsky documentors Jaffer Sperber cltl AE fixnum
+  LocalWords:  CommonLisp HyperSpec Clinger Rees SIGPLAN uniquified
+  LocalWords:  cset EA DrScheme IEC conformant JIS xor diff Posix URL
+  LocalWords:  FFF DIAERESIS abcdefghijklmnopqrstuvwxyz EB EC EF ETH
+  LocalWords:  FA FB FC FD FF Ll AA diaeresis isLowerCase BA CB CC CE
+  LocalWords:  CF DA DC Lt CARON PSILI Lu PROSGEGRAMMENI DASIA VARIA
+  LocalWords:  OXIA PERISPOMENI FAA FAB FAC FAE FAF FBC FFC Lm Lo
+  LocalWords:  abcdefABCDEF Zs Zl Zp OGHAM IDEOGRAPHIC Pc recognised
+  LocalWords:  tokenizers iso Pd Ps Pe Pf AB BB BF Sm Sc Sk AF MACRON
+  LocalWords:  PILCROW soh nul ops Shiro Kawai subform
+-->
diff --git a/scsh/lib/cset-lib.scm b/scsh/lib/cset-lib.scm
new file mode 100644
index 0000000..2effd4b
--- /dev/null
+++ b/scsh/lib/cset-lib.scm
@@ -0,0 +1,804 @@
+;;; SRFI-14 character-sets library				-*- Scheme -*-
+;;;
+;;; - Ported from MIT Scheme runtime by Brian D. Carlstrom.
+;;; - Massively rehacked & extended by Olin Shivers 6/98.
+;;; - Massively redesigned and rehacked 5/2000 during SRFI process.
+;;; At this point, the code bears the following relationship to the
+;;; MIT Scheme code: "This is my grandfather's axe. My father replaced
+;;; the head, and I have replaced the handle." Nonetheless, we preserve
+;;; the MIT Scheme copyright:
+;;;     Copyright (c) 1988-1995 Massachusetts Institute of Technology
+;;; The MIT Scheme license is a "free software" license. See the end of
+;;; this file for the tedious details. 
+
+;;; Exports:
+;;; char-set? char-set= char-set<=
+;;; char-set-hash 
+;;; char-set-cursor char-set-ref char-set-cursor-next end-of-char-set?
+;;; char-set-fold char-set-unfold char-set-unfold!
+;;; char-set-for-each char-set-map
+;;; char-set-copy char-set
+;;;
+;;; list->char-set  string->char-set 
+;;; list->char-set! string->char-set! 
+;;;
+;;; char-set-filter  ucs-range->char-set  ->char-set
+;;; char-set-filter! ucs-range->char-set!
+;;;
+;;; char-set->list char-set->string
+;;;
+;;; char-set-size char-set-count char-set-contains?
+;;; char-set-every char-set-any
+;;;
+;;; char-set-adjoin  char-set-delete 
+;;; char-set-adjoin! char-set-delete!
+;;; 
+
+;;; char-set-complement  char-set-union  char-set-intersection  
+;;; char-set-complement! char-set-union! char-set-intersection! 
+;;;
+;;; char-set-difference  char-set-xor  char-set-diff+intersection
+;;; char-set-difference! char-set-xor! char-set-diff+intersection!
+;;;
+;;; char-set:lower-case		char-set:upper-case	char-set:title-case
+;;; char-set:letter		char-set:digit		char-set:letter+digit
+;;; char-set:graphic		char-set:printing	char-set:whitespace
+;;; char-set:iso-control	char-set:punctuation	char-set:symbol
+;;; char-set:hex-digit		char-set:blank		char-set:ascii
+;;; char-set:empty		char-set:full
+
+;;; Imports
+;;; This code has the following non-R5RS dependencies:
+;;; - ERROR
+;;; - %LATIN1->CHAR %CHAR->LATIN1
+;;; - LET-OPTIONALS* and :OPTIONAL macros for parsing, checking & defaulting
+;;;   optional arguments from rest lists.
+;;; - BITWISE-AND for CHAR-SET-HASH
+;;; - The SRFI-9 DEFINE-RECORD-TYPE record macro
+;;; - A simple CHECK-ARG procedure: 
+;;;   (lambda (pred val caller) (if (not (pred val)) (error val caller)))
+
+;;; This is simple code, not great code. Char sets are represented as 256-char
+;;; strings. If char I is ASCII/Latin-1 0, then it isn't in the set; if char I
+;;; is ASCII/Latin-1 1, then it is in the set.
+;;; - Should be rewritten to use bit strings or byte vecs.
+;;; - Is Latin-1 specific. Would certainly have to be rewritten for Unicode.
+
+;;; See the end of the file for porting and performance-tuning notes.
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+
+(define-record-type :char-set	; Record type for char sets; it has one field.
+  (make-char-set s)		; Constructor taking the field S.
+  char-set?			; Type predicate.
+  (s char-set:s))		; Field S, read with the accessor CHAR-SET:S.
+
+
+(define %string-copy (lambda (str) (substring str 0 (string-length str)))) ; Fresh copy of STR.
+
+;;; Parse, type-check & default a final optional BASE-CS parameter from
+;;; a rest argument. Return a *fresh copy* of the underlying string.
+;;; The default is the empty set. The PROC argument is to help us
+;;; generate informative error exceptions.
+
+(define (%default-base maybe-base proc)
+  ;; MAYBE-BASE is a rest list: either empty or holding exactly one char-set.
+  (cond ((not (pair? maybe-base))               ; No base supplied:
+         (make-string 256 (%latin1->char 0)))   ; start from the empty set.
+        ((not (null? (cdr maybe-base)))
+         (error "Expected final base char set -- too many parameters"
+                proc maybe-base))
+        ((char-set? (car maybe-base))           ; Copy, so the base is not mutated.
+         (%string-copy (char-set:s (car maybe-base))))
+        (else (error "BASE-CS parameter not a char-set" proc (car maybe-base)))))
+
+;;; If CS is really a char-set, do CHAR-SET:S, otw report an error msg on
+;;; behalf of our caller, PROC. This procedure exists basically to provide
+;;; explicit error-checking & reporting.
+
+(define (%char-set:s/check cs proc)
+  (let retry ((obj cs))		; If ERROR returns a value, that value is checked again.
+    (if (not (char-set? obj)) (retry (error "Not a char-set" obj proc))
+        (char-set:s obj))))
+
+
+
+;;; These internal functions hide a lot of the dependency on the
+;;; underlying string representation of char sets. They should be
+;;; inlined if possible.
+
+(define (si s i) (%char->latin1 (string-ref s i)))	; Code stored at S[I].
+(define (si=0? s i) (zero? (si s i)))			; Is char I absent?
+(define (si=1? s i) (not (zero? (si s i))))		; Is char I present?
+(define c0 (%latin1->char 0))				; The "absent" mark.
+(define c1 (%latin1->char 1))				; The "present" mark.
+(define (%set0! s i) (string-set! s i c0))		; Remove char I.
+(define (%set1! s i) (string-set! s i c1))		; Add char I.
+
+;;; These do various "s[i] := s[i] op val" operations -- see 
+;;; %CHAR-SET-ALGEBRA. They are used to implement the various
+;;; set-algebra procedures.
+(define (setv!   s i v) (string-set! s i (%latin1->char v)))		; s[i] := v
+(define (%not!   s i v) (string-set! s i (%latin1->char (- 1 v))))	; s[i] := not v
+(define (%and!   s i v) (cond ((zero? v) (%set0! s i))))		; s[i] := s[i] and v
+(define (%or!    s i v) (cond ((not (zero? v)) (%set1! s i))))		; s[i] := s[i] or v
+(define (%minus! s i v) (cond ((not (zero? v)) (%set0! s i))))		; s[i] := s[i] minus v
+(define (%xor!   s i v) (cond ((not (zero? v)) (setv! s i (- 1 (si s i))))))	; s[i] := s[i] xor v
+
+
+(define (char-set-copy cs)	; Fresh char-set built on a copy of CS's string.
+  (let ((s (%char-set:s/check cs char-set-copy))) (make-char-set (%string-copy s))))
+
+(define (char-set= . rest)
+  ;; True iff every argument equals the first one; true for no arguments.
+  (if (null? rest) #t
+      (let ((s1 (%char-set:s/check (car rest) char-set=)))
+        (let lp ((others (cdr rest)))
+          (cond ((not (pair? others)) #t)
+                ((string=? s1 (%char-set:s/check (car others) char-set=))
+                 (lp (cdr others)))
+                (else #f))))))
+
+(define (char-set<= . rest)
+  ;; True iff each argument set is a subset of the one following it;
+  ;; true for zero or one argument.
+  (if (null? rest) #t
+      (let outer ((s1 (%char-set:s/check (car rest) char-set<=))
+                  (more (cdr rest)))
+        (if (not (pair? more)) #t
+            (let ((s2 (%char-set:s/check (car more) char-set<=)))
+              ;; Fast path: when both are the same string, skip the scan.
+              (let inner ((i (if (eq? s1 s2) -1 255)))
+                (cond ((< i 0) (outer s2 (cdr more)))
+                      ((<= (si s1 i) (si s2 i)) (inner (- i 1)))
+                      (else #f))))))))
+
+;;; Hash
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; Compute (c + 37 c + 37^2 c + ...) modulo BOUND, with sleaze thrown in
+;;; to keep the intermediate values small. (We do the calculation with just
+;;; enough bits to represent BOUND, masking off high bits at each step in
+;;; calculation. If this screws up any important properties of the hash
+;;; function I'd like to hear about it. -Olin)
+;;;
+;;; If you keep BOUND small enough, the intermediate calculations will 
+;;; always be fixnums. How small is dependent on the underlying Scheme system; 
+;;; we use a default BOUND of 2^22 = 4194304, which should hack it in
+;;; Schemes that give you at least 29 signed bits for fixnums. The core 
+;;; calculation that you don't want to overflow is, worst case,
+;;;     (+ 65535 (* 37 (- bound 1)))
+;;; where 65535 is the max character code. Choose the default BOUND to be the
+;;; biggest power of two that won't cause this expression to fixnum overflow, 
+;;; and everything will be copacetic.
+
+(define (char-set-hash cs . maybe-bound)
+  (let* ((requested (:optional maybe-bound 4194304
+                               (lambda (n) (and (integer? n)
+                                                (exact? n)
+                                                (<= 0 n)))))
+         (bound (if (zero? requested) 4194304 requested))	; 0 means default.
+         (s (%char-set:s/check cs char-set-hash))
+         ;; All-ones mask covering BOUND-1. Doubling starts at 2^16, so the
+         ;; mask is never narrower than 16 bits.
+         (mask (do ((m #x10000 (+ m m))) ((>= m bound) (- m 1)))))
+    ;; Fold in the codes of the members, highest code first.
+    (do ((i 255 (- i 1))
+         (ans 0 (if (si=0? s i) ans
+                    (bitwise-and mask (+ (* 37 ans) i)))))
+        ((< i 0) (modulo ans bound)))))
+
+
+(define (char-set-contains? cs char)	; True iff CHAR is a member of CS.
+  (check-arg char? char char-set-contains?) ; For effect only: the simple CHECK-ARG (see Imports) returns no useful value.
+  (si=1? (%char-set:s/check cs char-set-contains?) (%char->latin1 char)))
+
+(define (char-set-size cs)	; Number of characters in CS.
+  (let ((s (%char-set:s/check cs char-set-size)))
+    (do ((i 255 (- i 1))
+         (size 0 (+ size (si s i))))	; Sum the stored codes (0 = absent, 1 = present).
+        ((< i 0) size))))
+
+(define (char-set-count pred cset)
+  ;; Number of members of CSET satisfying PRED; scans codes 255 down to 0.
+  (check-arg procedure? pred char-set-count)
+  (let ((s (%char-set:s/check cset char-set-count)))
+    (do ((i 255 (- i 1))
+         (count 0 (if (and (si=1? s i) (pred (%latin1->char i)))
+                      (+ count 1)
+                      count)))
+        ((< i 0) count))))
+
+
+;;; -- Adjoin & delete
+
+(define (%set-char-set set proc cs chars)
+  ;; Apply SET (e.g. %SET1!) for each char of CHARS to a copy of CS's string.
+  (let ((s (%string-copy (%char-set:s/check cs proc))))
+    (do ((left chars (cdr left))) ((null? left)) (set s (%char->latin1 (car left))))
+    (make-char-set s)))
+
+(define (%set-char-set! set proc cs chars)
+  ;; Apply SET for each char of CHARS to CS's own string; returns CS.
+  (let ((s (%char-set:s/check cs proc)))
+    (do ((left chars (cdr left))) ((null? left)) (set s (%char->latin1 (car left)))))
+  cs)
+
+(define char-set-adjoin		; Fresh set: CS plus CHARS.
+  (lambda (cs . chars) (%set-char-set  %set1! char-set-adjoin cs chars)))
+(define char-set-adjoin!	; Adds CHARS to CS in place; returns CS.
+  (lambda (cs . chars) (%set-char-set! %set1! char-set-adjoin! cs chars)))
+(define char-set-delete		; Fresh set: CS minus CHARS.
+  (lambda (cs . chars) (%set-char-set  %set0! char-set-delete cs chars)))
+(define char-set-delete!	; Removes CHARS from CS in place; returns CS.
+  (lambda (cs . chars) (%set-char-set! %set0! char-set-delete! cs chars)))
+
+
+;;; Cursors
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; Simple implementation. A cursor is an integer index into the
+;;; mark vector, and -1 for the end-of-char-set cursor.
+;;;
+;;; If we represented char sets as a bit set, we could do the following
+;;; trick to pick the lowest bit out of the set: 
+;;;   (count-bits (xor (- cset 1) cset))
+;;; (But first mask out the bits already scanned by the cursor.)
+
+(define (char-set-cursor cset)	; Start one past code 255 and step to the first member.
+  (%char-set-cursor-next cset 256 char-set-cursor))
+  
+(define (end-of-char-set? cursor) (negative? cursor))	; Any negative cursor marks the end.
+
+(define (char-set-ref cset cursor) (%latin1->char cursor))	; CSET is not consulted.
+
+(define (char-set-cursor-next cset cursor)
+  (let ((valid-cursor? (lambda (i) (and (integer? i) (exact? i) (<= 0 i 255)))))
+    (check-arg valid-cursor? cursor char-set-cursor-next)	; Must be an index, not the end cursor.
+    (%char-set-cursor-next cset cursor char-set-cursor-next)))
+
+(define (%char-set-cursor-next cset cursor proc)	; Internal
+  ;; Largest index below CURSOR that is in CSET; for CURSOR >= 0 this is
+  ;; -1 when no such member exists.  A bad CSET is reported as PROC.
+  (let ((s (%char-set:s/check cset proc)))
+    (do ((cur (- cursor 1) (- cur 1)))
+        ((or (< cur 0) (si=1? s cur)) cur))))
+
+
+;;; -- for-each map fold unfold every any
+
+(define (char-set-for-each proc cs)
+  ;; Call PROC on each member of CS, from code 255 down to 0.
+  (check-arg procedure? proc char-set-for-each)
+  (let ((s (%char-set:s/check cs char-set-for-each)))
+    (do ((i 255 (- i 1)))
+        ((< i 0))
+      (if (si=1? s i) (proc (%latin1->char i))))))
+
+(define (char-set-map proc cs)
+  ;; Fresh set containing (PROC c) for every member c of CS.
+  ;; Members are visited from code 255 down to 0.
+  (check-arg procedure? proc char-set-map)
+  (let ((s (%char-set:s/check cs char-set-map))
+        (ans (make-string 256 c0)))
+    (do ((i 255 (- i 1)))
+        ((< i 0) (make-char-set ans))
+      (if (si=1? s i)
+          (%set1! ans (%char->latin1 (proc (%latin1->char i))))))))
+
+(define (char-set-fold kons knil cs)
+  ;; Fold KONS over the members of CS, starting from KNIL; members are
+  ;; visited from code 255 down to 0.
+  (check-arg procedure? kons char-set-fold)
+  (let ((s (%char-set:s/check cs char-set-fold)))
+    (do ((i 255 (- i 1))
+         (ans knil (if (si=0? s i) ans (kons (%latin1->char i) ans))))
+        ((< i 0) ans))))
+
+(define (char-set-every pred cs)
+  (check-arg procedure? pred char-set-every)
+  (let ((s (%char-set:s/check cs char-set-every)))
+    (let lp ((i 255))			; #t unless PRED rejects some member.
+      (cond ((< i 0) #t)
+            ((or (si=0? s i) (pred (%latin1->char i))) (lp (- i 1)))
+            (else #f)))))
+
+(define (char-set-any pred cs)
+  (check-arg procedure? pred char-set-any)
+  (let ((s (%char-set:s/check cs char-set-any)))
+    (let lp ((i 255))			; First true value PRED returns, else #f.
+      (cond ((< i 0) #f)
+            ((and (si=1? s i) (pred (%latin1->char i))))
+            (else (lp (- i 1)))))))
+
+
+(define (%char-set-unfold! proc p f g s seed)
+  ;; Add (F seed) to string S for successive seeds until (P seed) is true.
+  (check-arg procedure? p proc)
+  (check-arg procedure? f proc)
+  (check-arg procedure? g proc)
+  (do ((seed seed (g seed)))			; Step to (G SEED).
+      ((p seed))				; P says we are done.
+    (%set1! s (%char->latin1 (f seed)))))	; Add (F SEED) to set.
+
+(define (char-set-unfold p f g seed . maybe-base)	; Unfold into a fresh set.
+  (let ((bs (%default-base maybe-base char-set-unfold)))	; Copy of the base, or empty.
+    (%char-set-unfold! char-set-unfold p f g bs seed)
+    (make-char-set bs)))
+
+(define (char-set-unfold! p f g seed base-cset)
+  ;; Linear-update variant: adds into BASE-CSET's own string and returns it.
+  (let ((bs (%char-set:s/check base-cset char-set-unfold!)))
+    (%char-set-unfold! char-set-unfold! p f g bs seed))
+  base-cset)
+
+
+
+;;; list <--> char-set
+
+(define (%list->char-set! chars s)	; Mark every char of the list CHARS in string S.
+  (for-each (lambda (char) (%set1! s (%char->latin1 char)))
+	    chars))
+
+(define (char-set . chars)		; Fresh set holding exactly CHARS.
+  (let ((s (make-string 256 c0)))	; Start with every char absent.
+    (%list->char-set! chars s)
+    (make-char-set s)))
+
+(define (list->char-set chars . maybe-base)	; Fresh set: optional base plus CHARS.
+  (let ((bs (%default-base maybe-base list->char-set)))	; Copy of the base, or empty.
+    (%list->char-set! chars bs)
+    (make-char-set bs)))
+
+(define (list->char-set! chars base-cs)	; Linear update: marks CHARS in BASE-CS itself.
+  (let ((bs (%char-set:s/check base-cs list->char-set!))) (%list->char-set! chars bs))
+  base-cs)
+
+
+(define (char-set->list cs)
+  ;; Scanning from code 255 down while consing onto the front yields a
+  ;; list in increasing char-code order.
+  (let ((s (%char-set:s/check cs char-set->list)))
+    (do ((i 255 (- i 1))
+         (ans '() (if (si=0? s i) ans (cons (%latin1->char i) ans))))
+        ((< i 0) ans))))
+
+
+
+;;; string <--> char-set
+
+(define (%string->char-set! str bs proc)	; Mark each char of STR in string BS.
+  (check-arg string? str proc)
+  (let lp ((i (- (string-length str) 1)))
+    (cond ((>= i 0) (%set1! bs (%char->latin1 (string-ref str i)))
+                    (lp (- i 1))))))
+
+(define (string->char-set str . maybe-base)	; Fresh set: optional base plus STR's chars.
+  (let ((bs (%default-base maybe-base string->char-set)))	; Copy of the base, or empty.
+    (%string->char-set! str bs string->char-set)
+    (make-char-set bs)))
+
+(define (string->char-set! str base-cs)
+  ;; Linear update: marks the chars of STR in BASE-CS itself and returns it.
+  (let ((bs (%char-set:s/check base-cs string->char-set!))) (%string->char-set! str bs string->char-set!))
+  base-cs)
+
+
+(define (char-set->string cs)
+  ;; The result lists the members highest char code first: the scan runs
+  ;; from 255 down while the output index J counts up from 0.
+  (let* ((s (%char-set:s/check cs char-set->string))
+         (ans (make-string (char-set-size cs))))
+    (do ((i 255 (- i 1))
+         (j 0 (if (si=0? s i) j
+                  (begin (string-set! ans j (%latin1->char i)) (+ j 1)))))
+        ((< i 0) ans))))
+
+
+;;; -- UCS-range -> char-set
+
+(define (%ucs-range->char-set! lower upper error? bs proc)
+  (check-arg (lambda (x) (and (integer? x) (exact? x) (<= 0 x))) lower proc)
+  (check-arg (lambda (x) (and (integer? x) (exact? x) (<= lower x))) upper proc)
+  ;; A non-empty range reaching past code 256 is an error only if ERROR? is set.
+  (if (and (< lower upper) (< 256 upper) error?)
+      (error "Requested UCS range contains unavailable characters -- this implementation only supports Latin-1"
+	     proc lower upper))
+  ;; Mark codes LOWER through (min UPPER 256) - 1, highest first.
+  (do ((i (- (min upper 256) 1) (- i 1)))
+      ((< i lower)) (%set1! bs i)))
+
+(define (ucs-range->char-set lower upper . rest)	; REST is [error? [base-cs]].
+  (let-optionals* rest ((error? #f) rest)		; ERROR? defaults to #f; REST keeps what remains.
+    (let ((bs (%default-base rest ucs-range->char-set)))
+      (%ucs-range->char-set! lower upper error? bs ucs-range->char-set)
+      (make-char-set bs))))
+
+(define (ucs-range->char-set! lower upper error? base-cs)
+  ;; Linear-update variant: marks the range in BASE-CS itself and returns it.
+  ;; Errors are reported on behalf of this procedure, not UCS-RANGE->CHAR-SET.
+  (%ucs-range->char-set! lower upper error? (%char-set:s/check base-cs ucs-range->char-set!) ucs-range->char-set!)
+  base-cs)
+
+
+;;; -- predicate -> char-set
+
+(define (%char-set-filter! pred ds bs proc)
+  ;; Mark in BS every member of the domain string DS that satisfies PRED.
+  (check-arg procedure? pred proc)
+  (do ((i 255 (- i 1)))
+      ((< i 0))
+    (if (and (si=1? ds i) (pred (%latin1->char i)))
+        (%set1! bs i))))
+
+(define (char-set-filter predicate domain . maybe-base)
+  ;; Fresh set: the optional base set plus the members of DOMAIN that
+  ;; satisfy PREDICATE.  A bad DOMAIN is reported as CHAR-SET-FILTER.
+  (let* ((bs (%default-base maybe-base char-set-filter))
+         (ds (%char-set:s/check domain char-set-filter)))
+    (%char-set-filter! predicate ds bs char-set-filter)
+    (make-char-set bs)))
+
+(define (char-set-filter! predicate domain base-cs)
+  ;; Linear update: marks the selected members in BASE-CS itself and returns it.
+  (let ((ds (%char-set:s/check domain char-set-filter!))
+        (bs (%char-set:s/check base-cs char-set-filter!)))
+    (%char-set-filter! predicate ds bs char-set-filter!))
+  base-cs)
+
+
+;;; {string, char, char-set} -> char-set
+
+(define (->char-set x)		; Coerce a char-set, string or char to a char-set.
+  (if (char-set? x) x		; A char-set is returned as is, not copied.
+      (if (string? x) (string->char-set x)
+          (if (char? x) (char-set x)
+              (error "->char-set: Not a charset, string or char." x)))))
+
+
+
+;;; Set algebra
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; The exported ! procs are "linear update" -- allowed, but not required, to
+;;; side-effect their first argument when computing their result. In other
+;;; words, you must use them as if they were completely functional, just like
+;;; their non-! counterparts, and you must additionally ensure that their
+;;; first arguments are "dead" at the point of call. In return, we promise a
+;;; more efficient result, plus allowing you to always assume char-sets are
+;;; unchangeable values.
+
+;;; Apply P to each index and its char code in S: (P I VAL).
+;;; Used by the set-algebra ops.
+
+(define (%string-iter p s)
+  ;; Visit the indices of S from the last down to 0, calling (P index code).
+  (do ((i (- (string-length s) 1) (- i 1)))
+      ((< i 0))
+    (p i (%char->latin1 (string-ref s i)))))
+
+;;; String S represents some initial char-set. (OP s i val) does some
+;;; kind of s[i] := s[i] op val update. Do
+;;;     S := S OP CSETi
+;;; for all the char-sets in the list CSETS. The n-ary set-algebra ops
+;;; all use this internal proc.
+
+(define (%char-set-algebra s csets op proc)
+  ;; For each set in CSETS, call (OP s i code) for i from 255 down to 0.
+  (for-each (lambda (cset)
+              (let ((s2 (%char-set:s/check cset proc)))
+                (do ((i 255 (- i 1)))
+                    ((< i 0))
+                  (op s i (si s2 i)))))
+            csets))
+
+
+;;; -- Complement
+
+(define (char-set-complement cs)
+  (let ((s (%char-set:s/check cs char-set-complement))
+        (ans (make-string 256)))	; No fill char: every index of S is written below.
+    (do ((i (- (string-length s) 1) (- i 1))) ((< i 0) (make-char-set ans))
+      (%not! ans i (si s i)))))
+
+(define (char-set-complement! cset)	; Flips every mark of CSET in place; returns CSET.
+  (let ((s (%char-set:s/check cset char-set-complement!)))
+    (do ((i (- (string-length s) 1) (- i 1))) ((< i 0)) (%not! s i (si s i))))
+  cset)
+
+
+;;; -- Union
+
+(define (char-set-union! cset1 . csets)	; Updates CSET1's string in place; returns CSET1.
+  (let ((s1 (%char-set:s/check cset1 char-set-union!)))
+    (%char-set-algebra s1 csets %or! char-set-union!))
+  cset1)
+
+(define (char-set-union . csets)
+  ;; Union of all the arguments; with none, a copy of CHAR-SET:EMPTY.
+  (cond ((null? csets) (char-set-copy char-set:empty))
+        (else (let ((s (%string-copy (%char-set:s/check (car csets) char-set-union))))
+                (%char-set-algebra s (cdr csets) %or! char-set-union)
+                (make-char-set s)))))
+
+
+;;; -- Intersection
+
+(define (char-set-intersection! cset1 . csets)	; Updates CSET1's string in place; returns CSET1.
+  (let ((s1 (%char-set:s/check cset1 char-set-intersection!)))
+    (%char-set-algebra s1 csets %and! char-set-intersection!))
+  cset1)
+
+(define (char-set-intersection . csets)
+  ;; Intersection of all the arguments; with none, a copy of CHAR-SET:FULL.
+  (cond ((null? csets) (char-set-copy char-set:full))
+        (else (let ((s (%string-copy (%char-set:s/check (car csets) char-set-intersection))))
+                (%char-set-algebra s (cdr csets) %and! char-set-intersection)
+                (make-char-set s)))))
+
+
+;;; -- Difference
+
+(define (char-set-difference! cset1 . csets)	; Updates CSET1's string in place; returns CSET1.
+  (let ((s1 (%char-set:s/check cset1 char-set-difference!)))
+    (%char-set-algebra s1 csets %minus! char-set-difference!))
+  cset1)
+
+(define (char-set-difference cs1 . csets)
+  ;; CS1 minus every set in CSETS; with no CSETS, simply a copy of CS1.
+  (cond ((null? csets) (char-set-copy cs1))
+        (else (let ((s (%string-copy (%char-set:s/check cs1 char-set-difference))))
+                (%char-set-algebra s csets %minus! char-set-difference)
+                (make-char-set s)))))
+
+
+;;; -- Xor
+
+(define (char-set-xor! cset1 . csets)	; Updates CSET1's string in place; returns CSET1.
+  (let ((s1 (%char-set:s/check cset1 char-set-xor!)))
+    (%char-set-algebra s1 csets %xor! char-set-xor!))
+  cset1)
+
+(define (char-set-xor . csets)
+  ;; Exclusive-or of all the arguments; with none, a copy of CHAR-SET:EMPTY.
+  (cond ((null? csets) (char-set-copy char-set:empty))
+        (else (let ((s (%string-copy (%char-set:s/check (car csets) char-set-xor))))
+                (%char-set-algebra s (cdr csets) %xor! char-set-xor)
+                (make-char-set s)))))
+
+
+;;; -- Difference & intersection
+
+(define (%char-set-diff+intersection! diff int csets proc)
+  ;; Move every char found in one of CSETS from string DIFF to string INT.
+  (for-each (lambda (cs)
+              (let ((s (%char-set:s/check cs proc)))
+                (do ((i (- (string-length s) 1) (- i 1)))
+                    ((< i 0))
+                  (cond ((and (not (zero? (si s i))) (si=1? diff i))
+                         (%set0! diff i) (%set1! int i))))))
+            csets))
+
+(define (char-set-diff+intersection! cs1 cs2 . csets)	; CS1 := difference, CS2 := intersection.
+  (let ((s1 (%char-set:s/check cs1 char-set-diff+intersection!))
+        (s2 (%char-set:s/check cs2 char-set-diff+intersection!)))
+    (%string-iter (lambda (i v)				; V is the code at S1[I].
+                    (cond ((zero? v) (%set0! s2 i))	; Not in CS1, so not shared.
+                          ((si=1? s2 i) (%set0! s1 i))))	; Shared: drop from the difference.
+                  s1)
+    (%char-set-diff+intersection! s1 s2 csets char-set-diff+intersection!))
+  (values cs1 cs2))
+
+(define (char-set-diff+intersection cs1 . csets)	; Returns two fresh sets: difference, intersection.
+  (let ((diff (%string-copy (%char-set:s/check cs1 char-set-diff+intersection))) ; Library's own copier.
+	(int  (make-string 256 c0)))			; Intersection starts empty.
+    (%char-set-diff+intersection! diff int csets char-set-diff+intersection)
+    (values (make-char-set diff) (make-char-set int))))
+
+
+;;;; System character sets
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; These definitions are for Latin-1.
+;;;
+;;; If your Scheme implementation allows you to mark the underlying strings
+;;; as immutable, you should do so -- it would be very, very bad if a client's
+;;; buggy code corrupted these constants.
+
+(define char-set:empty (char-set))				; Set with no members.
+(define char-set:full (char-set-complement char-set:empty))	; Complement of the empty set.
+
+(define char-set:lower-case
+  ;; Codes #x61-#x7A (a-z), #xDF-#xF6 and #xF8-#xFF, plus #xB5.
+  (char-set-adjoin! (ucs-range->char-set! #xf8 #x100 #t
+                      (ucs-range->char-set! #xdf #xf7 #t (ucs-range->char-set #x61 #x7B)))
+                    (%latin1->char #xb5)))
+
+(define char-set:upper-case
+  ;; Codes #x41-#x5A (A-Z) plus the Latin-1 upper-case chars #xC0-#xD6 and #xD8-#xDE.
+  (let* ((base  (ucs-range->char-set #x41 #x5B))
+         (base+ (ucs-range->char-set! #xc0 #xd7 #t base)))
+    (ucs-range->char-set! #xd8 #xdf #t base+)))
+
+(define char-set:title-case char-set:empty)	; The same object as CHAR-SET:EMPTY, not a copy.
+
+(define char-set:letter
+  ;; Upper- and lower-case letters plus the two ordinal indicators.
+  (char-set-adjoin! (char-set-union char-set:upper-case char-set:lower-case)
+                    (%latin1->char #xaa)	; FEMININE ORDINAL INDICATOR
+                    (%latin1->char #xba)))	; MASCULINE ORDINAL INDICATOR
+
+(define char-set:digit     (string->char-set "0123456789"))			; Decimal digits.
+(define char-set:hex-digit (string->char-set "0123456789abcdefABCDEF"))	; Digits plus a-f, A-F.
+
+(define char-set:letter+digit	; Fresh union of the letter and digit sets.
+  (char-set-union char-set:letter char-set:digit))
+
+(define char-set:punctuation	; ASCII punctuation plus six Latin-1 marks.
+  (let ((ascii (string->char-set "!\"#%&'()*,-./:;?@[\\]_{}"))
+	(latin-1-chars (map %latin1->char '(#xA1 ; INVERTED EXCLAMATION MARK
+					    #xAB ; LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
+					    #xAD ; SOFT HYPHEN
+					    #xB7 ; MIDDLE DOT
+					    #xBB ; RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
+					    #xBF)))) ; INVERTED QUESTION MARK
+    (list->char-set! latin-1-chars ascii)))
+
+(define char-set:symbol		; ASCII symbol chars plus the Latin-1 codes listed below.
+  (let ((ascii (string->char-set "$+<=>^`|~"))
+	(latin-1-chars (map %latin1->char '(#x00A2 ; CENT SIGN
+					    #x00A3 ; POUND SIGN
+					    #x00A4 ; CURRENCY SIGN
+					    #x00A5 ; YEN SIGN
+					    #x00A6 ; BROKEN BAR
+					    #x00A7 ; SECTION SIGN
+					    #x00A8 ; DIAERESIS
+					    #x00A9 ; COPYRIGHT SIGN
+					    #x00AC ; NOT SIGN
+					    #x00AE ; REGISTERED SIGN
+					    #x00AF ; MACRON
+					    #x00B0 ; DEGREE SIGN
+					    #x00B1 ; PLUS-MINUS SIGN
+					    #x00B4 ; ACUTE ACCENT
+					    #x00B6 ; PILCROW SIGN
+					    #x00B8 ; CEDILLA
+					    #x00D7 ; MULTIPLICATION SIGN
+					    #x00F7)))) ; DIVISION SIGN
+    (list->char-set! latin-1-chars ascii)))
+  
+
+(define char-set:graphic	; Letters, digits, punctuation and symbols.
+  (char-set-union char-set:letter+digit char-set:punctuation char-set:symbol))
+
+(define char-set:whitespace
+  (list->char-set (map %latin1->char '(#x09 ; HORIZONTAL TABULATION
+				       #x0A ; LINE FEED		
+				       #x0B ; VERTICAL TABULATION
+				       #x0C ; FORM FEED
+				       #x0D ; CARRIAGE RETURN
+				       #x20 ; SPACE
+				       #xA0)))) ; NO-BREAK SPACE
+
+(define char-set:printing (char-set-union char-set:whitespace char-set:graphic)) ; Whitespace plus graphic chars.
+
+(define char-set:blank
+  (char-set (%latin1->char #x09)	; HORIZONTAL TABULATION
+            (%latin1->char #x20)	; SPACE
+            (%latin1->char #xA0)))	; NO-BREAK SPACE
+
+
+(define char-set:iso-control	; Codes #x00-#x1F and #x7F-#x9F (the upper bounds are exclusive).
+  (ucs-range->char-set! #x7F #xA0 #t (ucs-range->char-set 0 32)))
+
+(define char-set:ascii (ucs-range->char-set 0 128))	; Codes 0 through 127.
+
+
+;;; Porting & performance-tuning notes
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; See the section at the beginning of this file on external dependencies.
+;;;
+;;; First and foremost, rewrite this code to use bit vectors of some sort.
+;;; This will give big speedup and memory savings.
+;;;
+;;; - LET-OPTIONALS* macro.
+;;; This is only used once. You can rewrite the use, port the hairy macro
+;;; definition (which is implemented using a Clinger-Rees low-level
+;;; explicit-renaming macro system), or port the simple, high-level
+;;; definition, which is less efficient.
+;;;
+;;; - :OPTIONAL macro
+;;; Very simply defined using an R5RS high-level macro.
+;;;
+;;; Implementations that can arrange for the base char sets to be immutable
+;;; should do so. (E.g., Scheme 48 allows one to mark a string as immutable,
+;;; which can be used to protect the underlying strings.) It would be very,
+;;; very bad if a client's buggy code corrupted these constants.
+;;;
+;;; There is a fair amount of argument checking. This is, strictly speaking,
+;;; unnecessary -- the actual body of the procedures will blow up if an
+;;; illegal value is passed in. However, the error message will not be as good
+;;; as if the error were caught at the "higher level." Also, a very, very
+;;; smart Scheme compiler may be able to exploit having the type checks done
+;;; early, so that the actual body of the procedures can assume proper values.
+;;; This isn't likely; this kind of compiler technology isn't common any
+;;; longer.
+;;; 
+;;; The overhead of optional-argument parsing is irritating. The optional
+;;; arguments must be consed into a rest list on entry, and then parsed out.
+;;; Function call should be a matter of a few register moves and a jump; it
+;;; should not involve heap allocation! Your Scheme system may have a superior
+;;; non-R5RS optional-argument system that can eliminate this overhead. If so,
+;;; then this is a prime candidate for optimising these procedures,
+;;; *especially* the many optional BASE-CS parameters.
+;;;
+;;; Note that optional arguments are also a barrier to procedure integration.
+;;; If your Scheme system permits you to specify alternate entry points
+;;; for a call when the number of optional arguments is known in a manner
+;;; that enables inlining/integration, this can provide performance 
+;;; improvements.
+;;;
+;;; There is enough *explicit* error checking that *all* internal operations
+;;; should *never* produce a type or index-range error. Period. Feel like
+;;; living dangerously? *Big* performance win to be had by replacing string
+;;; and record-field accessors and setters with unsafe equivalents in the
+;;; code. Similarly, fixnum-specific operators can speed up the arithmetic
+;;; done on the index values in the inner loops. The only arguments that are
+;;; not completely error checked are
+;;;   - character lists (complete checking requires time proportional to the
+;;;     length of the list)
+;;;   - procedure arguments, such as char->char maps & predicates.
+;;;     There is no way to check the range & domain of procedures in Scheme.
+;;; Procedures that take these parameters cannot fully check their
+;;; arguments. But all other types to all other procedures are fully
+;;; checked.
+;;;
+;;; This does open up the alternate possibility of simply *removing* these 
+;;; checks, and letting the safe primitives raise the errors. On a dumb
+;;; Scheme system, this would provide speed (by eliminating the redundant
+;;; error checks) at the cost of error-message clarity.
+;;;
+;;; In an interpreted Scheme, some of these procedures, or the internal
+;;; routines with % prefixes, are excellent candidates for being rewritten
+;;; in C.
+;;;
+;;; It would also be nice to have the ability to mark some of these
+;;; routines as candidates for inlining/integration.
+;;; 
+;;; See the comments preceding the hash function code for notes on tuning
+;;; the default bound so that the code never overflows your implementation's
+;;; fixnum size into bignum calculation.
+;;;
+;;; All the %-prefixed routines in this source code are written
+;;; to be called internally to this library. They do *not* perform
+;;; friendly error checks on the inputs; they assume everything is
+;;; proper. They also do not take optional arguments. These two properties
+;;; save calling overhead and enable procedure integration -- but they
+;;; are not appropriate for exported routines.
+
+;;; Copyright notice
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; Copyright (c) 1988-1995 Massachusetts Institute of Technology
+;;; 
+;;; This material was developed by the Scheme project at the Massachusetts
+;;; Institute of Technology, Department of Electrical Engineering and
+;;; Computer Science.  Permission to copy and modify this software, to
+;;; redistribute either the original software or a modified version, and
+;;; to use this software for any purpose is granted, subject to the
+;;; following restrictions and understandings.
+;;; 
+;;; 1. Any copy made of this software must include this copyright notice
+;;; in full.
+;;; 
+;;; 2. Users of this software agree to make their best efforts (a) to
+;;; return to the MIT Scheme project any improvements or extensions that
+;;; they make, so that these may be included in future releases; and (b)
+;;; to inform MIT of noteworthy uses of this software.
+;;; 
+;;; 3. All materials developed as a consequence of the use of this
+;;; software shall duly acknowledge such use, in accordance with the usual
+;;; standards of acknowledging credit in academic research.
+;;; 
+;;; 4. MIT has made no warrantee or representation that the operation of
+;;; this software will be error-free, and MIT is under no obligation to
+;;; provide any services, by way of maintenance, update, or otherwise.
+;;; 
+;;; 5. In conjunction with products arising from the use of this material,
+;;; there shall be no use of the name of the Massachusetts Institute of
+;;; Technology nor of any adaptation thereof in any advertising,
+;;; promotional, or sales literature without prior written consent from
+;;; MIT in each case.
diff --git a/scsh/lib/cset-lib.txt b/scsh/lib/cset-lib.txt
new file mode 100644
index 0000000..75a77d5
--- /dev/null
+++ b/scsh/lib/cset-lib.txt
@@ -0,0 +1,1271 @@
+The SRFI 14 character-set library				-*- outline -*-
+Olin Shivers
+98/11/8
+Last Update: 2000/7/4
+
+Emacs should display this document in outline mode. Say c-h m for
+instructions on how to move through it by sections (e.g., c-c c-n, c-c c-p).
+
+* Table of contents
+-------------------
+Abstract
+Variable index
+Rationale
+  Linear-update operations
+  Extra-SRFI recommendations
+Specification
+  General procedures
+  Iterating over character sets
+  Creating character sets
+  Querying character sets
+  Character-set algebra
+  Standard character sets
+Unicode, Latin-1 and ASCII definitions of the standard character sets
+Reference implementation
+Acknowledgements
+References & links
+Copyright
+
+
+-------------------------------------------------------------------------------
+* Abstract
+----------
+
+The ability to efficiently represent and manipulate sets of characters is an
+unglamorous but very useful capability for text-processing code -- one that
+tends to pop up in the definitions of other libraries.  Hence it is useful to
+specify a general substrate for this functionality early.  This SRFI defines a
+general library that provides this functionality. 
+
+It is accompanied by a reference implementation for the spec. The reference
+implementation is fairly efficient, straightforwardly portable, and has a
+"free software" copyright. The implementation is tuned for "small" 7 or 8
+bit character types, such as ASCII or Latin-1; the data structures and
+algorithms would have to be altered for larger 16 or 32 bit character types
+such as Unicode -- however, the specs have been carefully designed with these
+larger character types in mind.
+
+Several forthcoming SRFIs can be defined in terms of this one:
+    - string library
+    - delimited input procedures (e.g., READ-LINE)
+    - regular expressions
+
+
+-------------------------------------------------------------------------------
+* Variable index
+-----------------
+Here is the complete set of bindings -- procedural and otherwise --
+exported by this library. In a Scheme system that has a module or package 
+system, these procedures should be contained in a module named "char-set-lib".
+
+char-set? char-set= char-set<=
+
+char-set-hash
+
+char-set-cursor char-set-ref char-set-cursor-next end-of-char-set?
+char-set-fold char-set-unfold char-set-unfold!
+char-set-for-each char-set-map
+
+char-set-copy char-set
+
+list->char-set  string->char-set 
+list->char-set! string->char-set!
+    
+char-set-filter  ucs-range->char-set 
+char-set-filter! ucs-range->char-set!
+
+->char-set
+
+char-set->list  char-set->string
+
+char-set-size char-set-count char-set-contains?
+
+char-set-every char-set-any
+
+char-set-adjoin  char-set-delete 
+char-set-adjoin! char-set-delete!
+
+char-set-complement  char-set-union  char-set-intersection  
+char-set-complement! char-set-union! char-set-intersection! 
+
+char-set-difference  char-set-xor  char-set-diff+intersection
+char-set-difference! char-set-xor! char-set-diff+intersection!
+
+char-set:lower-case	char-set:upper-case	char-set:title-case
+char-set:letter		char-set:digit		char-set:letter+digit
+char-set:graphic	char-set:printing	char-set:whitespace
+char-set:iso-control	char-set:punctuation	char-set:symbol
+char-set:hex-digit	char-set:blank		char-set:ascii
+char-set:empty		char-set:full
+
+
+-------------------------------------------------------------------------------
+* Rationale
+-----------
+
+The ability to efficiently manipulate sets of characters is quite
+useful for text-processing code. Encapsulating this functionality in
+a general, efficiently implemented library can assist all such code.
+This library defines a new data structure to represent these sets, called
+a "char-set." The char-set type is distinct from all other types.
+
+This library is designed to be portable across implementations that use
+different character types and representations, especially ASCII, Latin-1
+and Unicode. Some effort has been made to preserve compatibility with Java
+in the Unicode case (see the definition of CHAR-SET:WHITESPACE for the
+single real deviation).
+
+
+** Linear-update operations
+===========================
+The procedures of this SRFI, by default, are "pure functional" -- they do not
+alter their parameters. However, this SRFI defines a set of "linear-update"
+procedures which have a hybrid pure-functional/side-effecting semantics: they
+are allowed, but not required, to side-effect one of their parameters in order
+to construct their result. An implementation may legally implement these
+procedures as pure, side-effect-free functions, or it may implement them using
+side effects, depending upon the details of what is the most efficient or
+simple to implement in terms of the underlying representation.
+
+The linear-update routines all have names ending with "!".
+
+Clients of these procedures *may not* rely upon these procedures working by
+side effect. For example, this is not guaranteed to work:
+    
+    (let* ((cs1 (char-set #\a #\b #\c))      ; cs1 = {a,b,c}.
+           (cs2 (char-set-adjoin! cs1 #\d))) ; Add d to {a,b,c}.
+      cs1) ; Could be either {a,b,c} or {a,b,c,d}.
+
+However, this is well-defined:
+
+    (let ((cs (char-set #\a #\b #\c)))
+      (char-set-adjoin! cs #\d)) ; Add d to {a,b,c}.
+
+So clients of these procedures write in a functional style, but must
+additionally be sure that, when the procedure is called, there are no other
+live pointers to the potentially-modified character set (hence the term
+"linear update").
+
+There are two benefits to this convention:
+  - Implementations are free to provide the most efficient possible
+    implementation, either functional or side-effecting.
+  - Programmers may nonetheless continue to assume that character sets
+    are purely functional data structures: they may be reliably shared
+    without needing to be copied, uniquified, and so forth.
+
+Note that pure functional representations are the right thing for
+ASCII- or Latin-1-based Scheme implementations, since a char-set can
+be represented in an ASCII Scheme with 4 32-bit words. Pure set-algebra
+operations on such a representation are very fast and efficient. Programmers
+who code using linear-update operations are guaranteed the system will
+provide the best implementation across multiple platforms.
+
+In practice, these procedures are most useful for efficiently constructing
+character sets in a side-effecting manner, in some limited local context, 
+before passing the character set outside the local construction scope to be
+used in a functional manner.
+
+Scheme provides no assistance in checking the linearity of the potentially
+side-effected parameters passed to these functions --- there's no linear
+type checker or run-time mechanism for detecting violations. (But
+sophisticated programming environments, such as DrScheme, might help.)
+
+** Extra-SRFI recommendations
+=============================
+Users are cautioned that the R5RS predicates 
+    CHAR-ALPHABETIC? 
+    CHAR-NUMERIC? 
+    CHAR-WHITESPACE? 
+    CHAR-UPPER-CASE? 
+    CHAR-LOWER-CASE? 
+may or may not be in agreement with the SRFI 14 base character sets
+    CHAR-SET:LETTER
+    CHAR-SET:DIGIT
+    CHAR-SET:WHITESPACE
+    CHAR-SET:UPPER-CASE
+    CHAR-SET:LOWER-CASE
+Implementors are strongly encouraged to bring these predicates into
+agreement with the base character sets of this SRFI; not to do so risks
+major confusion.
+
+
+-------------------------------------------------------------------------------
+* Specification
+---------------
+
+In the following procedure specifications:
+    - A CS parameter is a character set.
+
+    - An S parameter is a string.
+
+    - A CHAR parameter is a character.
+
+    - A CHAR-LIST parameter is a list of characters.
+
+    - A PRED parameter is a unary character predicate procedure, returning 
+      a true/false value when applied to a character.
+
+    - An OBJ parameter may be any value at all.
+
+Passing values to procedures with these parameters that do not satisfy these
+types is an error.
+
+Unless otherwise noted in the specification of a procedure, procedures
+always return character sets that are distinct (from the point of view
+of the linear-update operations) from the parameter character sets. For
+example, CHAR-SET-ADJOIN is guaranteed to provide a fresh character set,
+even if it is not given any character parameters.
+
+Parameters given in square brackets are optional. Unless otherwise noted in
+the text describing the procedure, any prefix of these optional parameters may
+be supplied, from zero arguments to the full list. When a procedure returns
+multiple values, this is shown by listing the return values in square
+brackets, as well. So, for example, the procedure with signature
+
+    halts? f [x init-store] -> [boolean integer]
+
+would take one (F), two (F, X) or three (F, X, INIT-STORE) input parameters,
+and return two values, a boolean and an integer.
+
+A parameter followed by "..." means zero-or-more elements. So the procedure
+with the signature
+    sum-squares x ... -> number
+takes zero or more arguments (X ...), while the procedure with signature
+    spell-check doc dict1 dict2 ... -> string-list
+takes two required parameters (DOC and DICT1) and zero or more
+optional parameters (DICT2 ...).
+
+
+** General procedures
+=====================
+char-set? obj -> boolean
+    Is the object OBJ a character set?
+
+char-set= cs1 ... -> boolean
+    Are the character sets equal?
+
+    Boundary cases:
+      (char-set=) => true
+      (char-set= cs) => true
+
+    Rationale: transitive binary relations are generally extended to n-ary
+    relations in Scheme, which enables clearer, more concise code to be
+    written. While the zero-argument and one-argument cases will almost
+    certainly not arise in first-order uses of such relations, they may well
+    arise in higher-order cases or macro-generated code. E.g., consider
+        (apply char-set= cset-list)
+    This is well-defined if the list is empty or a singleton list. Hence
+    we extend these relations to any number of arguments. Implementors
+    have reported actual uses of n-ary relations in higher-order cases
+    allowing for fewer than two arguments. The way of Scheme is to handle the
+    general case; we provide the fully general extension.
+
+    A counter-argument to this extension is that R5RS's transitive binary
+    arithmetic relations (=, <, etc.) require at least two arguments, hence
+    this decision is a break with the prior convention -- although it is
+    at least one that is backwards-compatible.
+
+char-set<= cs1 ... -> boolean
+    Returns true if every character set CSi is a subset of character set CSi+1.
+
+    Boundary cases:
+      (char-set<=) => true
+      (char-set<= cs) => true
+
+    Rationale: See CHAR-SET= for discussion of zero- and one-argument
+    applications. Consider testing a list of char-sets for monotonicity
+    with (APPLY CHAR-SET<= CSET-LIST).
+
+char-set-hash cs [bound] -> integer
+    Compute a hash value for the character set CS. BOUND is a non-negative
+    exact integer specifying the range of the hash function. A positive
+    value restricts the return value to the range [0,BOUND).
+
+    If BOUND is either zero or not given, the implementation may use
+    an implementation-specific default value, chosen to be as large as
+    is efficiently practical. For instance, the default range might be chosen
+    for a given implementation to map all character sets into the range of
+    integers that can be represented with a single machine word.
+
+    Invariant:
+       (char-set= cs1 cs2) => (= (char-set-hash cs1 b) (char-set-hash cs2 b))
+
+    A legal but nonetheless discouraged implementation:
+        (define (char-set-hash cs . maybe-bound) 1)
+
+    Rationale: allowing the user to specify an explicit bound simplifies user
+    code by removing the mod operation that typically accompanies every hash
+    computation, and also may allow the implementation of the hash function to
+    exploit a reduced range to efficiently compute the hash value. E.g., for
+    small bounds, the hash function may be computed in a fashion such that
+    intermediate values never overflow into bignum integers, allowing the
+    implementor to provide a fixnum-specific "fast path" for computing the
+    common cases very rapidly.
+
+** Iterating over character sets
+===================================
+
+char-set-cursor cset -> cursor
+char-set-ref cset cursor -> char
+char-set-cursor-next cset cursor -> cursor
+end-of-char-set? cursor -> boolean
+    Cursors are a low-level facility for iterating over the characters in a
+    set. A cursor is a value that indexes a character in a char set.
+    CHAR-SET-CURSOR produces a new cursor for a given char set. The set
+    element indexed by the cursor is fetched with CHAR-SET-REF. A cursor index
+    is incremented with CHAR-SET-CURSOR-NEXT; in this way, code can step
+    through every character in a char set. Stepping a cursor "past the end" of
+    a char set produces a cursor that answers true to END-OF-CHAR-SET?. It is
+    an error to pass such a cursor to CHAR-SET-REF or to CHAR-SET-CURSOR-NEXT.
+
+    A cursor value may not be used in conjunction with a different character
+    set; if it is passed to CHAR-SET-REF or CHAR-SET-CURSOR-NEXT with
+    a character set other than the one used to create it, the results and
+    effects are undefined.
+
+    Cursor values are *not* necessarily distinct from other types. They may be
+    integers, linked lists, records, procedures or other values. This license
+    is granted to allow cursors to be very "lightweight" values suitable for
+    tight iteration, even in fairly simple implementations.
+
+    Note that these primitives are necessary to export an iteration facility
+    for char sets to loop macros.
+
+    Example:
+
+	(define cs (char-set #\G #\a #\T #\e #\c #\h))
+
+	;; Collect elts of CS into a list.
+	(let lp ((cur (char-set-cursor cs)) (ans '()))
+	  (if (end-of-char-set? cur) ans
+	      (lp (char-set-cursor-next cs cur)
+		  (cons (char-set-ref cs cur) ans))))
+	  => (#\G #\T #\a #\c #\e #\h)
+
+	;; Equivalently, using a list unfold (from SRFI 1):
+	(unfold-right end-of-char-set? 
+	              (curry char-set-ref cs)
+		      (curry char-set-cursor-next cs)
+		      (char-set-cursor cs))
+	  => (#\G #\T #\a #\c #\e #\h)
+
+    Rationale: Note that the cursor API's four functions "fit" the functional
+    protocol used by the unfolders provided by the list, string and char-set
+    SRFIs (see the example above). By way of contrast, here is a simpler,
+    two-function API that was rejected for failing this criterion. Besides
+    CHAR-SET-CURSOR, it provided a single function that mapped a cursor and a
+    character set to two values, the indexed character and the next cursor. If
+    the cursor had exhausted the character set, then this function returned
+    false instead of the character value, and another end-of-char-set cursor.
+    In this way, the other three functions of the current API were combined
+    together.
+
+char-set-fold kons knil cs -> object
+    This is the fundamental iterator for character sets.  Applies the function
+    KONS across the character set CS using initial state value KNIL.  That is,
+    if CS is the empty set, the procedure returns KNIL.  Otherwise, some
+    element c of CS is chosen; let cs' be the remaining, unchosen characters.
+    The procedure returns
+	(char-set-fold KONS (KONS c KNIL) cs')
+
+    Examples:
+        ;; CHAR-SET->LIST
+	(lambda (cs) (char-set-fold cons '() cs))
+
+        ;; CHAR-SET-SIZE
+        (lambda (cs) (char-set-fold (lambda (c i) (+ i 1)) 0 cs))
+
+        ;; How many vowels in the char set?
+        (lambda (cs) 
+          (char-set-fold (lambda (c i) (if (vowel? c) (+ i 1) i))
+                         0 cs))
+
+char-set-unfold  p f g seed [base-cs] -> char-set
+char-set-unfold! p f g seed base-cs   -> char-set
+    This is a fundamental constructor for char-sets. 
+    - G is used to generate a series of "seed" values from the initial seed:
+	SEED, (G SEED), (G^2 SEED), (G^3 SEED), ...
+    - P tells us when to stop -- when it returns true when applied to one 
+      of these seed values.
+    - F maps each seed value to a character. These characters are added
+      to the base character set BASE-CS to form the result; BASE-CS defaults to
+      the empty set. CHAR-SET-UNFOLD! adds the characters to BASE-CS in a 
+      linear-update -- it is allowed, but not required, to side-effect
+      and use BASE-CS's storage to construct the result.
+
+    More precisely, the following definitions hold, ignoring the
+    optional-argument issues:
+
+    (define (char-set-unfold p f g seed base-cs) 
+      (char-set-unfold! p f g seed (char-set-copy base-cs)))
+
+    (define (char-set-unfold! p f g seed base-cs)
+      (let lp ((seed seed) (cs base-cs))
+	(if (p seed) cs					; P says we are done.
+	    (lp (g seed)				; Loop on (G SEED).
+		(char-set-adjoin! cs (f seed))))))	; Add (F SEED) to set.
+
+    (Note that the actual implementation may be more efficient.)
+
+    Examples:
+                         
+    (port->char-set p) = (char-set-unfold eof-object? values
+                                          (lambda (x) (read-char p))
+                                          (read-char p))
+
+    (list->char-set lis) = (char-set-unfold null? car cdr lis)
+
+char-set-for-each proc cs -> unspecified
+    Apply procedure PROC to each character in the character set CS.
+    Note that the order in which PROC is applied to the characters in the
+    set is not specified, and may even change from one procedure application
+    to another.
+
+    Nothing at all is specified about the value returned by this procedure; it
+    is not even required to be consistent from call to call. It is simply
+    required to be a value (or values) that may be passed to a command
+    continuation, e.g. as the value of an expression appearing as a
+    non-terminal subform of a BEGIN expression. Note that in R5RS, this
+    restricts the procedure to returning a single value; non-R5RS systems may
+    not even provide this restriction.
+
+char-set-map proc cs -> char-set
+    PROC is a char->char procedure. Apply it to all the characters in
+    the char-set CS, and collect the results into a new character set.
+
+    Essentially lifts PROC from a char->char procedure to a char-set ->
+    char-set procedure.
+
+    Example:
+      (char-set-map char-downcase cset)
+
+
+** Creating character sets
+==========================
+char-set-copy cs -> char-set
+    Returns a copy of the character set CS.  "Copy" means that if either the
+    input parameter or the result value of this procedure is passed to one of
+    the linear-update procedures described below, the other character set is
+    guaranteed not to be altered.  
+
+    A system that provides pure-functional implementations of the
+    linear-operator suite could implement this procedure as the identity
+    function -- so copies are *not* guaranteed to be distinct by EQ?.
+
+char-set char1 ... -> char-set
+    Return a character set containing the given characters.
+
+list->char-set  char-list [base-cs] -> char-set
+list->char-set! char-list  base-cs  -> char-set
+    Return a character set containing the characters in the list of
+    characters CHAR-LIST.
+
+    If character set BASE-CS is provided, the characters from CHAR-LIST
+    are added to it. LIST->CHAR-SET! is allowed, but not required,
+    to side-effect and reuse the storage in BASE-CS; LIST->CHAR-SET
+    produces a fresh character set.
+
+string->char-set  s [base-cs] -> char-set
+string->char-set! s  base-cs  -> char-set
+    Return a character set containing the characters in the string S.
+
+    If character set BASE-CS is provided, the characters from S are added to
+    it. STRING->CHAR-SET! is allowed, but not required, to side-effect and
+    reuse the storage in BASE-CS; STRING->CHAR-SET produces a fresh character
+    set.
+
+char-set-filter  pred cs [base-cs] -> char-set
+char-set-filter! pred cs  base-cs  -> char-set
+    Returns a character set containing every character c in CS
+    such that (PRED c) returns true.
+
+    If character set BASE-CS is provided, the characters specified by PRED
+    are added to it. CHAR-SET-FILTER! is allowed, but not required,
+    to side-effect and reuse the storage in BASE-CS; CHAR-SET-FILTER
+    produces a fresh character set.
+
+    An implementation may not save away a reference to PRED and invoke it
+    after CHAR-SET-FILTER or CHAR-SET-FILTER! returns -- that is, "lazy,"
+    on-demand implementations are not allowed, as PRED may have external
+    dependencies on mutable data or have other side-effects.
+
+    Rationale: This procedure provides a means of converting a character
+    predicate into its equivalent character set; the CS parameter allows the
+    programmer to bound the predicate's domain. Programmers should be aware
+    that filtering a character set such as CHAR-SET:FULL could be a very
+    expensive operation in an implementation that provided an extremely large
+    character type, such as 32-bit Unicode. An earlier draft of this library
+    provided a simple PREDICATE->CHAR-SET procedure, which was rejected in
+    favor of CHAR-SET-FILTER for this reason.
+
+ucs-range->char-set  lower upper [error? base-cs] -> char-set
+ucs-range->char-set! lower upper  error? base-cs  -> char-set
+    LOWER and UPPER are exact non-negative integers; LOWER <= UPPER.
+
+    Returns a character set containing every character whose ISO/IEC 10646
+    UCS-4 code lies in the half-open range [LOWER,UPPER).
+
+    - If the requested range includes unassigned UCS values, these are
+      silently ignored (the current UCS specification has "holes" in the
+      space of assigned codes).
+    
+    - If the requested range includes "private" or "user space" codes, these
+      are handled in an implementation-specific manner; however, a UCS- or
+      Unicode-based Scheme implementation should pass them through
+      transparently.
+    
+    - If any code from the requested range specifies a valid, assigned
+      UCS character that has no corresponding representative in the
+      implementation's character type, then (1) an error is raised if ERROR?
+      is true, and (2) the code is ignored if ERROR? is false (the default).
+      This might happen, for example, if the implementation uses ASCII
+      characters, and the requested range includes non-ASCII characters.
+
+    If character set BASE-CS is provided, the characters specified by the
+    range are added to it. UCS-RANGE->CHAR-SET! is allowed, but not required,
+    to side-effect and reuse the storage in BASE-CS; UCS-RANGE->CHAR-SET
+    produces a fresh character set.
+
+    Note that ASCII codes are a subset of the Latin-1 codes, which are in turn
+    a subset of the 16-bit Unicode codes, which are themselves a subset of the
+    32-bit UCS-4 codes. We commit to a specific encoding in this routine,
+    regardless of the underlying representation of characters, so that client
+    code using this library will be portable. I.e., a conformant Scheme
+    implementation may use EBCDIC or SHIFT-JIS to encode characters; it must
+    simply map the UCS characters from the given range into the native
+    representation when possible, and report errors when not possible.
+
+->char-set x -> char-set
+    Coerces X into a char-set. X may be a string, character or char-set. A
+    string is converted to the set of its constituent characters; a character
+    is converted to a singleton set; a char-set is returned as-is. This
+    procedure is intended for use by other procedures that want to provide
+    "user-friendly," wide-spectrum interfaces to their clients.
+
+
+** Querying character sets
+==========================
+char-set-size cs -> integer
+    Returns the number of elements in character set CS.
+
+char-set-count pred cs -> integer
+    Apply PRED to the chars of character set CS, and return the number
+    of chars that caused the predicate to return true.
+
+char-set->list cs -> character-list
+    This procedure returns a list of the members of character set CS.
+    The order in which CS's characters appear in the list is not defined,
+    and may be different from one call to another.
+
+char-set->string cs -> string
+    This procedure returns a string containing the members of character set CS.
+    The order in which CS's characters appear in the string is not defined,
+    and may be different from one call to another.
+
+char-set-contains? cs char -> boolean
+    This procedure tests CHAR for membership in character set CS.
+
+    The MIT Scheme character-set package called this procedure
+    CHAR-SET-MEMBER?, but the argument order isn't consistent with the name.
+
+char-set-every pred cs -> boolean
+char-set-any   pred cs -> object
+    The CHAR-SET-EVERY procedure returns true if predicate PRED
+    returns true of every character in the character set CS.
+
+    Likewise, CHAR-SET-ANY applies PRED to every character in
+    character set CS, and returns the first true value it finds.
+    If no character produces a true value, it returns false.
+
+    The order in which these procedures sequence through the elements of
+    CS is not specified.
+
+    Note that if you need to determine the actual character on which a 
+    predicate returns true, use CHAR-SET-ANY and arrange for the predicate 
+    to return the character parameter as its true value, e.g.
+        (char-set-any (lambda (c) (and (char-upper-case? c) c)) 
+                      cs)
+
+
+** Character-set algebra
+========================
+char-set-adjoin cs char1 ... -> char-set
+char-set-delete cs char1 ... -> char-set
+    Add/delete the CHARi characters to/from character set CS.
+
+char-set-adjoin! cs char1 ... -> char-set
+char-set-delete! cs char1 ... -> char-set
+    Linear-update variants. These procedures are allowed, but not
+    required, to side-effect their first parameter.
+
+char-set-complement cs                 -> char-set
+char-set-union cs1 ...                 -> char-set
+char-set-intersection cs1 ...          -> char-set
+char-set-difference cs1 cs2 ...        -> char-set
+char-set-xor cs1 ...                   -> char-set
+char-set-diff+intersection cs1 cs2 ... -> [char-set char-set]
+    These procedures implement set complement, union, intersection,
+    difference, and exclusive-or for character sets. The union, intersection
+    and xor operations are n-ary. The difference function is also n-ary, 
+    associates to the left (that is, it computes the difference between
+    its first argument and the union of all the other arguments),
+    and requires at least one argument.
+
+    Boundary cases:
+      (char-set-union) => char-set:empty
+      (char-set-intersection) => char-set:full
+      (char-set-xor) => char-set:empty
+      (char-set-difference cs) => cs
+
+    CHAR-SET-DIFF+INTERSECTION returns both the difference and the
+    intersection of the arguments -- it partitions its first parameter.
+    It is equivalent to 
+        (values (char-set-difference cs1 cs2 ...)
+	        (char-set-intersection cs1 (char-set-union cs2 ...)))
+    but can be implemented more efficiently.
+
+    Programmers should be aware that CHAR-SET-COMPLEMENT could potentially
+    be a very expensive operation in Scheme implementations that provide
+    a very large character type, such as 32-bit Unicode. If this is a
+    possibility, sets can be complemented with respect to a smaller
+    universe using CHAR-SET-DIFFERENCE.
+
+char-set-complement! cs		            -> char-set
+char-set-union! cs1 cs2 ...  	            -> char-set
+char-set-intersection! cs1 cs2 ...          -> char-set
+char-set-difference! cs1 cs2 ...            -> char-set
+char-set-xor! cs1 cs2 ...                   -> char-set
+char-set-diff+intersection! cs1 cs2 cs3 ... -> [char-set char-set]
+    These are linear-update variants of the set-algebra functions.
+    They are allowed, but not required, to side-effect their first 
+    (required) parameter.
+
+    
+    CHAR-SET-DIFF+INTERSECTION! is allowed to side-effect both of
+    its two required parameters, CS1 and CS2.
+
+** Standard character sets
+==========================
+Several character sets are predefined for convenience:
+    char-set:lower-case		Lower-case letters
+    char-set:upper-case		Upper-case letters
+    char-set:title-case		Title-case letters
+    char-set:letter		Letters
+    char-set:digit		Digits
+    char-set:letter+digit	Letters and digits
+    char-set:graphic		Printing characters except spaces
+    char-set:printing		Printing characters including spaces
+    char-set:whitespace		Whitespace characters 
+    char-set:iso-control	The ISO control characters 
+    char-set:punctuation	Punctuation characters
+    char-set:symbol		Symbol characters
+    char-set:hex-digit		A hexadecimal digit: 0-9, A-F, a-f 
+    char-set:blank		Blank characters -- horizontal whitespace
+    char-set:ascii		All characters in the ASCII set. 
+    char-set:empty		Empty set 
+    char-set:full		All characters 
+
+Note that there may be characters in CHAR-SET:LETTER that are neither upper nor
+lower case---this might occur in implementations that use a character type
+richer than ASCII, such as Unicode. A "graphic character" is one that would
+put ink on your page. While the exact composition of these sets may vary
+depending upon the character type provided by the underlying Scheme system,
+here are the definitions for some of the sets in an ASCII implementation:
+
+    char-set:lower-case		a-z 
+    char-set:upper-case		A-Z 
+    char-set:letter		A-Z and a-z 
+    char-set:digit		0123456789
+    char-set:punctuation	!"#%&'()*,-./:;?@[\]_{}
+    char-set:symbol		$+<=>^`|~
+    char-set:whitespace		Space, newline, tab, form feed, 
+				vertical tab, carriage return 
+    char-set:blank		Space and tab 
+    char-set:graphic		letter + digit + punctuation + symbol
+    char-set:printing		graphic + whitespace
+    char-set:iso-control	ASCII 0-31 and 127 
+
+Note that the existence of the CHAR-SET:ASCII set implies that the underlying
+character set is required to be at least as rich as ASCII (including
+ASCII's control characters).
+
+Rationale: The name choices reflect a shift from the older
+"alphabetic/numeric" terms found in R5RS and Posix to newer,
+Unicode-influenced "letter/digit" lexemes.
+
+-------------------------------------------------------------------------------
+* Unicode, Latin-1 and ASCII definitions of the standard character sets
+-----------------------------------------------------------------------
+
+In Unicode Scheme implementations, the base character sets are compatible with
+Java's Unicode specifications. For ASCII or Latin-1, we simply restrict the
+Unicode set specifications to their first 128 or 256 codes, respectively.
+Scheme implementations that are not based on ASCII, Latin-1 or Unicode should
+attempt to preserve the sense or spirit of these definitions.
+
+The following descriptions frequently make reference to the "Unicode character
+database." This is a file, available at URL
+    ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.txt
+Each line contains a description of a Unicode character. The first
+semicolon-delimited field of the line gives the hex value of the character's
+code; the second field gives the name of the character, and the third field
+gives a two-letter category. Other fields give simple 1-1 case-mappings for
+the character and other information; see
+    ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.html
+for further description of the file's format. Note in particular the
+two-letter category specified in the third field, which is referenced
+frequently in the descriptions below.
+
+** char-set:lower-case
+======================
+For Unicode, we follow Java's specification: a character is lowercase if
+    + it is not in the range [U+2000,U+2FFF], and
+    + the Unicode attribute table does not give a lowercase mapping for it, and
+    + at least one of the following is true:
+        - the Unicode attribute table gives a mapping to uppercase 
+	  for the character, or
+	- the name for the character in the Unicode attribute table contains
+	  the words "SMALL LETTER" or "SMALL LIGATURE".
+
+The lower-case ASCII characters are 
+    abcdefghijklmnopqrstuvwxyz
+Latin-1 adds another 33 lower-case characters to the ASCII set:
+    00B5 MICRO SIGN
+    00DF LATIN SMALL LETTER SHARP S
+    00E0 LATIN SMALL LETTER A WITH GRAVE
+    00E1 LATIN SMALL LETTER A WITH ACUTE
+    00E2 LATIN SMALL LETTER A WITH CIRCUMFLEX
+    00E3 LATIN SMALL LETTER A WITH TILDE
+    00E4 LATIN SMALL LETTER A WITH DIAERESIS
+    00E5 LATIN SMALL LETTER A WITH RING ABOVE
+    00E6 LATIN SMALL LETTER AE
+    00E7 LATIN SMALL LETTER C WITH CEDILLA
+    00E8 LATIN SMALL LETTER E WITH GRAVE
+    00E9 LATIN SMALL LETTER E WITH ACUTE
+    00EA LATIN SMALL LETTER E WITH CIRCUMFLEX
+    00EB LATIN SMALL LETTER E WITH DIAERESIS
+    00EC LATIN SMALL LETTER I WITH GRAVE
+    00ED LATIN SMALL LETTER I WITH ACUTE
+    00EE LATIN SMALL LETTER I WITH CIRCUMFLEX
+    00EF LATIN SMALL LETTER I WITH DIAERESIS
+    00F0 LATIN SMALL LETTER ETH
+    00F1 LATIN SMALL LETTER N WITH TILDE
+    00F2 LATIN SMALL LETTER O WITH GRAVE
+    00F3 LATIN SMALL LETTER O WITH ACUTE
+    00F4 LATIN SMALL LETTER O WITH CIRCUMFLEX
+    00F5 LATIN SMALL LETTER O WITH TILDE
+    00F6 LATIN SMALL LETTER O WITH DIAERESIS
+    00F8 LATIN SMALL LETTER O WITH STROKE
+    00F9 LATIN SMALL LETTER U WITH GRAVE
+    00FA LATIN SMALL LETTER U WITH ACUTE
+    00FB LATIN SMALL LETTER U WITH CIRCUMFLEX
+    00FC LATIN SMALL LETTER U WITH DIAERESIS
+    00FD LATIN SMALL LETTER Y WITH ACUTE
+    00FE LATIN SMALL LETTER THORN
+    00FF LATIN SMALL LETTER Y WITH DIAERESIS
+Note that three of these have no corresponding Latin-1 upper-case character:
+    00B5 MICRO SIGN
+    00DF LATIN SMALL LETTER SHARP S
+    00FF LATIN SMALL LETTER Y WITH DIAERESIS
+(The compatibility micro character uppercases to the non-Latin-1 Greek capital
+mu; the German sharp s character uppercases to the pair of characters "SS,"
+and the capital y-with-diaeresis is non-Latin-1.)
+
+(Note that the Java spec for lowercase characters given at
+    http://java.sun.com/docs/books/jls/html/javalang.doc4.html#14345
+is inconsistent. U+00B5 MICRO SIGN fulfills the requirements for a lower-case
+character (as of Unicode 3.0), but is not given in the numeric list of
+lower-case character codes.)
+
+(Note that the Java spec for isLowerCase() given at
+    http://java.sun.com/products/jdk/1.2/docs/api/java/lang/Character.html#isLowerCase(char)
+gives three mutually inconsistent definitions of "lower case." The first is
+the definition used in this SRFI. The following text says "A character is
+considered to be lowercase if and only if it is specified to be lowercase by
+the Unicode 2.0 standard (category Ll in the Unicode specification data
+file)." The former spec excludes U+00AA FEMININE ORDINAL INDICATOR and
+U+00BA MASCULINE ORDINAL INDICATOR; the latter spec includes them. Finally,
+the spec enumerates a list of characters in the Latin-1 subset; this list
+excludes U+00B5 MICRO SIGN, which is included in both of the previous specs.) 
+
+
+** char-set:upper-case
+======================
+For Unicode, we follow Java's specification: a character is uppercase if
+    + it is not in the range [U+2000,U+2FFF], and
+    + the Unicode attribute table does not give an uppercase mapping for it
+      (this excludes titlecase characters), and
+    + at least one of the following is true:
+        - the Unicode attribute table gives a mapping to lowercase 
+	  for the character, or
+	- the name for the character in the Unicode attribute table contains
+	  the words "CAPITAL LETTER" or "CAPITAL LIGATURE".
+
+The upper-case ASCII characters are 
+    ABCDEFGHIJKLMNOPQRSTUVWXYZ
+Latin-1 adds another 30 upper-case characters to the ASCII set:
+    00C0 LATIN CAPITAL LETTER A WITH GRAVE
+    00C1 LATIN CAPITAL LETTER A WITH ACUTE
+    00C2 LATIN CAPITAL LETTER A WITH CIRCUMFLEX
+    00C3 LATIN CAPITAL LETTER A WITH TILDE
+    00C4 LATIN CAPITAL LETTER A WITH DIAERESIS
+    00C5 LATIN CAPITAL LETTER A WITH RING ABOVE
+    00C6 LATIN CAPITAL LETTER AE
+    00C7 LATIN CAPITAL LETTER C WITH CEDILLA
+    00C8 LATIN CAPITAL LETTER E WITH GRAVE
+    00C9 LATIN CAPITAL LETTER E WITH ACUTE
+    00CA LATIN CAPITAL LETTER E WITH CIRCUMFLEX
+    00CB LATIN CAPITAL LETTER E WITH DIAERESIS
+    00CC LATIN CAPITAL LETTER I WITH GRAVE
+    00CD LATIN CAPITAL LETTER I WITH ACUTE
+    00CE LATIN CAPITAL LETTER I WITH CIRCUMFLEX
+    00CF LATIN CAPITAL LETTER I WITH DIAERESIS
+    00D0 LATIN CAPITAL LETTER ETH
+    00D1 LATIN CAPITAL LETTER N WITH TILDE
+    00D2 LATIN CAPITAL LETTER O WITH GRAVE
+    00D3 LATIN CAPITAL LETTER O WITH ACUTE
+    00D4 LATIN CAPITAL LETTER O WITH CIRCUMFLEX
+    00D5 LATIN CAPITAL LETTER O WITH TILDE
+    00D6 LATIN CAPITAL LETTER O WITH DIAERESIS
+    00D8 LATIN CAPITAL LETTER O WITH STROKE
+    00D9 LATIN CAPITAL LETTER U WITH GRAVE
+    00DA LATIN CAPITAL LETTER U WITH ACUTE
+    00DB LATIN CAPITAL LETTER U WITH CIRCUMFLEX
+    00DC LATIN CAPITAL LETTER U WITH DIAERESIS
+    00DD LATIN CAPITAL LETTER Y WITH ACUTE
+    00DE LATIN CAPITAL LETTER THORN
+
+
+** char-set:title-case
+======================
+In Unicode, a character is titlecase if it has the category Lt in
+the character attribute database. There are very few of these characters;
+here is the entire 31-character list as of Unicode 3.0:
+
+    01C5 LATIN CAPITAL LETTER D WITH SMALL LETTER Z WITH CARON
+    01C8 LATIN CAPITAL LETTER L WITH SMALL LETTER J
+    01CB LATIN CAPITAL LETTER N WITH SMALL LETTER J
+    01F2 LATIN CAPITAL LETTER D WITH SMALL LETTER Z
+    1F88 GREEK CAPITAL LETTER ALPHA WITH PSILI AND PROSGEGRAMMENI
+    1F89 GREEK CAPITAL LETTER ALPHA WITH DASIA AND PROSGEGRAMMENI
+    1F8A GREEK CAPITAL LETTER ALPHA WITH PSILI AND VARIA AND PROSGEGRAMMENI
+    1F8B GREEK CAPITAL LETTER ALPHA WITH DASIA AND VARIA AND PROSGEGRAMMENI
+    1F8C GREEK CAPITAL LETTER ALPHA WITH PSILI AND OXIA AND PROSGEGRAMMENI
+    1F8D GREEK CAPITAL LETTER ALPHA WITH DASIA AND OXIA AND PROSGEGRAMMENI
+    1F8E GREEK CAPITAL LETTER ALPHA WITH PSILI AND PERISPOMENI AND PROSGEGRAMMENI
+    1F8F GREEK CAPITAL LETTER ALPHA WITH DASIA AND PERISPOMENI AND PROSGEGRAMMENI
+    1F98 GREEK CAPITAL LETTER ETA WITH PSILI AND PROSGEGRAMMENI
+    1F99 GREEK CAPITAL LETTER ETA WITH DASIA AND PROSGEGRAMMENI
+    1F9A GREEK CAPITAL LETTER ETA WITH PSILI AND VARIA AND PROSGEGRAMMENI
+    1F9B GREEK CAPITAL LETTER ETA WITH DASIA AND VARIA AND PROSGEGRAMMENI
+    1F9C GREEK CAPITAL LETTER ETA WITH PSILI AND OXIA AND PROSGEGRAMMENI
+    1F9D GREEK CAPITAL LETTER ETA WITH DASIA AND OXIA AND PROSGEGRAMMENI
+    1F9E GREEK CAPITAL LETTER ETA WITH PSILI AND PERISPOMENI AND PROSGEGRAMMENI
+    1F9F GREEK CAPITAL LETTER ETA WITH DASIA AND PERISPOMENI AND PROSGEGRAMMENI
+    1FA8 GREEK CAPITAL LETTER OMEGA WITH PSILI AND PROSGEGRAMMENI
+    1FA9 GREEK CAPITAL LETTER OMEGA WITH DASIA AND PROSGEGRAMMENI
+    1FAA GREEK CAPITAL LETTER OMEGA WITH PSILI AND VARIA AND PROSGEGRAMMENI
+    1FAB GREEK CAPITAL LETTER OMEGA WITH DASIA AND VARIA AND PROSGEGRAMMENI
+    1FAC GREEK CAPITAL LETTER OMEGA WITH PSILI AND OXIA AND PROSGEGRAMMENI
+    1FAD GREEK CAPITAL LETTER OMEGA WITH DASIA AND OXIA AND PROSGEGRAMMENI
+    1FAE GREEK CAPITAL LETTER OMEGA WITH PSILI AND PERISPOMENI AND PROSGEGRAMMENI
+    1FAF GREEK CAPITAL LETTER OMEGA WITH DASIA AND PERISPOMENI AND PROSGEGRAMMENI
+    1FBC GREEK CAPITAL LETTER ALPHA WITH PROSGEGRAMMENI
+    1FCC GREEK CAPITAL LETTER ETA WITH PROSGEGRAMMENI
+    1FFC GREEK CAPITAL LETTER OMEGA WITH PROSGEGRAMMENI
+
+There are no ASCII or Latin-1 titlecase characters.
+
+
+** char-set:letter
+==================
+In Unicode, a letter is any character with one of the letter categories
+(Lu, Ll, Lt, Lm, Lo) in the Unicode character database. 
+
+There are 52 ASCII letters
+    abcdefghijklmnopqrstuvwxyz
+    ABCDEFGHIJKLMNOPQRSTUVWXYZ
+
+There are 117 Latin-1 letters. These are the 115 characters that are
+members of the Latin-1 CHAR-SET:LOWER-CASE and CHAR-SET:UPPER-CASE sets, 
+plus
+    00AA FEMININE ORDINAL INDICATOR
+    00BA MASCULINE ORDINAL INDICATOR
+(These two letters are considered lower-case by Unicode, but not by
+Java or SRFI 14.)
+
+** char-set:digit
+=================
+In Unicode, a character is a digit if it has the category Nd in
+the character attribute database. In Latin-1 and ASCII, the only
+such characters are 0123456789. In Unicode, there are other digit
+characters in other code blocks, such as Gujarati digits and Tibetan
+digits.
+
+
+** char-set:hex-digit
+=====================
+The only hex digits are 0123456789abcdefABCDEF.
+
+
+** char-set:letter+digit
+========================
+The union of CHAR-SET:LETTER and CHAR-SET:DIGIT.
+
+
+** char-set:graphic	
+===================
+A graphic character is one that would put ink on paper. The ASCII and Latin-1
+graphic characters are the members of
+    CHAR-SET:LETTER
+    CHAR-SET:DIGIT
+    CHAR-SET:PUNCTUATION
+    CHAR-SET:SYMBOL
+
+
+** char-set:printing	
+====================
+A printing character is one that would occupy space when printed, i.e.,
+a graphic character or a space character. CHAR-SET:PRINTING is the union
+of CHAR-SET:WHITESPACE and CHAR-SET:GRAPHIC.
+
+
+** char-set:whitespace	
+======================
+In Unicode, a whitespace character is either
+  - a character with one of the space, line, or paragraph separator categories
+    (Zs, Zl or Zp) of the Unicode character database.
+  - U+0009 Horizontal tabulation (\t control-I)
+  - U+000A Line feed (\n control-J)
+  - U+000B Vertical tabulation (\v control-K)
+  - U+000C Form feed (\f control-L)
+  - U+000D Carriage return (\r control-M)
+
+There are 24 whitespace characters in Unicode 3.0:
+    0009 HORIZONTAL TABULATION	\t control-I
+    000A LINE FEED		\n control-J
+    000B VERTICAL TABULATION	\v control-K
+    000C FORM FEED		\f control-L
+    000D CARRIAGE RETURN	\r control-M
+    0020 SPACE			Zs
+    00A0 NO-BREAK SPACE		Zs
+    1680 OGHAM SPACE MARK	Zs
+    2000 EN QUAD		Zs
+    2001 EM QUAD		Zs
+    2002 EN SPACE		Zs
+    2003 EM SPACE		Zs
+    2004 THREE-PER-EM SPACE	Zs
+    2005 FOUR-PER-EM SPACE	Zs
+    2006 SIX-PER-EM SPACE	Zs
+    2007 FIGURE SPACE		Zs
+    2008 PUNCTUATION SPACE	Zs
+    2009 THIN SPACE		Zs
+    200A HAIR SPACE		Zs
+    200B ZERO WIDTH SPACE	Zs
+    2028 LINE SEPARATOR		Zl
+    2029 PARAGRAPH SEPARATOR	Zp
+    202F NARROW NO-BREAK SPACE	Zs
+    3000 IDEOGRAPHIC SPACE	Zs
+
+The ASCII whitespace characters are the first six characters in the above list
+-- line feed, horizontal tabulation, vertical tabulation, form feed, carriage
+return, and space. These are also exactly the characters recognised by the
+Posix isspace() procedure. Latin-1 adds the no-break space.
+
+Note: Java's isWhitespace() method is incompatible, including
+    001C FILE SEPARATOR   (control-\)
+    001D GROUP SEPARATOR  (control-])
+    001E RECORD SEPARATOR (control-^)
+    001F UNIT SEPARATOR   (control-_)
+and excluding
+    00A0 NO-BREAK SPACE
+
+Java's excluding the no-break space means that tokenizers can simply break
+character streams at "whitespace" boundaries. However, the exclusion introduces
+exceptions in other places, e.g. CHAR-SET:PRINTING is no longer simply the
+union of CHAR-SET:GRAPHIC and CHAR-SET:WHITESPACE.
+
+
+** char-set:iso-control	
+=======================
+The ISO control characters are the Unicode/Latin-1 characters in the ranges
+[U+0000,U+001F] and [U+007F,U+009F].
+
+ASCII restricts this set to the characters in the range [U+0000,U+001F] 
+plus the character U+007F.
+
+Note that Unicode defines other control characters which do not belong to this
+set (hence the qualifying prefix "iso-" in the name). This restriction is
+compatible with the Java isISOControl() method.
+
+
+** char-set:punctuation	
+=======================
+In Unicode, a punctuation character is any character that has one of the
+punctuation categories in the Unicode character database (Pc, Pd, Ps,
+Pe, Pi, Pf, or Po.)
+
+ASCII has 23 punctuation characters:
+    !"#%&'()*,-./:;?@[\]_{}
+
+Latin-1 adds six more:
+    00A1 INVERTED EXCLAMATION MARK
+    00AB LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
+    00AD SOFT HYPHEN
+    00B7 MIDDLE DOT
+    00BB RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
+    00BF INVERTED QUESTION MARK
+
+Note that the nine ASCII characters $+<=>^`|~ are *not* punctuation.
+They are "symbols."
+
+
+** char-set:symbol
+==================
+In Unicode, a symbol is any character that has one of the symbol categories
+in the Unicode character database (Sm, Sc, Sk, or So). There are nine ASCII 
+symbol characters:
+    $+<=>^`|~
+
+Latin-1 adds 18 more:
+    00A2 CENT SIGN
+    00A3 POUND SIGN
+    00A4 CURRENCY SIGN
+    00A5 YEN SIGN
+    00A6 BROKEN BAR
+    00A7 SECTION SIGN
+    00A8 DIAERESIS
+    00A9 COPYRIGHT SIGN
+    00AC NOT SIGN
+    00AE REGISTERED SIGN
+    00AF MACRON
+    00B0 DEGREE SIGN
+    00B1 PLUS-MINUS SIGN
+    00B4 ACUTE ACCENT
+    00B6 PILCROW SIGN
+    00B8 CEDILLA
+    00D7 MULTIPLICATION SIGN
+    00F7 DIVISION SIGN
+
+
+** char-set:blank	
+=================
+Blank chars are horizontal whitespace. In Unicode, a blank character is either
+  - a character with the space separator category (Zs) in the Unicode 
+    character database.
+  - U+0009 Horizontal tabulation (\t control-I)
+
+There are eighteen blank characters in Unicode 3.0:
+    0009 HORIZONTAL TABULATION	\t control-I
+    0020 SPACE			Zs
+    00A0 NO-BREAK SPACE		Zs
+    1680 OGHAM SPACE MARK	Zs
+    2000 EN QUAD		Zs
+    2001 EM QUAD		Zs
+    2002 EN SPACE		Zs
+    2003 EM SPACE		Zs
+    2004 THREE-PER-EM SPACE	Zs
+    2005 FOUR-PER-EM SPACE	Zs
+    2006 SIX-PER-EM SPACE	Zs
+    2007 FIGURE SPACE		Zs
+    2008 PUNCTUATION SPACE	Zs
+    2009 THIN SPACE		Zs
+    200A HAIR SPACE		Zs
+    200B ZERO WIDTH SPACE	Zs
+    202F NARROW NO-BREAK SPACE	Zs
+    3000 IDEOGRAPHIC SPACE	Zs
+
+The ASCII blank characters are the first two characters above --
+horizontal tab and space. Latin-1 adds the no-break space.
+
+Java doesn't have the concept of "blank" characters, so there are no
+compatibility issues.
+
+
+-------------------------------------------------------------------------------
+* Reference implementation
+--------------------------
+
+This SRFI comes with a reference implementation. It resides at:
+    http://srfi.schemers.org/srfi-14/srfi-14.scm
+I have placed this source on the Net with an unencumbered, "open" copyright.
+Some of the code in the reference implementation bears a distant family
+relation to the MIT Scheme implementation, and being derived from that code,
+is covered by the MIT Scheme copyright (which is a generic BSD-style
+open-source copyright -- see the source file for details). The remainder of
+the code was written by myself for scsh or for this SRFI; I have placed this
+code under the scsh copyright, which is also a generic BSD-style open-source
+copyright.
+
+The code is written for portability and should be simple to port to
+any Scheme. It has only the following deviations from R4RS, clearly
+discussed in the comments:
+  - an ERROR procedure;
+  - the R5RS VALUES procedure for producing multiple return values;
+  - a simple CHECK-ARG procedure for argument checking;
+  - LET-OPTIONALS* and :OPTIONAL macros for parsing, checking & defaulting
+    optional arguments from rest lists;
+  - The SRFI-9 DEFINE-RECORD-TYPE form;
+  - BITWISE-AND for the hash function;
+  - %LATIN1->CHAR & %CHAR->LATIN1.
+
+The library is written for clarity and well-commented; the current source is
+about 375 lines of source code and 375 lines of comments and white space.
+It is also written for efficiency. Fast paths are provided for common cases.
+
+This is not to say that the implementation can't be tuned up for
+a specific Scheme implementation. There are notes in comments addressing
+ways implementors can tune the reference implementation for performance.
+
+In short, I've written the reference implementation to make it as painless
+as possible for an implementor -- or a regular programmer -- to adopt this
+library and get good results with it.
+
+The code uses a rather simple-minded, inefficient representation for
+ASCII/Latin-1 char-sets -- a 256-character string. The character whose code is
+I is in the set if S[I] = ASCII 1 (soh, or ^a); not in the set if S[I] = ASCII
+0 (nul). A much faster and denser representation would be 16 or 32 bytes worth
+of bit string. A portable implementation using bit sets awaits standards for
+bitwise logical-ops and byte vectors.
+
+"Large" character types, such as Unicode, should use a sparse representation,
+taking care that the Latin-1 subset continues to be represented with a
+dense 32-byte bit set.
+
+
+-------------------------------------------------------------------------------
+* Acknowledgements
+------------------
+
+The design of this library benefited greatly from the feedback provided during
+the SRFI discussion phase. Among those contributing thoughtful commentary and
+suggestions, both on the mailing list and by private discussion, were Paolo
+Amoroso, Lars Arvestad, Alan Bawden, Jim Bender, Dan Bornstein, Per Bothner,
+Will Clinger, Brian Denheyer, Kent Dybvig, Sergei Egorov, Marc Feeley,
+Matthias Felleisen, Will Fitzgerald, Matthew Flatt, Arthur A. Gleckler, Ben
+Goetter, Sven Hartrumpf, Erik Hilsdale, Shiro Kawai, Richard Kelsey, Oleg
+Kiselyov, Bengt Kleberg, Donovan Kolbly, Bruce Korb, Shriram Krishnamurthi,
+Bruce Lewis, Tom Lord, Brad Lucier, Dave Mason, David Rush, Klaus Schilling,
+Jonathan Sobel, Mike Sperber, Mikael Staldal, Vladimir Tsyshevsky, Donald
+Welsh, and Mike Wilson. I am grateful to them for their assistance.
+
+I am also grateful to the authors, implementors and documentors of all the
+systems mentioned in the introduction. Aubrey Jaffer and Kent Pitman should be
+noted for their work in producing Web-accessible versions of the R5RS and
+Common Lisp specs, which were a tremendous aid.
+
+This is not to imply that these individuals necessarily endorse the final
+results, of course. 
+
+During this document's long development period, great patience was exhibited
+by Mike Sperber, who is the editor for the SRFI, and by Hillary Sullivan,
+who is not.
+
+-------------------------------------------------------------------------------
+* References & links
+--------------------
+
+[Java]
+    The following URLs provide documentation on relevant Java classes.
+
+    http://java.sun.com/products/jdk/1.2/docs/api/java/lang/Character.html
+    http://java.sun.com/products/jdk/1.2/docs/api/java/lang/String.html
+    http://java.sun.com/products/jdk/1.2/docs/api/java/lang/StringBuffer.html
+    http://java.sun.com/products/jdk/1.2/docs/api/java/text/Collator.html
+    http://java.sun.com/products/jdk/1.2/docs/api/java/text/package-summary.html
+
+[MIT-Scheme]
+    http://www.swiss.ai.mit.edu/projects/scheme/
+
+[R5RS]
+    Revised^5 report on the algorithmic language Scheme.
+    R. Kelsey, W. Clinger, J. Rees (editors).
+    Higher-Order and Symbolic Computation, Vol. 11, No. 1, September, 1998.
+    and ACM SIGPLAN Notices, Vol. 33, No. 9, October, 1998.
+
+    Available at http://www.schemers.org/Documents/Standards/
+
+[SRFI]
+    The SRFI web site.
+    http://srfi.schemers.org/
+
+[SRFI-14]
+    SRFI-14: Character-set library.
+    http://srfi.schemers.org/srfi-14/
+
+    This document, in HTML:
+        http://srfi.schemers.org/srfi-14/srfi-14.html
+    This document, in plain text format:
+        http://srfi.schemers.org/srfi-14/srfi-14.txt
+    Source code for the reference implementation:
+        http://srfi.schemers.org/srfi-14/srfi-14.scm
+    Scheme 48 module specification, with typings: 
+        http://srfi.schemers.org/srfi-14/srfi-14-s48-module.scm 
+    Regression-test suite:
+        http://srfi.schemers.org/srfi-14/srfi-14-tests.scm 
+
+[Unicode]
+    http://www.unicode.org/
+
+[UnicodeData]
+    The Unicode character database.
+    ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.html
+    ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.txt
+
+
+-------------------------------------------------------------------------------
+* Copyright
+-----------
+
+Certain portions of this document -- the specific, marked segments of text
+describing the R5RS procedures -- were adapted with permission from the R5RS
+report.
+    
+All other text is copyright (C) Olin Shivers (1998, 1999). 
+All Rights Reserved. 
+
+This document and translations of it may be copied and furnished to others,
+and derivative works that comment on or otherwise explain it or assist in its
+implementation may be prepared, copied, published and distributed, in whole or
+in part, without restriction of any kind, provided that the above copyright
+notice and this paragraph are included on all such copies and derivative
+works. However, this document itself may not be modified in any way, such as
+by removing the copyright notice or references to the Scheme Request For
+Implementation process or editors, except as needed for the purpose of
+developing SRFIs in which case the procedures for copyrights defined in the
+SRFI process must be followed, or as required to translate it into languages
+other than English.
+
+The limited permissions granted above are perpetual and will not be revoked by
+the authors or their successors or assigns.
+
+This document and the information contained herein is provided on an "AS IS"
+basis and THE AUTHORS AND THE SRFI EDITORS DISCLAIM ALL WARRANTIES, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO ANY WARRANTY THAT THE USE OF THE
+INFORMATION HEREIN WILL NOT INFRINGE ANY RIGHTS OR ANY IMPLIED WARRANTIES OF
+MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE.
+
+
+
+-------------------------------------------------------------------------------
+* Ispell "buffer local" dictionary
+----------------------------------
+
+Ispell dumps "buffer local" words here. Please ignore.
+
+ LocalWords:  SRFI Unicode API RS lib ARG ascii xor diff defs Generalise cs CSi
+ LocalWords:  kons knil proc upcase cset lp eof lis cdr pred ary CHARi Posix op
+ LocalWords:  uniquified DrScheme soh nul HTML srfi html txt scm Clinger Rees
+ LocalWords:  SIGPLAN refs ucs iso CS's downcase IEC conformant JIS ASCII URL
+ LocalWords:  FFF abcdefghijklmnopqrstuvwxyz DF DIAERESIS AE EA EB EC EE EF ETH
+ LocalWords:  FA FB FC FD FF SS diaeresis isLowerCase Ll AA BA titlecase CA CB
+ LocalWords:  CC CD CE CF DA DC DD Lt CARON PSILI PROSGEGRAMMENI DASIA VARIA Lu
+ LocalWords:  OXIA PERISPOMENI FAA FAB FAC FAE FAF FBC FFC Lm Lo abcdefABCDEF
+ LocalWords:  Zs Zl Zp OGHAM IDEOGRAPHIC recognised isspace isWhitespace Pc Pd
+ LocalWords:  tokenizers IsISOControl Ps Pe Pf AB BB BF Sm Sc Sk AC AF MACRON
+ LocalWords:  PILCROW obj EQ scsh ops UnicodeData Paolo Amoroso Arvestad Bawden
+ LocalWords:  Bornstein Bothner Denheyer Dybvig Egorov Feeley Matthias Flatt eq
+ LocalWords:  Felleisen Gleckler Goetter Sven Hartrumpf Hilsdale Shiro Kawai
+ LocalWords:  Kiselyov Bengt Kleberg Kolbly Korb Shriram Krishnamurthi Lucier
+ LocalWords:  Schilling Sobel Mikael Staldal Tsyshevsky documentors Jaffer ans
+ LocalWords:  Sperber bignum fixnum ref init doc dict subform
diff --git a/scsh/lib/cset-obsolete.scm b/scsh/lib/cset-obsolete.scm
new file mode 100644
index 0000000..c37e761
--- /dev/null
+++ b/scsh/lib/cset-obsolete.scm
@@ -0,0 +1,52 @@
+;;; Support for obsolete, deprecated 0.5.2 char-set procedures.
+;;; Will go away in a future release.
+;;; The trailing comment on each export names its current replacement.
+(define-interface obsolete-char-set-interface
+  (export char-set-members		; char-set->list
+	  chars->char-set		; list->char-set
+	  ascii-range->char-set		; ucs-range->char-set (not exact)
+	  predicate->char-set		; char-set-filter (not exact)
+	  ->char-set			; no longer handles a predicate
+	  char-set-every?		; char-set-every
+
+	  char-set-invert		; char-set-complement
+	  char-set-invert!		; char-set-complement!
+
+	  char-set:alphabetic		; char-set:letter
+	  char-set:numeric		; char-set:digit
+	  char-set:alphanumeric		; char-set:letter+digit
+	  char-set:control))		; char-set:iso-control
+
+
+(define-structure obsolete-char-set-lib obsolete-char-set-interface
+  (open scsh-utilities char-set-lib scheme)
+  (begin
+    ;; Procedures: (DEPRECATED-PROC replacement 'obsolete-name advice-string).
+    (define char-set-members
+      (deprecated-proc char-set->list 'char-set-members
+		       "Use CHAR-SET->LIST instead."))
+    (define chars->char-set
+      (deprecated-proc list->char-set 'chars->char-set
+		       "Use LIST->CHAR-SET instead."))
+    (define ascii-range->char-set	; old 2-arg form; #t fills the 3rd argument
+      (deprecated-proc (lambda (lower upper) (ucs-range->char-set lower upper #t))
+		       'ascii-range->char-set
+		       "Use UCS-RANGE->CHAR-SET instead."))
+    (define predicate->char-set		; filters CHAR-SET:FULL with the predicate
+      (deprecated-proc (lambda (pred) (char-set-filter pred char-set:full))
+		       'predicate->char-set
+		       "Change code to use CHAR-SET-FILTER."))
+    (define char-set-every?
+      (deprecated-proc char-set-every 'char-set-every?
+		       "Use CHAR-SET-EVERY instead."))
+    (define char-set-invert
+      (deprecated-proc char-set-complement 'char-set-invert
+		       "Use CHAR-SET-COMPLEMENT instead."))
+    (define char-set-invert!
+      (deprecated-proc char-set-complement! 'char-set-invert!
+		       "Use CHAR-SET-COMPLEMENT! instead."))
+    ;; Constants: each obsolete name is a plain alias for the current set.
+    (define char-set:alphabetic		char-set:letter)
+    (define char-set:numeric		char-set:digit)
+    (define char-set:alphanumeric	char-set:letter+digit)
+    (define char-set:control		char-set:iso-control)))
diff --git a/scsh/lib/cset-package.scm b/scsh/lib/cset-package.scm
new file mode 100644
index 0000000..28812c0
--- /dev/null
+++ b/scsh/lib/cset-package.scm
@@ -0,0 +1,151 @@
+;;; SRFI-14 interface for Scheme48				-*- Scheme -*-
+;;; 
+;;; Complete interface spec for the SRFI-14 char-set-lib library in the
+;;; Scheme48 interface and module language. The interface is fully typed, in
+;;; the Scheme48 type notation. The structure definitions also provide a
+;;; formal description of the external dependencies of the source code.
+
+(define-interface char-set-interface
+  (export (char-set? (proc (:value) :boolean))
+	  ((char-set= char-set<=) (proc (&rest :value) :boolean))
+
+	  (char-set-hash (proc (:value &opt :exact-integer) :exact-integer))
+
+	  ;; Cursors are exact integers in the reference implementation.
+	  ;; These typings would be different with a different cursor
+	  ;; implementation.
+	  ;; Too bad Scheme doesn't have abstract data types.
+	  (char-set-cursor      (proc (:value) :exact-integer))
+	  (char-set-ref         (proc (:value :exact-integer) :char))
+	  (char-set-cursor-next (proc (:value :exact-integer) :exact-integer))
+	  (end-of-char-set?     (proc (:exact-integer) :boolean)) ; arg is a cursor
+
+	  (char-set-fold (proc ((proc (:char :value) :value) :value :value)
+			       :value))
+	  (char-set-unfold (proc ((proc (:value) :boolean)
+				  (proc (:value) :value)
+				  (proc (:value) :value)
+				  :value
+				  &opt :value)
+				 :value))
+
+	  (char-set-unfold! (proc ((proc (:value) :boolean)
+				   (proc (:value) :value)
+				   (proc (:value) :value)
+				   :value :value)
+				  :value))
+
+	  (char-set-for-each (proc ((proc (:char) :values) :value) :unspecific))
+	  (char-set-map (proc ((proc (:char) :char) :value) :value))
+
+	  (char-set-copy (proc (:value) :value))
+
+	  (char-set (proc (&rest :char) :value))
+
+	  (list->char-set (proc (:value &opt :value) :value))
+	  (list->char-set! (proc (:value :value) :value))
+
+	  (string->char-set  (proc (:value &opt :value) :value))
+	  (string->char-set! (proc (:value :value) :value))
+
+	  (ucs-range->char-set (proc (:exact-integer :exact-integer &opt
+				      :boolean :value)
+				     :value))
+	  (ucs-range->char-set! (proc (:exact-integer :exact-integer
+				      :boolean :value)
+				     :value))
+
+	  (char-set-filter  (proc ((proc (:char) :boolean) :value &opt :value) :value))
+	  (char-set-filter! (proc ((proc (:char) :boolean) :value :value) :value))
+
+	  (->char-set (proc (:value) :value))
+
+	  (char-set-size (proc (:value) :exact-integer))
+	  (char-set-count (proc ((proc (:char) :boolean) :value) :exact-integer))
+	  (char-set-contains? (proc (:char :value) :boolean))
+
+	  (char-set-every (proc ((proc (:char) :boolean) :value) :boolean))
+	  (char-set-any (proc ((proc (:char) :boolean) :value) :value))
+
+	  ((char-set-adjoin  char-set-delete
+	    char-set-adjoin! char-set-delete!)
+	   (proc (:value &rest :char) :value))
+
+	  (char-set->list   (proc (:value) :value))
+	  (char-set->string (proc (:value) :string))
+
+	  (char-set-complement (proc (:value) :value))
+	  ((char-set-union char-set-intersection char-set-xor)
+	   (proc (&rest :value) :value))
+	  ;; Difference is n-ary too (cs1 cs2 ...), hence &rest rather than &opt.
+	  (char-set-difference (proc (:value &rest :value) :value))
+
+	  (char-set-diff+intersection (proc (:value &rest :value)
+					    (some-values :value :value)))
+
+	  (char-set-complement! (proc (:value) :value))
+	  ;; The linear-update operations below also take cs1 cs2 ... (&rest).
+	  ((char-set-union! char-set-intersection!
+	    char-set-xor! char-set-difference!)
+	   (proc (:value &rest :value) :value))
+
+	  (char-set-diff+intersection! (proc (:value :value &rest :value)
+					     (some-values :value :value)))
+
+	  char-set:lower-case
+	  char-set:upper-case
+	  char-set:letter
+	  char-set:digit
+	  char-set:letter+digit
+	  char-set:graphic
+	  char-set:printing
+	  char-set:whitespace
+	  char-set:blank
+	  char-set:iso-control
+	  char-set:punctuation
+	  char-set:symbol
+	  char-set:hex-digit
+	  char-set:ascii
+	  char-set:empty
+	  char-set:full
+	  ))
+
+; rdelim.scm gets into the innards of char-sets, so CHAR-SET:S is exported here.
+(define-interface scsh-char-set-low-level-interface
+  (export (char-set:s (proc (:value) :string))))
+
+(define-structures ((char-set-lib char-set-interface)
+		    (scsh-char-set-low-level-lib scsh-char-set-low-level-interface))
+  (open error-package	; provides ERROR
+	let-opt		; provides LET-OPTIONALS* and :OPTIONAL
+	ascii		; provides CHAR->ASCII and ASCII->CHAR
+	bitwise		; provides BITWISE-AND
+	jar-d-r-t-package ; provides the DEFINE-RECORD-TYPE/JAR macro
+	scheme)
+
+  (begin (define (check-arg pred val caller)	; loop until PRED accepts a value
+	   (let retry ((candidate val))
+	     (cond ((pred candidate) candidate)
+		   (else (retry (error "Bad argument" candidate pred caller))))))
+
+	 (define %latin1->char ascii->char)	; Works for S48
+	 (define %char->latin1 char->ascii)	; Works for S48
+
+	 ;; SRFI-9 d-r-t, defined in terms of jar's almost-identical d-r-t.
+	 (define-syntax define-record-type
+	   (syntax-rules ()
+             ((_ ?type ?clause ...)
+	      (define-record-type/jar ?type ?type ?clause ...)))))
+
+  (files cset-lib)
+  (optimize auto-integrate))
+
+;;; Pull in jar's DEFINE-RECORD-TYPE macro from DEFINE-RECORD-TYPES and
+;;; re-export it under the alias DEFINE-RECORD-TYPE/JAR.
+(define-structure jar-d-r-t-package (export (define-record-type/jar :syntax))
+  (open define-record-types ; home of JAR's record macro
+	scheme)
+  (begin (define-syntax define-record-type/jar
+	   (syntax-rules ()
+             ((_ ?form ...)
+	      (define-record-type ?form ...))))))
diff --git a/scsh/lib/cset-tests.scm b/scsh/lib/cset-tests.scm
new file mode 100644
index 0000000..0b96314
--- /dev/null
+++ b/scsh/lib/cset-tests.scm
@@ -0,0 +1,200 @@
+;;; This is a regression testing suite for the SRFI-14 char-set library.
+;;; Olin Shivers
+
+(let-syntax ((test (syntax-rules ()
+		     ((test form ...)
+		      (cond ((not form) (error "Test failed" 'form)) ...
+			    (else 'OK))))))
+  (let ((vowel? (lambda (c) (member c '(#\a #\e #\i #\o #\u))))) ; predicate used by the filter/count tests
+
+(test
+ (not (char-set? 5))
+
+ (char-set? (char-set #\a #\e #\i #\o #\u))
+
+ (char-set=)
+ (char-set= (char-set))
+
+ (char-set= (char-set #\a #\e #\i #\o #\u)
+	    (string->char-set "ioeauaiii"))
+
+ (not (char-set= (char-set #\e #\i #\o #\u)
+		 (string->char-set "ioeauaiii")))
+
+ (char-set<=)
+ (char-set<= (char-set))
+
+ (char-set<= (char-set #\a #\e #\i #\o #\u)
+	     (string->char-set "ioeauaiii"))
+
+ (char-set<= (char-set #\e #\i #\o #\u)
+	     (string->char-set "ioeauaiii"))
+
+ (<= 0 (char-set-hash char-set:graphic 100) 99)
+
+ (= 4 (char-set-fold (lambda (c i) (+ i 1)) 0
+		     (char-set #\e #\i #\o #\u #\e #\e)))
+
+ (char-set= (string->char-set "eiaou2468013579999")
+	    (char-set-unfold null? car cdr '(#\a #\e #\i #\o #\u #\u #\u)
+			     char-set:digit))
+
+ (char-set= (string->char-set "eiaou246801357999")
+	    (char-set-unfold! null? car cdr '(#\a #\e #\i #\o #\u)
+			      (string->char-set "0123456789")))
+
+ (not (char-set= (string->char-set "eiaou246801357")
+		 (char-set-unfold! null? car cdr '(#\a #\e #\i #\o #\u)
+				   (string->char-set "0123456789"))))
+
+ (let ((cs (string->char-set "0123456789")))
+   (char-set-for-each (lambda (c) (set! cs (char-set-delete cs c)))
+		      (string->char-set "02468000"))
+   (char-set= cs (string->char-set "97531")))
+
+ (not (let ((cs (string->char-set "0123456789")))
+	(char-set-for-each (lambda (c) (set! cs (char-set-delete cs c)))
+			   (string->char-set "02468"))
+	(char-set= cs (string->char-set "7531"))))
+
+ (char-set= (char-set-map char-upcase (string->char-set "aeiou"))
+	    (string->char-set "IOUAEEEE"))
+
+ (not (char-set= (char-set-map char-upcase (string->char-set "aeiou"))
+		 (string->char-set "OUAEEEE")))
+
+ (char-set= (char-set-copy (string->char-set "aeiou"))
+	    (string->char-set "aeiou"))
+
+ (char-set= (char-set #\x #\y) (string->char-set "xy"))
+ (not (char-set= (char-set #\x #\y #\z) (string->char-set "xy")))
+
+ (char-set= (string->char-set "xy") (list->char-set '(#\x #\y)))
+ (not (char-set= (string->char-set "axy") (list->char-set '(#\x #\y))))
+
+ (char-set= (string->char-set "xy12345")
+	    (list->char-set '(#\x #\y) (string->char-set "12345")))
+ (not (char-set= (string->char-set "y12345")
+		 (list->char-set '(#\x #\y) (string->char-set "12345"))))
+
+ (char-set= (string->char-set "xy12345")
+	    (list->char-set! '(#\x #\y) (string->char-set "12345")))
+ (not (char-set= (string->char-set "y12345")
+		 (list->char-set! '(#\x #\y) (string->char-set "12345"))))
+
+ (char-set= (string->char-set "aeiou12345")
+	    (char-set-filter vowel? char-set:ascii (string->char-set "12345")))
+ (not (char-set= (string->char-set "aeou12345")
+		 (char-set-filter vowel? char-set:ascii (string->char-set "12345"))))
+
+ (char-set= (string->char-set "aeiou12345")
+	    (char-set-filter! vowel? char-set:ascii (string->char-set "12345")))
+ (not (char-set= (string->char-set "aeou12345")
+		 (char-set-filter! vowel? char-set:ascii (string->char-set "12345"))))
+
+
+ (char-set= (string->char-set "abcdef12345")
+	    (ucs-range->char-set 97 103 #t (string->char-set "12345")))
+ (not (char-set= (string->char-set "abcef12345")
+		 (ucs-range->char-set 97 103 #t (string->char-set "12345"))))
+
+ (char-set= (string->char-set "abcdef12345")
+	    (ucs-range->char-set! 97 103 #t (string->char-set "12345")))
+ (not (char-set= (string->char-set "abcef12345")
+		 (ucs-range->char-set! 97 103 #t (string->char-set "12345"))))
+
+
+ (char-set= (->char-set #\x)
+	    (->char-set "x")
+	    (->char-set (char-set #\x)))
+
+ (not (char-set= (->char-set #\x)
+		 (->char-set "y")
+		 (->char-set (char-set #\x))))
+
+ (= 10 (char-set-size (char-set-intersection char-set:ascii char-set:digit)))
+
+ (= 5 (char-set-count vowel? char-set:ascii))
+
+ (equal? '(#\x) (char-set->list (char-set #\x)))
+ (not (equal? '(#\X) (char-set->list (char-set #\x))))
+
+ (equal? "x" (char-set->string (char-set #\x)))
+ (not (equal? "X" (char-set->string (char-set #\x))))
+
+ (char-set-contains? (->char-set "xyz") #\x)
+ (not (char-set-contains? (->char-set "xyz") #\a))
+
+ (char-set-every char-lower-case? (->char-set "abcd"))
+ (not (char-set-every char-lower-case? (->char-set "abcD")))
+ (char-set-any char-lower-case? (->char-set "abcd"))
+ (not (char-set-any char-lower-case? (->char-set "ABCD")))
+
+ (char-set= (->char-set "ABCD")
+	    (let ((cs (->char-set "abcd")))
+	      (let lp ((cur (char-set-cursor cs)) (ans '()))
+		(if (end-of-char-set? cur) (list->char-set ans)
+		    (lp (char-set-cursor-next cs cur)
+			(cons (char-upcase (char-set-ref cs cur)) ans))))))
+
+
+ (char-set= (char-set-adjoin (->char-set "123") #\x #\a)
+	    (->char-set "123xa"))
+ (not (char-set= (char-set-adjoin (->char-set "123") #\x #\a)
+		 (->char-set "123x")))
+ (char-set= (char-set-adjoin! (->char-set "123") #\x #\a)
+	    (->char-set "123xa"))
+ (not (char-set= (char-set-adjoin! (->char-set "123") #\x #\a)
+		 (->char-set "123x")))
+
+ (char-set= (char-set-delete (->char-set "123") #\2 #\a #\2)
+	    (->char-set "13"))
+ (not (char-set= (char-set-delete (->char-set "123") #\2 #\a #\2)
+		 (->char-set "13a")))
+ (char-set= (char-set-delete! (->char-set "123") #\2 #\a #\2)
+	    (->char-set "13"))
+ (not (char-set= (char-set-delete! (->char-set "123") #\2 #\a #\2)
+		 (->char-set "13a")))
+
+ (char-set= (char-set-intersection char-set:hex-digit (char-set-complement char-set:digit))
+	    (->char-set "abcdefABCDEF"))
+ (char-set= (char-set-intersection! (char-set-complement! (->char-set "0123456789"))
+				    char-set:hex-digit)
+	    (->char-set "abcdefABCDEF"))
+
+ (char-set= (char-set-union char-set:hex-digit
+			    (->char-set "abcdefghijkl"))
+	    (->char-set "abcdefABCDEFghijkl0123456789"))
+ (char-set= (char-set-union! (->char-set "abcdefghijkl")
+			     char-set:hex-digit)
+	    (->char-set "abcdefABCDEFghijkl0123456789"))
+
+ (char-set= (char-set-difference (->char-set "abcdefghijklmn")
+				 char-set:hex-digit)
+	    (->char-set "ghijklmn"))
+ (char-set= (char-set-difference! (->char-set "abcdefghijklmn")
+				  char-set:hex-digit)
+	    (->char-set "ghijklmn"))
+
+ (char-set= (char-set-xor (->char-set "0123456789")
+			  char-set:hex-digit)
+	    (->char-set "abcdefABCDEF"))
+ (char-set= (char-set-xor! (->char-set "0123456789")
+			   char-set:hex-digit)
+	    (->char-set "abcdefABCDEF"))
+
+ (call-with-values (lambda ()
+		     (char-set-diff+intersection char-set:hex-digit
+						 char-set:letter))
+   (lambda (d i)
+     (and (char-set= d (->char-set "0123456789"))
+	  (char-set= i (->char-set "abcdefABCDEF")))))
+
+ (call-with-values (lambda ()
+		     (char-set-diff+intersection! (char-set-copy char-set:hex-digit)
+						  (char-set-copy char-set:letter)))
+   (lambda (d i)
+     (and (char-set= d (->char-set "0123456789"))
+	  (char-set= i (->char-set "abcdefABCDEF"))))))
+
+))
diff --git a/scsh/lib/list-lib.scm b/scsh/lib/list-lib.scm
index 2491355..7386882 100644
--- a/scsh/lib/list-lib.scm
+++ b/scsh/lib/list-lib.scm
@@ -16,6 +16,11 @@
 ;;; This implementation is intended as a portable reference implementation
 ;;; for SRFI-1. See the porting notes below for more information.
 
+;;; Revision history
+;;;;;;;;;;;;;;;;;;;;
+;;; This is version 1.1. 12/18/2000
+;;; Fixes a small bug in DELETE-DUPLICATES!.
+
 ;;; Exported:
 ;;; xcons tree-copy make-list list-tabulate cons* list-copy 
 ;;; proper-list? circular-list? dotted-list? not-pair? null-list? list=
@@ -384,7 +389,7 @@
 (define (null-list? l)
   (cond ((pair? l) #f)
 	((null? l) #t)
-	(else (error "null-pair?: argument out of domain" l))))
+	(else (error "null-list?: argument out of domain" l))))
            
 
 (define (list= = . lists)
@@ -1239,7 +1244,7 @@
 		 (new-tail (recur (delete x tail elt=))))
 	    (if (eq? tail new-tail) lis (cons x new-tail)))))))
 
-(define (delete-duplicates! lis maybe-=)
+(define (delete-duplicates! lis . maybe-=)
   (let ((elt= (:optional maybe-= equal?)))
     (check-arg procedure? elt= delete-duplicates!)
     (let recur ((lis lis))
diff --git a/scsh/lib/srfi-1.html b/scsh/lib/srfi-1.html
index 125ae20..18e6c39 100644
--- a/scsh/lib/srfi-1.html
+++ b/scsh/lib/srfi-1.html
@@ -1,4 +1,4 @@
-<!doctype html public '-//W3C//DTD HTML 4.0//EN'
+<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.0//EN"
   'http://www.w3.org/TR/REC-html40/strict.dtd'>
 
 <!-- Is there a portable way to write an em-dash?
@@ -36,9 +36,15 @@
 	   div.indent { margin-left: 2em; }	  /* General indentation */
 	   pre.code-example { margin-left: 2em; } /* Indent code examples. */
 
+	   /* "Continue" class marks text that isn't really the start
+	   ** of a new paragraph -- e.g., continuing a para after a 
+	   ** code sample.
+	   */
+	   p.continue { text-indent: 0em; margin-top: 0em}
+
 	   /* This stuff is for definition lists of defined procedures.
            ** A proc-def2 is used when you want a stack of procs to go
-	   ** with one <dd> ... </dd> body. In this case, make the first
+	   ** with one dd body. In this case, make the first
 	   ** proc a proc-def1, following ones proc-defi's, and the last one
            ** a proc-defn.
            **
@@ -101,7 +107,7 @@
            a.draft { color: red; }
     </style>
 
-    <style type="text/css"; media=all>
+    <style type="text/css" media=all>
 	   /* Nastiness: Here, I'm using a bug to work around a bug.
 	   ** Netscape rendering bugs mean you need bogus <dt> and <dd>
 	   ** margin settings -- settings which screw up IE's proper rendering.
@@ -140,12 +146,28 @@ List Library
 </div>
 
 <!--========================================================================-->
-<h1>Author</H1>
+<H1>Author</H1>
+<p>
+Olin Shivers
+
     <address>
-       <a href="http://www.ai.mit.edu/~shivers/">Olin Shivers</A> /
-       <a href="mailto:shivers@ai.mit.edu">shivers@ai.mit.edu</A>
+      <a href="http://www.ai.mit.edu/~shivers/">http://www.ai.mit.edu/~shivers/</A> /
+      <a href="mailto:shivers@ai.mit.edu">shivers@ai.mit.edu</A>
     </address>
 
+<!--========================================================================-->
+<H1>Status</H1>
+<p>
+This SRFI is currently in ``final'' status.  To see an explanation of each status that a SRFI can hold, see <A HREF="http://srfi.schemers.org/srfi-process.html">here</A>.
+You can access the discussion via <A HREF=mail-archive/maillist.html>the archive of the mailing list</A>.
+<P>
+<UL>
+    <LI>Received: 1998/11/08</LI>
+    <LI>Draft: 1998/12/22-1999/03/09</LI>
+    <LI>Revised: several times</LI>
+    <LI>Final: 1999/10/09</LI>
+</UL>
+
 <!--========================================================================-->
 <h1>Table of contents</H1>
 
@@ -154,7 +176,7 @@ List Library
 -->
 <ul id=toc-table>
 <li><a href="#Abstract">Abstract</a>
-<li><a href="#Introduction">Introduction</a>
+<li><a href="#Rationale">Rationale</a>
 <li><a href="#ProcedureIndex">Procedure index</a>
 <li><a href="#GeneralDiscussion">General discussion</a>
   <ul>
@@ -196,14 +218,8 @@ reference implementation of the spec. The reference implementation is
 <li>completely open, public-domain source
 </ul>
 
-<strong><em>Note: This is a working draft, and tends to lag the plain-text version in terms of actual content.
-See <a href="ftp://ftp.ai.mit.edu/people/shivers/srfi/srfi-1/srfi-1.txt">
-    ftp://ftp.ai.mit.edu/people/shivers/srfi/srfi-1/srfi-1.txt</a>
-for the latest copy of the plain-text draft.
-</em></strong>
-
 <!--========================================================================-->
-<h1><a name="Introduction">Introduction</a></h1>
+<h1><a name="Rationale">Rationale</a></h1>
 <p>
 The set of basic list and pair operations provided by R4RS/<abbr title="Revised^5 Report on Scheme"><a href="#R5RS">R5RS</a></abbr> Scheme is far
 from satisfactory. Because this set is so small and basic, most
@@ -278,9 +294,9 @@ library and get good results with it.
 <h1><a name="ProcedureIndex">Procedure Index</a></h1>
 <p>
 Here is a short list of the procedures provided by the list-lib package.
-<a href="#R5RS">R5RS</a></abbr> procedures are shown in 
-<span class=r5rs-proc>bold</span class=r5rs-proc>;
-extended <a href="#R5RS">R5RS</a></abbr> 
+<abbr title="Revised^5 Report on Scheme"><a href="#R5RS">R5RS</a></abbr> procedures are shown in 
+<span class=r5rs-proc>bold</span>;
+extended <abbr title="Revised^5 Report on Scheme"><a href="#R5RS">R5RS</a></abbr> 
          procedures, in <span class=r5rs-procx>bold italic</span>.
 <div class=indent>
 <dl>
@@ -1033,9 +1049,10 @@ partition the entire universe of Scheme values.
 <!--
 ==== car cdr
 ============================================================================-->
+<dt class=proc-def1>
 <a name="car"></a>
 <a name="cdr"></a>
-<dt class=proc-def1><code class=proc-def>car</code><var> pair -&gt; value</var>
+<code class=proc-def>car</code><var> pair -&gt; value</var>
 <dt class=proc-defn><code class=proc-def>cdr</code><var> pair -&gt; value</var>
 <dd class=proc-def>
     [<abbr title="Revised^5 Report on Scheme"><a href="#R5RS">R5RS</a></abbr>]
@@ -2786,6 +2803,7 @@ That is, it must be the case that
 <div class=indent>
         <code>(eq? <var>x</var> <var>y</var>)</code> => <code>(<var>=</var> <var>x</var> <var>y</var>)</code>.
 </div>
+<p class=continue>
 Note that this implies, in turn, that two lists that are <code>eq?</code> are
 also set-equal by any legal comparison procedure. This allows for
 constant-time determination of set operations on <code>eq?</code> lists.
@@ -3142,7 +3160,7 @@ John David Stone, and Joerg F. Wittenberger. I am grateful to them for their
 assistance.
 <p>
 I am also grateful the authors, implementors and documentors of all the systems
-mentioned in the introduction. Aubrey Jaffer and Kent Pitman should be noted
+mentioned in the rationale.  Aubrey Jaffer and Kent Pitman should be noted
 for their work in producing Web-accessible versions of the R5RS and 
 <a href="#CommonLisp">Common Lisp</a> spec, which was a tremendous aid.
 <p>
@@ -3156,31 +3174,15 @@ results, of course.
 
 <dl>
 <dt class=biblio>This document, in HTML:
-<dd><a href="http://srfi.schemers.org/srfi-1/srfi-1.html">
+<dd><a href="srfi-1.html">
     http://srfi.schemers.org/srfi-1/srfi-1.html</a>
 
-    <br><a class=draft
-           href="ftp://ftp.ai.mit.edu/people/shivers/srfi/srfi-1/srfi-1.html">
-    ftp://ftp.ai.mit.edu/people/shivers/srfi/srfi-1/srfi-1.html (draft)</a>
-
-<dt class=biblio>This document, in simple text format:
-<dd><a href="http://srfi.schemers.org/srfi-1/srfi-1.txt">
-    http://srfi.schemers.org/srfi-1/srfi-1.txt</a>
-
-    <br><a class=draft
-           href="ftp://ftp.ai.mit.edu/people/shivers/srfi/srfi-1/srfi-1.txt">
-    ftp://ftp.ai.mit.edu/people/shivers/srfi/srfi-1/srfi-1.txt (draft)</a>
-
 <dt class=biblio>Source code for the reference implementation:
-<dd><a HREF="http://srfi.schemers.org/srfi-1/srfi-1-reference.scm">
+<dd><a HREF="srfi-1-reference.scm">
     http://srfi.schemers.org/srfi-1/srfi-1-reference.scm</a>
 
-    <br><a class=draft
-           href="ftp://ftp.ai.mit.edu/people/shivers/srfi/srfi-1/srfi-1-reference.scm">
-    ftp://ftp.ai.mit.edu/people/shivers/srfi/srfi-1/srfi-1-reference.scm (draft)</a>
-
 <dt class=biblio>Archive of SRFI-1 discussion-list email:
-<dd><a href="http://srfi.schemers.org/srfi-1/mail-archive/maillist.html">
+<dd><a href="mail-archive/maillist.html">
     http://srfi.schemers.org/srfi-1/mail-archive/maillist.html</a>
 
 <dt class=biblio>SRFI web site:
diff --git a/scsh/lib/string-lib.scm b/scsh/lib/string-lib.scm
index 0282b36..242f6be 100644
--- a/scsh/lib/string-lib.scm
+++ b/scsh/lib/string-lib.scm
@@ -1,229 +1,325 @@
-;;; Scheme Underground string-processing library		-*- Scheme -*-
-;;; Olin Shivers 11/98
-
-;;; SRFI DRAFT -- SRFI DRAFT -- SRFI DRAFT -- SRFI DRAFT -- SRFI DRAFT
-;;; This is *draft* code for a SRFI proposal. If you see this notice in 
-;;; production code, you've got obsolete, bad source -- go find the final 
-;;; non-draft code on the Net.
-;;; SRFI DRAFT -- SRFI DRAFT -- SRFI DRAFT -- SRFI DRAFT -- SRFI DRAFT
-
-;;; Some of this code had (extremely distant) origins in MIT Scheme's string
-;;; lib, and was substantially reworked by Olin Shivers (shivers@ai.mit.edu)
-;;; 9/98. As such, it is
-;;;     Copyright (c) 1988-1994 Massachusetts Institute of Technology.
-;;; The copyright terms are essentially open-software terms;
-;;; the precise terms are at the end of this file.
-;;; 
-;;; The KMP string-search code was massively rehacked from Stephen Bevan's
-;;; code, written for scmlib, and is thus covered by the GPL. If that's a
-;;; problem, write one from scratch (there are citations to standard textbooks
-;;; in the comments), or rip it out and use the ten-line doubly-nested loop
-;;; that's commented out just above this code.
+;;; SRFI 13 string library reference implementation		-*- Scheme -*-
+;;; Olin Shivers 7/2000
 ;;;
-;;; I wish I could mark definitions in this code to be inlined.
-;;; Certain functions could benefit from compiler support.
-;;; 
-;;; My policy on checking start/end substring specs is not uniform.
-;;; I avoided doing arg checks when the function directly calls another
-;;; lower-level function that will check the start/end specs as well.
-;;; This has the advantage of not doing redundant checks, but the disadvantage
-;;; is that errors are not reported early, at the highest possible call.
-;;; There's not much high-level error checking of the other args, anyway.
-;;;     -Olin
+;;; Copyright (c) 1988-1994 Massachusetts Institute of Technology.
+;;; Copyright (c) 1998, 1999, 2000 Olin Shivers. All rights reserved.
+;;;   The details of the copyrights appear at the end of the file. Short
+;;;   summary: BSD-style open source.
 
 ;;; Exports:
-;;; string-map    string-map!
+;;; string-map string-map!
 ;;; string-fold       string-unfold
 ;;; string-fold-right string-unfold-right 
-;;; string-tabulate
-;;; string-for-each string-iter
+;;; string-tabulate string-for-each string-for-each-index
 ;;; string-every string-any
+;;; string-hash string-hash-ci
 ;;; string-compare string-compare-ci
-;;; substring-compare substring-compare-ci
-;;; string= string< string> string<= string>= string<>
+;;; string=    string<    string>    string<=    string>=    string<>
 ;;; string-ci= string-ci< string-ci> string-ci<= string-ci>= string-ci<> 
-;;; substring=     substring<>		substring-ci=  substring-ci<>
-;;; substring<     substring>		substring-ci<  substring-ci>
-;;; substring<=    substring>=		substring-ci<= substring-ci>=
-;;; string-upper-case? string-lower-case?
-;;; capitalize-string  capitalize-words  string-downcase  string-upcase
-;;; capitalize-string! capitalize-words! string-downcase! string-upcase!
+;;; string-downcase  string-upcase  string-titlecase  
+;;; string-downcase! string-upcase! string-titlecase! 
 ;;; string-take string-take-right
 ;;; string-drop string-drop-right
 ;;; string-pad string-pad-right
 ;;; string-trim string-trim-right string-trim-both
 ;;; string-filter string-delete
-;;; string-index string-index-right string-skip string-skip-right
-;;; string-prefix-count string-prefix-count-ci
-;;; string-suffix-count string-suffix-count-ci
-;;; substring-prefix-count substring-prefix-count-ci
-;;; substring-suffix-count substring-suffix-count-ci
+;;; string-index string-index-right 
+;;; string-skip  string-skip-right
+;;; string-count
+;;; string-prefix-length string-prefix-length-ci
+;;; string-suffix-length string-suffix-length-ci
 ;;; string-prefix? string-prefix-ci?
 ;;; string-suffix? string-suffix-ci?
-;;; substring-prefix? substring-prefix-ci?
-;;; substring-suffix? substring-suffix-ci?
-;;; substring? substring-ci?
-;;; string-fill! string-copy! string-copy substring
+;;; string-contains string-contains-ci
+;;; string-copy! substring/shared
 ;;; string-reverse string-reverse! reverse-list->string
-;;; string->list
-;;; string-concat string-concat/shared string-append/shared
+;;; string-concatenate string-concatenate/shared string-concatenate-reverse
+;;; string-append/shared
 ;;; xsubstring string-xcopy!
 ;;; string-null?
-;;; join-strings
+;;; string-join
+;;; string-tokenize
+;;; string-replace
 ;;; 
-;;; string? make-string string string-length string-ref string-set! 
-;;; string-append list->string
+;;; R5RS extended:
+;;; string->list string-copy string-fill! 
 ;;;
-;;; make-kmp-restart-vector
-;;; parse-final-start+end
-;;; parse-start+end
+;;; R5RS re-exports:
+;;; string? make-string string-length string-ref string-set! 
+;;;
+;;; R5RS re-exports (also defined here but commented-out):
+;;; string string-append list->string
+;;;
+;;; Low-level routines:
+;;; make-kmp-restart-vector string-kmp-partial-search kmp-step
+;;; string-parse-start+end
+;;; string-parse-final-start+end
+;;; let-string-start+end
 ;;; check-substring-spec
+;;; substring-spec-ok?
 
 ;;; Imports
+;;; This is a fairly large library. While it was written for portability, you
+;;; must be aware of its dependencies in order to run it in a given scheme
+;;; implementation. Here is a complete list of the dependencies it has and the
+;;; assumptions it makes beyond stock R5RS Scheme:
+;;;
 ;;; This code has the following non-R5RS dependencies:
-;;; - (RECEIVE (var ...) mv-exp body ...) multiple-value binding macro
-;;; - Various imports from the char-set library
-;;; - ERROR
-;;; - LET-OPTIONALS and :OPTIONAL macros for handling optional arguments
-;;; - The R5RS SUBSTRING function is accessed using the Scheme 48
-;;;   STRUCTURE-REF magic accessor.
+;;; - (RECEIVE (var ...) mv-exp body ...) multiple-value binding macro;
+;;;
+;;; - Various imports from the char-set library for the routines that can
+;;;   take char-set arguments;
+;;;   
+;;; - An n-ary ERROR procedure;
+;;;   
+;;; - BITWISE-AND for the hash functions;
+;;;   
+;;; - A simple CHECK-ARG procedure for checking parameter values; it is 
+;;;   (lambda (pred val proc) 
+;;;     (if (pred val) val (error "Bad arg" val pred proc)))
+;;;   
+;;; - :OPTIONAL and LET-OPTIONALS* macros for parsing, defaulting & 
+;;;   type-checking optional parameters from a rest argument;
+;;;   
+;;; - CHAR-CASED? and CHAR-TITLECASE for the STRING-TITLECASE & 
+;;;   STRING-TITLECASE! procedures. The former returns true iff a character is
+;;;   one that has case distinctions; in ASCII it returns true on a-z and A-Z.
+;;;   CHAR-TITLECASE is analogous to CHAR-UPCASE and CHAR-DOWNCASE. In ASCII &
+;;;   Latin-1, it is the same as CHAR-UPCASE.
+;;;
+;;; The code depends upon a small set of core string primitives from R5RS:
+;;;     MAKE-STRING STRING-REF STRING-SET! STRING? STRING-LENGTH SUBSTRING 
+;;; (Actually, SUBSTRING is not a primitive, but we assume that an 
+;;; implementation's native version is probably faster than one we could
+;;; define, so we import it from R5RS.)
+;;;
+;;; The code depends upon a small set of R5RS character primitives:
+;;;   char? char=? char-ci=? char<? char-ci<?
+;;;   char-upcase char-downcase
+;;;   char->integer (for the hash functions)
+;;;   
+;;; We assume the following:
+;;; - CHAR-DOWNCASE o CHAR-UPCASE = CHAR-DOWNCASE
+;;; - CHAR-CI=? is equivalent to
+;;;     (lambda (c1 c2) (char=? (char-downcase (char-upcase c1))
+;;;                             (char-downcase (char-upcase c2))))
+;;; - CHAR-UPCASE, CHAR-DOWNCASE and CHAR-TITLECASE are locale-insensitive
+;;;   and consistent with Unicode's 1-1 char-mapping spec.
+;;; These things are typically true, but if not, you would need to modify
+;;; the case-mapping and case-insensitive routines.
 
+;;; Enough introductory blather. On to the source code. (But see the end of
+;;; the file for further notes on porting & performance tuning.)
 
+
 ;;; Support for START/END substring specs
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 ;;; This macro parses optional start/end arguments from arg lists, defaulting
 ;;; them to 0/(string-length s), and checks them for correctness.
 
-(define-syntax let-start+end
+(define-syntax let-string-start+end
   (syntax-rules ()
-    ((let-start+end (start end) proc s-exp args-exp body ...)
-     (receive (start end) (parse-final-start+end proc s-exp args-exp)
+    ((let-string-start+end (start end) proc s-exp args-exp body ...)
+     (receive (start end) (string-parse-final-start+end proc s-exp args-exp)
+       body ...))
+    ((let-string-start+end (start end rest) proc s-exp args-exp body ...)
+     (receive (rest start end) (string-parse-start+end proc s-exp args-exp)
        body ...))))
 
+;;; This one parses out a *pair* of final start/end indices. 
+;;; Not exported; for internal use.
+(define-syntax let-string-start+end2
+  (syntax-rules ()
+    ((l-s-s+e2 (start1 end1 start2 end2) proc s1 s2 args body ...)
+     (let ((procv proc)) ; Make sure PROC is only evaluated once.
+       (let-string-start+end (start1 end1 rest) procv s1 args
+         (let-string-start+end (start2 end2) procv s2 rest
+           body ...))))))
 
-;;; Returns three values: start end rest
 
-(define (parse-start+end proc s args)
+;;; Returns three values: rest start end
+
+(define (string-parse-start+end proc s args)
+  (if (not (string? s)) (error "Non-string value" proc s))
   (let ((slen (string-length s)))
     (if (pair? args)
 
 	(let ((start (car args))
 	      (args (cdr args)))
-	  (if (or (not (integer? start)) (< start 0))
-	      (error "Illegal substring START spec" proc start s)
+	  (if (and (integer? start) (exact? start) (>= start 0))
 	      (receive (end args)
 		  (if (pair? args)
 		      (let ((end (car args))
 			    (args (cdr args)))
-			(if (or (not (integer? end)) (< slen end))
-			    (error "Illegal substring END spec" proc end s)
-			    (values end args)))
+			(if (and (integer? end) (exact? end) (<= end slen))
+			    (values end args)
+			    (error "Illegal substring END spec" proc end s)))
 		      (values slen args))
-		(if (<= start end) (values start end args)
+		(if (<= start end) (values args start end)
 		    (error "Illegal substring START/END spec"
-			   proc start end s)))))
+			   proc start end s)))
+	      (error "Illegal substring START spec" proc start s)))
 
-	(values 0 (string-length s) '()))))
+	(values '() 0 slen))))
 
-(define (parse-final-start+end proc s args)
-  (receive (start end rest) (parse-start+end proc s args)
+(define (string-parse-final-start+end proc s args)
+  (receive (rest start end) (string-parse-start+end proc s args)
     (if (pair? rest) (error "Extra arguments to procedure" proc rest)
 	(values start end))))
 
+(define (substring-spec-ok? s start end)
+  (and (string? s)
+       (integer? start)
+       (exact? start)
+       (integer? end)
+       (exact? end)
+       (<= 0 start)
+       (<= start end)
+       (<= end (string-length s))))
+
 (define (check-substring-spec proc s start end)
-  (if (or (< start 0)
-	  (< (string-length s) end)
-	  (< end start))
-      (error "Illegal substring START/END spec." proc s start end)))
+  (if (not (substring-spec-ok? s start end))
+      (error "Illegal substring spec." proc s start end)))
+
+
+;;; Defined by R5RS, so commented out here.
+;(define (string . chars)
+;  (let* ((len (length chars))
+;         (ans (make-string len)))
+;    (do ((i 0 (+ i 1))
+;	 (chars chars (cdr chars)))
+;	((>= i len))
+;      (string-set! ans i (car chars)))
+;    ans))
+;
+;(define (string . chars) (string-unfold null? car cdr chars))
 
 
 
-;;; substring   S START [END] 
-;;; string-copy S [START END]
+;;; substring/shared S START [END] 
+;;; string-copy      S [START END]
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
-;;; Redefine SUBSTRING so that the END parameter is optional.
-;;; SUBSTRINGX is the underlying R5RS SUBSTRING function. All
-;;; the code in this file uses the simple SUBSTRINGX, so you can
-;;; easily port this code.
 
-(define substringx (structure-ref scheme substring))	; Simple R5RS SUBSTRING
+;;; All this goop is just arg parsing & checking surrounding a call to the
+;;; actual primitive, %SUBSTRING/SHARED.
 
-(define (substring s start . maybe-end)			; Our SUBSTRING
-  (substringx s start (:optional maybe-end (string-length s))))
+(define (substring/shared s start . maybe-end)
+  (check-arg string? s substring/shared)
+  (let ((slen (string-length s)))
+    (check-arg (lambda (start) (and (integer? start) (exact? start) (<= 0 start)))
+	       start substring/shared)
+    (%substring/shared s start
+		       (:optional maybe-end slen
+				  (lambda (end) (and (integer? end)
+						     (exact? end)
+						     (<= start end)
+						     (<= end slen)))))))
+
+;;; Split out so that other routines in this library can avoid arg-parsing
+;;; overhead for END parameter.
+(define (%substring/shared s start end)
+  (if (and (zero? start) (= end (string-length s))) s
+      (substring s start end)))
 
 (define (string-copy s . maybe-start+end)
-  (let-start+end (start end) string-copy s maybe-start+end
-    (substringx s start end)))
-
+  (let-string-start+end (start end) string-copy s maybe-start+end
+    (substring s start end)))
 
+;This library uses the R5RS SUBSTRING, but doesn't export it.
+;Here is a definition, just for completeness.
+;(define (substring s start end)
+;  (check-substring-spec substring s start end)
+;  (let* ((slen (- end start))
+;         (ans (make-string slen)))
+;    (do ((i 0 (+ i 1))
+;         (j start (+ j 1)))
+;        ((>= i slen) ans)
+;      (string-set! ans i (string-ref s j)))))
 
 ;;; Basic iterators and other higher-order abstractions
 ;;; (string-map proc s [start end])
 ;;; (string-map! proc s [start end])
 ;;; (string-fold kons knil s [start end])
 ;;; (string-fold-right kons knil s [start end])
-;;; (string-unfold p f g seed)
-;;; (string-for-each proc s [start end])
-;;; (string-iter     proc s [start end])
-;;; (string-every pred s [start end])
-;;; (string-any pred s [start end])
+;;; (string-unfold       p f g seed [base make-final])
+;;; (string-unfold-right p f g seed [base make-final])
+;;; (string-for-each       proc s [start end])
+;;; (string-for-each-index proc s [start end])
+;;; (string-every char-set/char/pred s [start end])
+;;; (string-any   char-set/char/pred s [start end])
 ;;; (string-tabulate proc len)
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
-;;; No guarantees about order in MAP, FOR-EACH, EVERY, ANY procs.
-;;;
 ;;; You want compiler support for high-level transforms on fold and unfold ops.
 ;;; You'd at least like a lot of inlining for clients of these procedures.
-;;; Hold your breath.
+;;; Don't hold your breath.
 
 (define (string-map proc s . maybe-start+end)
-  (let-start+end (start end) string-map s maybe-start+end
-    (let* ((len (- end start))
-	   (ans (make-string len)))
-      (do ((i (- end 1) (- i 1))
-	   (j (- len 1) (- j 1)))
-	  ((< j 0))
-	(string-set! ans j (proc (string-ref s i))))
-      ans)))
+  (check-arg procedure? proc string-map)
+  (let-string-start+end (start end) string-map s maybe-start+end
+    (%string-map proc s start end)))
+
+(define (%string-map proc s start end)	; Internal utility
+  (let* ((len (- end start))
+	 (ans (make-string len)))
+    (do ((i (- end 1) (- i 1))
+	 (j (- len 1) (- j 1)))
+	((< j 0))
+      (string-set! ans j (proc (string-ref s i))))
+    ans))
 
 (define (string-map! proc s . maybe-start+end)
-  (let-start+end (start end) string-map! s maybe-start+end
-    (do ((i (- end 1) (- i 1)))
-	((< i start))
-      (string-set! s i (proc (string-ref s i))))))
+  (check-arg procedure? proc string-map!)
+  (let-string-start+end (start end) string-map! s maybe-start+end
+    (%string-map! proc s start end)))
+
+(define (%string-map! proc s start end)
+  (do ((i (- end 1) (- i 1)))
+      ((< i start))
+    (string-set! s i (proc (string-ref s i)))))
 
 (define (string-fold kons knil s . maybe-start+end)
-  (let-start+end (start end) string-fold s maybe-start+end
+  (check-arg procedure? kons string-fold)
+  (let-string-start+end (start end) string-fold s maybe-start+end
     (let lp ((v knil) (i start))
       (if (< i end) (lp (kons (string-ref s i) v) (+ i 1))
 	  v))))
 
 (define (string-fold-right kons knil s . maybe-start+end)
-  (let-start+end (start end) string-fold-right s maybe-start+end
+  (check-arg procedure? kons string-fold-right)
+  (let-string-start+end (start end) string-fold-right s maybe-start+end
     (let lp ((v knil) (i (- end 1)))
       (if (>= i start) (lp (kons (string-ref s i) v) (- i 1))
 	  v))))
 
-;;; (string-unfold p f g seed)
+;;; (string-unfold p f g seed [base make-final])
 ;;; This is the fundamental constructor for strings. 
 ;;; - G is used to generate a series of "seed" values from the initial seed:
 ;;;     SEED, (G SEED), (G^2 SEED), (G^3 SEED), ...
 ;;; - P tells us when to stop -- when it returns true when applied to one 
 ;;;   of these seed values.
 ;;; - F maps each seed value to the corresponding character 
-;;;   in the result string.
+;;;   in the result string. These chars are assembled into the
+;;;   string in a left-to-right order.
+;;; - BASE is the optional initial/leftmost portion of the constructed string;
+;;;   it defaults to the empty string "".
+;;; - MAKE-FINAL is applied to the terminal seed value (on which P returns
+;;;   true) to produce the final/rightmost portion of the constructed string.
+;;;   It defaults to (LAMBDA (X) "").
 ;;;
 ;;; In other words, the following (simple, inefficient) definition holds:
-;;; (string-unfold p f g seed) =
-;;;   (if (p seed) "" 
-;;;       (string-append (string (f seed)) 
-;;;                      (string-unfold p f g (g seed))))
+;;; (define (string-unfold p f g seed base make-final)
+;;;   (string-append base
+;;;                  (let recur ((seed seed))
+;;;                    (if (p seed) (make-final seed)
+;;;                        (string-append (string (f seed))
+;;;                                       (recur (g seed)))))))
 ;;; 
 ;;; STRING-UNFOLD is a fairly powerful constructor -- you can use it to
 ;;; reverse a string, copy a string, convert a list to a string, read
 ;;; a port into a string, and so forth. Examples:
 ;;; (port->string port) =
 ;;;   (string-unfold (compose eof-object? peek-char)
-;;;                  read-char identity port)
+;;;                  read-char values port)
 ;;;
 ;;; (list->string lis) = (string-unfold null? car cdr lis)
 ;;; 
@@ -235,89 +331,195 @@
 ;;; it to give a clear, straightforward description of what the function
 ;;; does.
 
-;(define (string-unfold p f g seed)
-;  (let recur ((seed seed) (i 0))
-;    (if (p seed) (make-string i)
-;        (let* ((c (f seed))
-;               (s (recur (g seed) (+ i 1))))
-;          (string-set! s i c)
-;          s))))
-
-;;; This formulation chunks up the constructed string into 1024-char chunks,
-;;; popping the stack frames. So it'll reduce stack growth by a factor of
-;;; 1024. Marc Feeley alerted me to this issue and its general solution.
-
-(define (string-unfold p f g seed)
-  (string-concat/shared
-	 (let recur ((seed seed))
-	   (receive (s seed done?)
-	            (let recur2 ((seed seed) (i 0))
-		      (cond ((p seed) (values (make-string i) seed #t))
-			    ((>= i 1024) (values (make-string i) seed #f))
-			    (else (let ((c (f seed)))
-				    (receive (s seed done?)
-					     (recur2 (g seed) (+ i 1))
-				      (string-set! s i c)
-				      (values s seed done?))))))
-
-	     (if done? (list s)
-		 (cons s (recur seed)))))))
-
-
-;;; This is the same as STRING-UNFOLD, but defined for multiple 
-;;; seed parameters. If you pass N seeds, then
-;;; - P maps N parameters to a boolean.
-;;; - F maps N parameters to a character.
-;;; - G maps N parameters to N return values.
-;;; This definition does a lot of consing; it would need a fair amount
-;;; of compiler support to be efficient.
-
-; Not released
-;(define (string-unfoldn p f g . seeds)
-;  (apply string-append
-;	 (let recur ((seeds seeds))
-;	   (receive (s seeds done?)
-;	            (let recur2 ((seeds seeds) (i 0))
-;		      (cond ((apply p seeds) (values (make-string i) seeds #t))
-;			    ((>= i 1024) (values (make-string i) seeds #f))
-;			    (else (let ((c (apply f seeds)))
-;				    (receive seeds (apply g seeds)
-;				      (receive (s seeds done?)
-;					       (recur2 seeds (+ i 1))
-;					(string-set! s i c)
-;					(values s seeds done?)))))))
+;(define (string-unfold p f g seed base make-final)
+;  (let ((ans (let recur ((seed seed) (i (string-length base)))
+;               (if (p seed)
+;                   (let* ((final (make-final seed))
+;                          (ans (make-string (+ i (string-length final)))))
+;                     (string-copy! ans i final)
+;                     ans)
 ;
-;	     (if done? (list s)
-;		 (cons s (recur seeds)))))))
+;                   (let* ((c (f seed))
+;                          (s (recur (g seed) (+ i 1))))
+;                     (string-set! s i c)
+;                     s)))))
+;    (string-copy! ans 0 base)
+;    ans))
+
+;;; The strategy is to allocate a series of chunks into which we stash the
+;;; chars as we generate them. Each new chunk is as large as all previous
+;;; chunks combined (so sizes double), starting at 40 and capping at 4096, i.e.
+;;;     40 40 80 160 320 640 1280 2560 4096 4096 4096 4096 4096...
+;;; This should work pretty well for short strings, 1-line (80 char) strings,
+;;; and longer ones. When done, we allocate an answer string and copy the
+;;; chars over from the chunk buffers.
+
+(define (string-unfold p f g seed . base+make-final)
+  (check-arg procedure? p string-unfold)
+  (check-arg procedure? f string-unfold)
+  (check-arg procedure? g string-unfold)
+  (let-optionals* base+make-final
+                  ((base       ""              (string? base))
+		   (make-final (lambda (x) "") (procedure? make-final)))
+    (let lp ((chunks '())		; Previously filled chunks
+	     (nchars 0)			; Number of chars in CHUNKS
+	     (chunk (make-string 40))	; Current chunk into which we write
+	     (chunk-len 40)		; Length of CHUNK
+	     (i 0)			; Number of chars written into CHUNK
+	     (seed seed))		; Seed for the next char to generate
+      (let lp2 ((i i) (seed seed))	; Fill up CHUNK from left to right.
+	(if (not (p seed))		; P true means we stop generating.
+	    (let ((c (f seed))
+		  (seed (g seed)))
+	      (if (< i chunk-len)
+		  (begin (string-set! chunk i c)
+			 (lp2 (+ i 1) seed))
+
+		  (let* ((nchars2 (+ chunk-len nchars))	; CHUNK is full; chars so far
+			 (chunk-len2 (min 4096 nchars2))	; New size, capped at 4096
+			 (new-chunk (make-string chunk-len2)))
+		    (string-set! new-chunk 0 c)		; C opens the new chunk.
+		    (lp (cons chunk chunks) (+ nchars chunk-len)
+			new-chunk chunk-len2 1 seed))))
+
+	    ;; We're done. Make the answer string & install the bits.
+	    (let* ((final (make-final seed))
+		   (flen (string-length final))
+		   (base-len (string-length base))
+		   (j (+ base-len nchars i))		; Index in ANS where FINAL goes
+		   (ans (make-string (+ j flen))))
+	      (%string-copy! ans j final 0 flen)	; Install FINAL.
+	      (let ((j (- j i)))
+		(%string-copy! ans j chunk 0 i)		; Install CHUNK[0,I).
+		(let lp ((j j) (chunks chunks))		; Install CHUNKS.
+		  (if (pair? chunks)			; Newest first, moving left in ANS.
+		      (let* ((chunk  (car chunks))
+			     (chunks (cdr chunks))
+			     (chunk-len (string-length chunk))
+			     (j (- j chunk-len)))
+			(%string-copy! ans j chunk 0 chunk-len)
+			(lp j chunks)))))
+	      (%string-copy! ans 0 base 0 base-len)	; Install BASE.
+	      ans))))))
+
+(define (string-unfold-right p f g seed . base+make-final)
+  (check-arg procedure? p string-unfold-right)	; Validate P, F & G up front,
+  (check-arg procedure? f string-unfold-right)	; exactly as STRING-UNFOLD
+  (check-arg procedure? g string-unfold-right)	; does.
+  (let-optionals* base+make-final
+                  ((base       ""              (string? base))
+		   (make-final (lambda (x) "") (procedure? make-final)))
+    (let lp ((chunks '())		; Previously filled chunks
+	     (nchars 0)			; Number of chars in CHUNKS
+	     (chunk (make-string 40))	; Current chunk into which we write
+	     (chunk-len 40)
+	     (i 40)			; Number of chars available in CHUNK
+	     (seed seed))
+      (let lp2 ((i i) (seed seed))	; Fill up CHUNK from right
+	(if (not (p seed))		; to left.
+	    (let ((c (f seed))
+		  (seed (g seed)))
+	      (if (> i 0)
+		  (let ((i (- i 1)))
+		    (string-set! chunk i c)
+		    (lp2 i seed))
+
+		  ;; CHUNK is full: retire it & start a new one holding C.
+		  (let* ((chunk-len2 (min 4096 (+ chunk-len nchars)))
+			 (new-chunk (make-string chunk-len2))
+			 (i (- chunk-len2 1)))
+		    (string-set! new-chunk i c)
+		    (lp (cons chunk chunks) (+ nchars chunk-len)
+			new-chunk chunk-len2 i seed))))
+
+	    ;; We're done. Make the answer string & install the bits.
+	    (let* ((final (make-final seed))
+		   (flen (string-length final))
+		   (base-len (string-length base))
+		   (chunk-used (- chunk-len i))
+		   (j (+ base-len nchars chunk-used))
+		   (ans (make-string (+ j flen))))
+	      (%string-copy! ans 0 final 0 flen)	; Install FINAL.
+	      (%string-copy! ans flen chunk i chunk-len); Install CHUNK[I,).
+	      (let lp ((j (+ flen chunk-used)) (chunks chunks)) ; Install CHUNKS.
+		(if (pair? chunks)
+		    (let ((chunk (car chunks)))
+		      (%string-copy! ans j chunk 0 (string-length chunk))
+		      (lp (+ j (string-length chunk)) (cdr chunks)))
+		    (%string-copy! ans j base 0 base-len))) ; Install BASE.
+	      ans))))))
+
 
 (define (string-for-each proc s . maybe-start+end)
-  (let-start+end (start end) string-for-each s maybe-start+end
-    (do ((i (- end 1) (- i 1)))
-	((< i start))
-      (proc (string-ref s i)))))
+  (check-arg procedure? proc string-for-each)
+  (let-string-start+end (start end) string-for-each s maybe-start+end
+    ;; Apply PROC to each char of S[START,END), working left to right.
+    (do ((i start (+ i 1)))
+	((>= i end))
+      (proc (string-ref s i)))))
 
-(define (string-iter proc s . maybe-start+end)
-  (let-start+end (start end) string-iter s maybe-start+end
-    (do ((i start (+ i 1)))
-	((>= i end))
-      (proc (string-ref s i)))))
+(define (string-for-each-index proc s . maybe-start+end)
+  (check-arg procedure? proc string-for-each-index)
+  (let-string-start+end (start end) string-for-each-index s maybe-start+end
+    (do ((idx start (+ idx 1)))		; Hand PROC each index in [START,END).
+	((>= idx end)) (proc idx))))
 
-(define (string-every pred s . maybe-start+end)
-  (let-start+end (start end) string-every s maybe-start+end
-    (let lp ((i (- end 1)))
-      (or (< i start)
-	  (and (pred (string-ref s i))
-	       (lp (- i 1)))))))
+(define (string-every criterion s . maybe-start+end)
+  (let-string-start+end (start end) string-every s maybe-start+end
+    (cond ((char? criterion)			; Is every char equal to CRITERION?
+	   (let lp ((i start))
+	     (or (>= i end)
+		 (and (char=? criterion (string-ref s i))
+		      (lp (+ i 1))))))
 
-(define (string-any pred s . maybe-start+end)
-  (let-start+end (start end) string-any s maybe-start+end
-    (let lp ((i (- end 1)))
-      (and (>= i start)
-	   (or (pred (string-ref s i))
-	       (lp (- i 1)))))))
+	  ((char-set? criterion)		; Is every char in the set?
+	   (let lp ((i start))
+	     (or (>= i end)
+		 (and (char-set-contains? criterion (string-ref s i))
+		      (lp (+ i 1))))))
+
+	  ((procedure? criterion)		; Slightly funky loop so that
+	   (or (= start end)			; final (PRED S[END-1]) call
+	       (let lp ((i start))		; is a tail call.
+		 (let ((c (string-ref s i))
+		       (i1 (+ i 1)))
+		   (if (= i1 end) (criterion c)	; Tail call.
+		       (and (criterion c) (lp i1)))))))
+
+	  (else (error "First param is neither char-set, char, or predicate procedure."
+		       string-every criterion)))))	; CRITERION is param #1.
+
+
+(define (string-any criterion s . maybe-start+end)
+  (let-string-start+end (start end) string-any s maybe-start+end
+    (cond ((char? criterion)			; Is some char equal to CRITERION?
+	   (let lp ((i start))
+	     (and (< i end)
+		  (or (char=? criterion (string-ref s i))
+		      (lp (+ i 1))))))
+
+	  ((char-set? criterion)		; Is some char in the set?
+	   (let lp ((i start))
+	     (and (< i end)
+		  (or (char-set-contains? criterion (string-ref s i))
+		      (lp (+ i 1))))))
+
+	  ((procedure? criterion)		; Slightly funky loop so that
+	   (and (< start end)			; final (PRED S[END-1]) call
+		(let lp ((i start))		; is a tail call.
+		  (let ((c (string-ref s i))
+			(i1 (+ i 1)))
+		    (if (= i1 end) (criterion c)	; Tail call
+			(or (criterion c) (lp i1)))))))
+
+	  (else (error "First param is neither char-set, char, or predicate procedure."
+		       string-any criterion)))))	; CRITERION is param #1.
 
 
 (define (string-tabulate proc len)
+  (check-arg procedure? proc string-tabulate)
+  (check-arg (lambda (val) (and (integer? val) (exact? val) (<= 0 val)))
+	     len string-tabulate)
   (let ((s (make-string len)))
     (do ((i (- len 1) (- i 1)))
 	((< i 0))
@@ -326,145 +528,162 @@
 
 
 
-;;; string-prefix-count[-ci] s1 s2
-;;; string-suffix-count[-ci] s1 s2
-;;; substring-prefix-count[-ci] s1 start1 end1  s2 start2 end2
-;;; substring-suffix-count[-ci] s1 start1 end1  s2 start2 end2
+;;; string-prefix-length[-ci] s1 s2 [start1 end1 start2 end2]
+;;; string-suffix-length[-ci] s1 s2 [start1 end1 start2 end2]
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 ;;; Find the length of the common prefix/suffix.
 ;;; It is not required that the two substrings passed be of equal length.
 ;;; This was microcode in MIT Scheme -- a very tightly bummed primitive.
+;;; %STRING-PREFIX-LENGTH is the core routine of all string-comparisons,
+;;; so should be as tense as possible.
 
-(define (substring-prefix-count s1 start1 end1 s2 start2 end2)
-  (check-substring-spec substring-prefix-count s1 start1 end1)
-  (check-substring-spec substring-prefix-count s2 start2 end2)
+(define (%string-prefix-length s1 start1 end1 s2 start2 end2)
   (let* ((delta (min (- end1 start1) (- end2 start2)))
 	 (end1 (+ start1 delta)))
-    (let lp ((i start1) (j start2))
-      (if (or (>= i end1)
-	      (not (char=? (string-ref s1 i)
-			   (string-ref s2 j))))
-	  (- i start1)
-	  (lp (+ i 1) (+ j 1))))))
 
-(define (substring-suffix-count s1 start1 end1 s2 start2 end2)
-  (check-substring-spec substring-suffix-count s1 start1 end1)
-  (check-substring-spec substring-suffix-count s2 start2 end2)
+    (if (and (eq? s1 s2) (= start1 start2))	; EQ fast path: same string
+	delta					; & start, so all DELTA chars match.
+
+	(let lp ((i start1) (j start2))		; Regular path: scan rightwards.
+	  (if (or (>= i end1)			; Stop at the end of the overlap
+		  (not (char=? (string-ref s1 i)	; or at the first mismatch.
+			       (string-ref s2 j))))
+	      (- i start1)			; Number of chars that matched
+	      (lp (+ i 1) (+ j 1)))))))
+
+(define (%string-suffix-length s1 start1 end1 s2 start2 end2)
   (let* ((delta (min (- end1 start1) (- end2 start2)))
 	 (start1 (- end1 delta)))
-    (let lp ((i (- end1 1)) (j (- end2 1)))
-      (if (or (< i start1)
-	      (not (char=? (string-ref s1 i)
-			   (string-ref s2 j))))
-	  (- (- end1 i) 1)
-	  (lp (- i 1) (- j 1))))))
 
-(define (substring-prefix-count-ci s1 start1 end1 s2 start2 end2)
-  (check-substring-spec substring-prefix-count-ci s1 start1 end1)
-  (check-substring-spec substring-prefix-count-ci s2 start2 end2)
+    (if (and (eq? s1 s2) (= end1 end2))		; EQ fast path: same string
+	delta					; & end, so all DELTA chars match.
+
+	(let lp ((i (- end1 1)) (j (- end2 1)))	; Regular path: scan leftwards.
+	  (if (or (< i start1)			; Stop at the start of the overlap
+		  (not (char=? (string-ref s1 i)	; or at the first mismatch.
+			       (string-ref s2 j))))
+	      (- (- end1 i) 1)			; Number of chars that matched
+	      (lp (- i 1) (- j 1)))))))
+
+(define (%string-prefix-length-ci s1 start1 end1 s2 start2 end2)
   (let* ((delta (min (- end1 start1) (- end2 start2)))
 	 (end1 (+ start1 delta)))
-    (let lp ((i start1) (j start2))
-      (if (or (>= i end1)
-	      (not (char-ci=? (string-ref s1 i)
-			      (string-ref s2 j))))
-	  (- i start1)
-	  (lp (+ i 1) (+ j 1))))))
 
-(define (substring-suffix-count-ci s1 start1 end1 s2 start2 end2)
-  (check-substring-spec substring-suffix-count-ci s1 start1 end1)
-  (check-substring-spec substring-suffix-count-ci s2 start2 end2)
+    (if (and (eq? s1 s2) (= start1 start2))	; EQ fast path: same string
+	delta					; & start, so all DELTA chars match.
+
+	(let lp ((i start1) (j start2))		; Regular path: scan rightwards.
+	  (if (or (>= i end1)			; Stop at the end of the overlap
+		  (not (char-ci=? (string-ref s1 i)	; or first CHAR-CI=? mismatch.
+				  (string-ref s2 j))))
+	      (- i start1)			; Number of chars that matched
+	      (lp (+ i 1) (+ j 1)))))))
+
+(define (%string-suffix-length-ci s1 start1 end1 s2 start2 end2)
   (let* ((delta (min (- end1 start1) (- end2 start2)))
 	 (start1 (- end1 delta)))
-    (let lp ((i (- end1 1)) (j (- end2 1)))
-      (if (or (< i start1)
-	      (not (char-ci=? (string-ref s1 i)
-			      (string-ref s2 j))))
-	  (- (- end1 i) 1)
-	  (lp (- i 1) (- j 1))))))
+
+    (if (and (eq? s1 s2) (= end1 end2))		; EQ fast path: same string
+	delta					; & end, so all DELTA chars match.
+
+	(let lp ((i (- end1 1)) (j (- end2 1)))	; Regular path: scan leftwards.
+	  (if (or (< i start1)			; Stop at the start of the overlap
+		  (not (char-ci=? (string-ref s1 i)	; or first CHAR-CI=? mismatch.
+				  (string-ref s2 j))))
+	      (- (- end1 i) 1)			; Number of chars that matched
+	      (lp (- i 1) (- j 1)))))))
 
 
-(define (string-prefix-count s1 s2)
-  (substring-prefix-count s1 0 (string-length s1) s2 0 (string-length s2)))
+(define (string-prefix-length s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)	; Parse the optional bounds.
+			 string-prefix-length s1 s2 maybe-starts+ends
+    (%string-prefix-length s1 from1 to1 s2 from2 to2)))
 
-(define (string-suffix-count s1 s2)
-  (substring-suffix-count s1 0 (string-length s1) s2 0 (string-length s2)))
+(define (string-suffix-length s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)	; Parse the optional bounds.
+			 string-suffix-length s1 s2 maybe-starts+ends
+    (%string-suffix-length s1 from1 to1 s2 from2 to2)))
 
-(define (string-prefix-count-ci s1 s2)
-  (substring-prefix-count-ci s1 0 (string-length s1) s2 0 (string-length s2)))
+(define (string-prefix-length-ci s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)	; Parse the optional bounds.
+			 string-prefix-length-ci s1 s2 maybe-starts+ends
+    (%string-prefix-length-ci s1 from1 to1 s2 from2 to2)))
 
-(define (string-suffix-count-ci s1 s2)
-  (substring-suffix-count-ci s1 0 (string-length s1) s2 0 (string-length s2)))
+(define (string-suffix-length-ci s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)	; Parse the optional bounds.
+			 string-suffix-length-ci s1 s2 maybe-starts+ends
+    (%string-suffix-length-ci s1 from1 to1 s2 from2 to2)))
 
 
-
-;;; string-prefix?    s1 s2 
-;;; string-suffix?    s1 s2 
-;;; string-prefix-ci? s1 s2 
-;;; string-suffix-ci? s1 s2 
-;;; 
-;;; substring-prefix?    s1 start1 end1 s2 start2 end2 
-;;; substring-suffix?    s1 start1 end1 s2 start2 end2 
-;;; substring-prefix-ci? s1 start1 end1 s2 start2 end2 
-;;; substring-suffix-ci? s1 start1 end1 s2 start2 end2 
+;;; string-prefix?    s1 s2 [start1 end1 start2 end2]
+;;; string-suffix?    s1 s2 [start1 end1 start2 end2]
+;;; string-prefix-ci? s1 s2 [start1 end1 start2 end2]
+;;; string-suffix-ci? s1 s2 [start1 end1 start2 end2]
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 ;;; These are all simple derivatives of the previous counting funs.
 
-(define (string-prefix? s1 s2) 
-  (substring-prefix? s1 0 (string-length s1) s2 0 (string-length s2)))
+(define (string-prefix? s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)	; Parse the optional bounds.
+			 string-prefix? s1 s2 maybe-starts+ends
+    (%string-prefix? s1 from1 to1 s2 from2 to2)))
 
-(define (string-suffix? s1 s2) 
-  (substring-suffix-ci? s1 0 (string-length s1) s2 0 (string-length s2)))
+(define (string-suffix? s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)	; Parse the optional bounds.
+			 string-suffix? s1 s2 maybe-starts+ends
+    (%string-suffix? s1 from1 to1 s2 from2 to2)))
 
-(define (string-prefix-ci? s1 s2)
-  (substring-prefix-ci? s1 0 (string-length s1) s2 0 (string-length s2)))
+(define (string-prefix-ci? s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)	; Parse the optional bounds.
+			 string-prefix-ci? s1 s2 maybe-starts+ends
+    (%string-prefix-ci? s1 from1 to1 s2 from2 to2)))
 
-(define (string-suffix-ci? s1 s2)
-  (substring-suffix-ci? s1 0 (string-length s1) s2 0 (string-length s2)))
+(define (string-suffix-ci? s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)	; Parse the optional bounds.
+			 string-suffix-ci? s1 s2 maybe-starts+ends
+    (%string-suffix-ci? s1 from1 to1 s2 from2 to2)))
 
-(define (substring-prefix? s1 start1 end1 s2 start2 end2)
+
+;;; Here are the internal routines that do the real work.
+
+(define (%string-prefix? s1 start1 end1 s2 start2 end2)
   (let ((len1 (- end1 start1)))
     (and (<= len1 (- end2 start2))	; Quick check
-	 (= (substring-prefix-count s1 start1 end1
-				    s2 start2 end2)
+	 (= (%string-prefix-length s1 start1 end1	; True iff the common prefix
+				   s2 start2 end2)	; covers all LEN1 chars of S1.
 	    len1))))
 
-(define (substring-suffix? s1 start1 end1 s2 start2 end2)
+(define (%string-suffix? s1 start1 end1 s2 start2 end2)
   (let ((len1 (- end1 start1)))
     (and (<= len1 (- end2 start2))	; Quick check
-	 (= len1 (substring-suffix-count s1 start1 end1
-					 s2 start2 end2)))))
+	 (= len1 (%string-suffix-length s1 start1 end1	; True iff the common
+					s2 start2 end2)))))	; suffix is LEN1 long.
 
-(define (substring-prefix-ci? s1 start1 end1 s2 start2 end2)
+(define (%string-prefix-ci? s1 start1 end1 s2 start2 end2)
   (let ((len1 (- end1 start1)))
     (and (<= len1 (- end2 start2))	; Quick check
-	 (= len1 (substring-prefix-count-ci s1 start1 end1
-					    s2 start2 end2)))))
+	 (= len1 (%string-prefix-length-ci s1 start1 end1	; True iff the common
+					   s2 start2 end2)))))	; prefix is LEN1 long.
 
-(define (substring-suffix-ci? s1 start1 end1 s2 start2 end2)
+(define (%string-suffix-ci? s1 start1 end1 s2 start2 end2)
   (let ((len1 (- end1 start1)))
     (and (<= len1 (- end2 start2))	; Quick check
-	 (= len1 (substring-suffix-count-ci s1 start1 end1
-					    s2 start2 end2)))))
+	 (= len1 (%string-suffix-length-ci s1 start1 end1	; True iff the common
+					   s2 start2 end2)))))	; suffix is LEN1 long.
 
 
-;;; string-compare    s1 s2 lt-proc eq-proc gt-proc
-;;; string-compare-ci s1 s2 eq-proc lt-proc gt-proc
-;;; substring-compare    s1 start1 end1 s2 start2 end2
-;;;                      lt-proc eq-proc gt-proc
-;;; substring-compare-ci s1 start1 end1 s2 start2 end2
-;;;                      lt-proc eq-proc gt-proc
+;;; string-compare    s1 s2 proc< proc= proc> [start1 end1 start2 end2]
+;;; string-compare-ci s1 s2 proc< proc= proc> [start1 end1 start2 end2]
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 ;;; Primitive string-comparison functions.
 ;;; Continuation order is different from MIT Scheme.
 ;;; Continuations are applied to s1's mismatch index;
 ;;; in the case of equality, this is END1.
 
-(define (substring-compare s1 start1 end1 s2 start2 end2
+(define (%string-compare s1 start1 end1 s2 start2 end2
 			   proc< proc= proc>)
   (let ((size1 (- end1 start1))
 	(size2 (- end2 start2)))
-    (let ((match (substring-prefix-count s1 start1 end1 s2 start2 end2)))
+    (let ((match (%string-prefix-length s1 start1 end1 s2 start2 end2)))
       (if (= match size1)
 	  ((if (= match size2) proc= proc<) end1)
 	  ((if (= match size2)
@@ -474,11 +693,11 @@
 		   proc< proc>))
 	   (+ match start1))))))
 
-(define (substring-compare-ci s1 start1 end1 s2 start2 end2
+(define (%string-compare-ci s1 start1 end1 s2 start2 end2
 			      proc< proc= proc>)
   (let ((size1 (- end1 start1))
 	(size2 (- end2 start2)))
-    (let ((match (substring-prefix-count-ci s1 start1 end1 s2 start2 end2)))
+    (let ((match (%string-prefix-length-ci s1 start1 end1 s2 start2 end2)))
       (if (= match size1)
 	  ((if (= match size2) proc= proc<) end1)
 	  ((if (= match size2) proc>
@@ -487,15 +706,22 @@
 		   proc< proc>))
 	   (+ start1 match))))))
 
-(define (string-compare s1 s2 proc< proc= proc>)
-  (substring-compare s1 0 (string-length s1)
-		     s2 0 (string-length s2)
-		     proc< proc= proc>))
+(define (string-compare s1 s2 proc< proc= proc> . maybe-starts+ends)
+  (check-arg procedure? proc< string-compare)	; All three continuations
+  (check-arg procedure? proc= string-compare)	; must be procedures.
+  (check-arg procedure? proc> string-compare)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string-compare s1 s2 maybe-starts+ends
+    (%string-compare s1 from1 to1 s2 from2 to2 proc< proc= proc>)))
+
+(define (string-compare-ci s1 s2 proc< proc= proc> . maybe-starts+ends)
+  (check-arg procedure? proc< string-compare-ci)	; All three continuations
+  (check-arg procedure? proc= string-compare-ci)	; must be procedures.
+  (check-arg procedure? proc> string-compare-ci)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string-compare-ci s1 s2 maybe-starts+ends
+    (%string-compare-ci s1 from1 to1 s2 from2 to2 proc< proc= proc>)))
 
-(define (string-compare-ci s1 s2 proc< proc= proc>)
-  (substring-compare-ci s1 0 (string-length s1)
-			s2 0 (string-length s2)
-			proc< proc= proc>))
 
 
 ;;; string=          string<>		string-ci=          string-ci<>
@@ -503,225 +729,242 @@
 ;;; string<=         string>=		string-ci<=         string-ci>=
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 ;;; Simple definitions in terms of the previous comparison funs.
-;;; Inequality predicates return #f or mismatch index.
-;;; I sure hope these defns get integrated.
+;;; I sure hope the %STRING-COMPARE calls get integrated.
 
-(define (string=  s1 s2)
-  (if (eq? s1 s2) (string-length s1)	; Fast path
-      (string-compare s1 s2 (lambda (i) #f) (lambda (i) i) (lambda (i) #f))))
+(define (string= s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string= s1 s2 maybe-starts+ends
+    (if (= (- to1 from1) (- to2 from2))			; Same length?
+	(or (and (eq? s1 s2) (= from1 from2))		; Same string & span
+	    (%string-compare s1 from1 to1 s2 from2 to2	; Char-by-char test
+			     (lambda (i) #f) values (lambda (i) #f)))
+	;; Spans of unequal length can never be equal.
+	#f)))
 
-(define (string<  s1 s2)
-  (and (not (eq? s1 s2))		; Fast path
-       (string-compare s1 s2 (lambda (i) i) (lambda (i) #f) (lambda (i) #f))))
+(define (string<> s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string<> s1 s2 maybe-starts+ends
+    (cond ((not (= (- to1 from1) (- to2 from2))) #t)	; Lengths differ.
+	  ((and (eq? s1 s2) (= from1 from2)) #f)	; Same string & span.
+	  (else (%string-compare s1 from1 to1 s2 from2 to2	; Real test
+				 values
+				 (lambda (i) #f)
+				 values)))))
 
-(define (string>  s1 s2)
-  (and (not (eq? s1 s2))		; Fast path
-       (string-compare s1 s2 (lambda (i) #f) (lambda (i) #f) (lambda (i) i))))
+(define (string< s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string< s1 s2 maybe-starts+ends
+    (cond ((and (eq? s1 s2) (= from1 from2))	; Same string, same start:
+	   (< to1 to2))				; just compare the ends.
 
-(define (string<=  s1 s2)
-  (if (eq? s1 s2) (string-length s1)	; Fast path
-      (string-compare s1 s2 (lambda (i) i) (lambda (i) i) (lambda (i) #f))))
+	  (else					; Otherwise compare the chars.
+	   (%string-compare s1 from1 to1 s2 from2 to2
+			    values
+			    (lambda (i) #f) (lambda (i) #f))))))
 
-(define (string>=  s1 s2)
-  (if (eq? s1 s2) (string-length s1)	; Fast path
-      (string-compare s1 s2 (lambda (i) #f) (lambda (i) i) (lambda (i) i))))
+(define (string> s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string> s1 s2 maybe-starts+ends
+    (cond ((and (eq? s1 s2) (= from1 from2))	; Same string, same start:
+	   (> to1 to2))				; just compare the ends.
 
-(define (string<>  s1 s2) 
-  (and (not (eq? s1 s2))		; Fast path
-       (string-compare s1 s2 (lambda (i) i) (lambda (i) #f) (lambda (i) i))))
+	  (else					; Otherwise compare the chars.
+	   (%string-compare s1 from1 to1 s2 from2 to2
+			    (lambda (i) #f) (lambda (i) #f)
+			    values)))))
 
+(define (string<= s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string<= s1 s2 maybe-starts+ends
+    (cond ((and (eq? s1 s2) (= from1 from2))	; Same string, same start:
+	   (<= to1 to2))			; just compare the ends.
 
-(define (string-ci=  s1 s2)
-  (if (eq? s1 s2) (string-length s1)	; Fast path
-      (string-compare-ci s1 s2 (lambda (i) #f) (lambda (i) i) (lambda (i) #f))))
+	  (else					; Otherwise compare the chars.
+	   (%string-compare s1 from1 to1 s2 from2 to2
+			    values values
+			    (lambda (i) #f))))))
 
-(define (string-ci<  s1 s2)
-  (and (not (eq? s1 s2))		; Fast path
-       (string-compare-ci s1 s2 (lambda (i) i) (lambda (i) #f) (lambda (i) #f))))
+(define (string>= s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string>= s1 s2 maybe-starts+ends
+    (cond ((and (eq? s1 s2) (= from1 from2))	; Same string, same start:
+	   (>= to1 to2))			; just compare the ends.
 
-(define (string-ci>  s1 s2)
-  (and (not (eq? s1 s2))		; Fast path
-       (string-compare-ci s1 s2 (lambda (i) #f) (lambda (i) #f) (lambda (i) i))))
+	  (else					; Otherwise compare the chars.
+	   (%string-compare s1 from1 to1 s2 from2 to2
+			    (lambda (i) #f)
+			    values values)))))
 
-(define (string-ci<=  s1 s2)
-  (if (eq? s1 s2) (string-length s1)	; Fast path
-      (string-compare-ci s1 s2 (lambda (i) i) (lambda (i) i) (lambda (i) #f))))
+(define (string-ci= s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string-ci= s1 s2 maybe-starts+ends
+    (if (= (- to1 from1) (- to2 from2))			; Same length?
+	(or (and (eq? s1 s2) (= from1 from2))		; Same string & span
+	    (%string-compare-ci s1 from1 to1 s2 from2 to2	; Char-by-char test
+				(lambda (i) #f) values (lambda (i) #f)))
+	;; Spans of unequal length can never be equal.
+	#f)))
 
-(define (string-ci>=  s1 s2)
-  (if (eq? s1 s2) (string-length s1)	; Fast path
-      (string-compare-ci s1 s2 (lambda (i) #f) (lambda (i) i) (lambda (i) i))))
+(define (string-ci<> s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string-ci<> s1 s2 maybe-starts+ends
+    (cond ((not (= (- to1 from1) (- to2 from2))) #t)	; Lengths differ.
+	  ((and (eq? s1 s2) (= from1 from2)) #f)	; Same string & span.
+	  (else (%string-compare-ci s1 from1 to1 s2 from2 to2	; Real test
+				    values
+				    (lambda (i) #f)
+				    values)))))
 
-(define (string-ci<>  s1 s2)
-  (and (not (eq? s1 s2))		; Fast path
-       (string-compare-ci s1 s2 (lambda (i) i) (lambda (i) #f) (lambda (i) i))))
+(define (string-ci< s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string-ci< s1 s2 maybe-starts+ends
+    (cond ((and (eq? s1 s2) (= from1 from2))	; Same string, same start:
+	   (< to1 to2))				; just compare the ends.
 
+	  (else					; Otherwise compare the chars.
+	   (%string-compare-ci s1 from1 to1 s2 from2 to2
+			       values
+			       (lambda (i) #f) (lambda (i) #f))))))
 
-(define (substring= s1 start1 end1 s2 start2 end2)
-  (substring-compare s1 start1 end1
-		     s2 start2 end2
-		     (lambda (i) #f)
-		     (lambda (i) i)
-		     (lambda (i) #f)))
+(define (string-ci> s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string-ci> s1 s2 maybe-starts+ends
+    (cond ((and (eq? s1 s2) (= from1 from2))	; Same string, same start:
+	   (> to1 to2))				; just compare the ends.
 
-(define (substring<> s1 start1 end1 s2 start2 end2)
-  (substring-compare s1 start1 end1
-		     s2 start2 end2
-		     (lambda (i) i)
-		     (lambda (i) #f)
-		     (lambda (i) i)))
+	  (else					; Otherwise compare the chars.
+	   (%string-compare-ci s1 from1 to1 s2 from2 to2
+			       (lambda (i) #f) (lambda (i) #f)
+			       values)))))
 
-(define (substring< s1 start1 end1 s2 start2 end2)
-  (substring-compare s1 start1 end1
-		     s2 start2 end2
-		     (lambda (i) i)
-		     (lambda (i) #f)
-		     (lambda (i) #f)))
+(define (string-ci<= s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string-ci<= s1 s2 maybe-starts+ends
+    (cond ((and (eq? s1 s2) (= from1 from2))	; Same string, same start:
+	   (<= to1 to2))			; just compare the ends.
 
-(define (substring> s1 start1 end1 s2 start2 end2)
-  (substring< s2 start2 end2 s1 start1 end1))
+	  (else					; Otherwise compare the chars.
+	   (%string-compare-ci s1 from1 to1 s2 from2 to2
+			       values values
+			       (lambda (i) #f))))))
 
-(define (substring<= s1 start1 end1 s2 start2 end2)
-  (substring-compare s1 start1 end1
-		     s2 start2 end2
-		     (lambda (i) i)
-		     (lambda (i) i)
-		     (lambda (i) #f)))
-
-(define (substring>= s1 start1 end1 s2 start2 end2)
-  (substring<= s2 start2 end2 s1 start1 end1))
-
-(define (substring-ci= s1 start1 end1 s2 start2 end2)
-  (substring-compare-ci s1 start1 end1
-			s2 start2 end2
-			(lambda (i) #f)
-			(lambda (i) i)
-			(lambda (i) #f)))
-
-(define (substring-ci<> s1 start1 end1 s2 start2 end2)
-  (substring-compare-ci s1 start1 end1
-			s2 start2 end2
-			(lambda (i) i)
-			(lambda (i) #f)
-			(lambda (i) i)))
-
-(define (substring-ci< s1 start1 end1 s2 start2 end2)
-  (substring-compare-ci s1 start1 end1
-			s2 start2 end2
-			(lambda (i) i)
-			(lambda (i) #f)
-			(lambda (i) #f)))
-
-(define (substring-ci> s1 start1 end1 s2 start2 end2)
-  (substring-ci< s2 start2 end2 s1 start1 end1))
-
-(define (substring-ci<= s1 start1 end1 s2 start2 end2)
-  (substring-compare-ci s1 start1 end1
-			s2 start2 end2
-			(lambda (i) i)
-			(lambda (i) i)
-			(lambda (i) #f)))
-
-(define (substring-ci>= s1 start1 end1 s2 start2 end2)
-  (substring-ci<= s2 start2 end2 s1 start1 end1))
+(define (string-ci>= s1 s2 . maybe-starts+ends)
+  (let-string-start+end2 (from1 to1 from2 to2)
+			 string-ci>= s1 s2 maybe-starts+ends
+    (cond ((and (eq? s1 s2) (= from1 from2))	; Same string, same start:
+	   (>= to1 to2))			; just compare the ends.
 
+	  (else					; Otherwise compare the chars.
+	   (%string-compare-ci s1 from1 to1 s2 from2 to2
+			       (lambda (i) #f)
+			       values values)))))
 
 
+;;; Hash
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; Compute (c[n-1] + 37 c[n-2] + 37^2 c[n-3] + ...) modulo BOUND, where
+;;; c[i] is the code of char i, with sleaze thrown in to keep intermediate
+;;; values small. (We do the calculation with just enough bits to represent
+;;; BOUND, masking off high bits at each step. If this screws up any important
+;;; properties of the hash function I'd like to hear about it. -Olin)
+;;;
+;;; If you keep BOUND small enough, the intermediate calculations will 
+;;; always be fixnums. How small is dependent on the underlying Scheme system; 
+;;; we use a default BOUND of 2^22 = 4194304, which should hack it in
+;;; Schemes that give you at least 29 signed bits for fixnums. The core 
+;;; calculation that you don't want to overflow is, worst case,
+;;;     (+ 65535 (* 37 (- bound 1)))
+;;; where 65535 is the max character code. Choose the default BOUND to be the
+;;; biggest power of two that won't cause this expression to fixnum overflow, 
+;;; and everything will be copacetic.
+
+(define (%string-hash s char->int bound start end)
+  ;; MASK is an all-ones bit pattern 2^k - 1 (k >= 16) that covers BOUND-1.
+  (let ((mask (do ((m #x10000 (+ m m)))	; Start at 2^16 & keep doubling.
+		  ((>= m bound) (- m 1)))))
+    (let scan ((idx start) (acc 0))
+      (if (>= idx end) (modulo acc bound)
+	  (let ((code (char->int (string-ref s idx))))
+	    (scan (+ idx 1) (bitwise-and mask (+ (* 37 acc) code))))))))
+
+(define (string-hash s . maybe-bound+start+end)
+  (let-optionals* maybe-bound+start+end
+      ((bound 4194304 (and (integer? bound) (exact? bound) (<= 0 bound)))
+       rest)				; REST holds the optional [start end].
+    ;; A BOUND of zero is a request for the default, 4194304.
+    (let ((modulus (if (zero? bound) 4194304 bound)))
+      (let-string-start+end (from to) string-hash s rest
+        (%string-hash s char->integer modulus from to)))))
+
+(define (string-hash-ci s . maybe-bound+start+end)
+  (let-optionals* maybe-bound+start+end ((bound 4194304 (and (integer? bound)
+							     (exact? bound)
+							     (<= 0 bound)))
+					 rest)
+    (let ((bound (if (zero? bound) 4194304 bound)))	; 0 means default.
+      (let-string-start+end (start end) string-hash-ci s rest
+        (%string-hash s (lambda (c) (char->integer (char-downcase c)))
+		      bound start end)))))
+
 ;;; Case hacking
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
-;;; string-upper-case?
-;;; string-lower-case?
-;;;
 ;;; string-upcase  s [start end]
 ;;; string-upcase! s [start end]
 ;;; string-downcase  s [start end]
 ;;; string-downcase! s [start end]
 ;;;
-;;; capitalize-string  s [start end]
-;;; capitalize-string! s [start end]
-;;;   Uppercase first alphanum char, lowercase rest.
-;;;
-;;; capitalize-words  s [start end]
-;;; capitalize-words! s [start end]
-;;;   Capitalize every contiguous alphanum sequence: uppercase
+;;; string-titlecase  s [start end]
+;;; string-titlecase! s [start end]
+;;;   Capitalize every contiguous alpha sequence: titlecase
 ;;;   first char, lowercase rest.
 
-;;; These two use a different definition of an "upper-/lower-case string"
-;;; than MIT Scheme uses:
-
-(define (string-upper-case? s . maybe-start+end)
-  (not (apply string-any char-lower-case? s maybe-start+end)))
-
-(define (string-lower-case? s . maybe-start+end)
-  (not (apply string-any char-upper-case? s maybe-start+end)))
-
-
 (define (string-upcase  s . maybe-start+end)
-  (apply string-map char-upcase s maybe-start+end))
+  (let-string-start+end (start end) string-upcase s maybe-start+end
+    (%string-map char-upcase s start end)))
 
 (define (string-upcase! s . maybe-start+end)
-  (apply string-map! char-upcase s maybe-start+end))
+  (let-string-start+end (start end) string-upcase! s maybe-start+end
+    (%string-map! char-upcase s start end)))
 
 (define (string-downcase  s . maybe-start+end)
-  (apply string-map char-downcase s maybe-start+end))
+  (let-string-start+end (start end) string-downcase s maybe-start+end
+    (%string-map char-downcase s start end)))
 
 (define (string-downcase! s . maybe-start+end)
-  (apply string-map! char-downcase s maybe-start+end))
+  (let-string-start+end (start end) string-downcase! s maybe-start+end
+    (%string-map! char-downcase s start end)))
 
-
-;;; capitalize-string  s [start end]
-;;; capitalize-string! s [start end]
-;;;   Uppercase first alphanum char, lowercase rest.
-
-(define (really-capitalize-string! s start end)
-  (cond ((string-index s char-set:alphanumeric start end) =>
-         (lambda (i)
-	   (string-set! s i (char-upcase (string-ref s i)))
-	   (string-downcase! s i)))))
-
-(define (capitalize-string! s . maybe-start+end)
-  (let-start+end (start end) capitalize-string! s maybe-start+end
-    (really-capitalize-string! s start end)))
-
-(define (capitalize-string s . maybe-start+end)
-  (let-start+end (start end) capitalize-string s maybe-start+end
-    (let ((ans (substringx s start end)))
-      (really-capitalize-string! ans 0 (- end start))
-      ans)))
-
-;;; capitalize-words  s [start end]
-;;; capitalize-words! s [start end]
-;;;   Capitalize every contiguous alphanum sequence: uppercase
-;;;   first char, lowercase rest.
-
-(define (really-capitalize-words! s start end)
+(define (%string-titlecase! s start end)
   (let lp ((i start))
-    (cond ((string-index s char-set:alphanumeric i end) =>
+    (cond ((string-index s char-cased? i end) =>
            (lambda (i)
-	     (string-set! s i (char-upcase (string-ref s i)))
+	     (string-set! s i (char-titlecase (string-ref s i)))
 	     (let ((i1 (+ i 1)))
-	       (cond ((string-skip s char-set:alphanumeric i1 end) =>
+	       (cond ((string-skip s char-cased? i1 end) =>
 		      (lambda (j)
 			(string-downcase! s i1 j)
 			(lp (+ j 1))))
 		     (else (string-downcase! s i1 end)))))))))
 
-(define (capitalize-words! s . maybe-start+end)
-  (let-start+end (start end) capitalize-string! s maybe-start+end
-    (really-capitalize-words! s start end)))
+(define (string-titlecase! s . maybe-start+end)
+  (let-string-start+end (start end) string-titlecase! s maybe-start+end
+    (%string-titlecase! s start end)))
 
-(define (capitalize-words s . maybe-start+end)
-  (let-start+end (start end) capitalize-string! s maybe-start+end
-    (let ((ans (substringx s start end)))
-      (really-capitalize-words! ans 0 (- end start))
+(define (string-titlecase s . maybe-start+end)	; Pure variant: S is not modified.
+  (let-string-start+end (start end) string-titlecase s maybe-start+end
+    (let ((ans (substring s start end)))	; Copy S[start,end), then fix case in the copy.
+      (%string-titlecase! ans 0 (- end start))
       ans)))
 
-
 
 ;;; Cutting & pasting strings
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 ;;; string-take string nchars
 ;;; string-drop string nchars
 ;;;
+;;; string-take-right string nchars
+;;; string-drop-right string nchars
+;;;
 ;;; string-pad string k [char start end] 
 ;;; string-pad-right string k [char start end] 
 ;;; 
@@ -733,67 +976,80 @@
 ;;; say what you want to trim.
 
 (define (string-take s n)
-  (if (> n 0)
-      (substringx s 0 n)
-      (let ((len (string-length s)))
-	(substringx s (+ len n) len))))
+  (check-arg string? s string-take)
+  (check-arg (lambda (val) (and (integer? n) (exact? n)
+				(<= 0 n (string-length s))))
+	     n string-take)
+  (%substring/shared s 0 n))
+
+(define (string-take-right s n)
+  (check-arg string? s string-take-right)
+  (let ((len (string-length s)))
+    (check-arg (lambda (val) (and (integer? n) (exact? n) (<= 0 n len)))
+	       n string-take-right)
+    (%substring/shared s (- len n) len)))
 
 (define (string-drop s n)
+  (check-arg string? s string-drop)
   (let ((len (string-length s)))
-    (if (> n 0)
-	(substringx s n len)
-	(substringx s 0 (+ len n)))))
+    (check-arg (lambda (val) (and (integer? n) (exact? n) (<= 0 n len)))
+	       n string-drop)
+  (%substring/shared s n len)))
 
-(define (string-trim s . args)
-  (let-optionals args ((criteria char-set:whitespace)
-		       (start 0)
-		       (end (string-length s)))
-    (cond ((string-skip s criteria start end) =>
-	   (lambda (i) (substringx s i end)))
-	  (else ""))))
-
-(define (string-trim-right s . args)
-  (let-optionals args ((criteria char-set:whitespace)
-		       (start 0)
-		       (end (string-length s)))
-    (cond ((string-skip-right s criteria end start) =>
-	   (lambda (i) (substringx s 0 (+ 1 i))))
-	  (else ""))))
-
-(define (string-trim-both s . args)
-  (let-optionals args ((criteria char-set:whitespace)
-		       (start 0)
-		       (end (string-length s)))
-    (cond ((string-skip s criteria start end) =>
-	   (lambda (i) (substringx s i (+ 1 (string-skip-right s criteria end)))))
-	  (else ""))))
+(define (string-drop-right s n)
+  (check-arg string? s string-drop-right)
+  (let ((len (string-length s)))
+    (check-arg (lambda (val) (and (integer? n) (exact? n) (<= 0 n len)))
+	       n string-drop-right)
+    (%substring/shared s 0 (- len n))))
 
 
-(define (string-pad-right s n . args)
-  (let-optionals args ((char #\space) (start 0) (end (string-length s)))
-    (check-substring-spec string-pad-right s start end)
-    (let ((len (- end start)))
-      (cond ((= n len)						; No pad.
-	     (if (zero? start) s (substringx s start end)))
+(define (string-trim s . criterion+start+end)
+  (let-optionals* criterion+start+end ((criterion char-set:whitespace) rest)
+    (let-string-start+end (start end) string-trim s rest
+      (cond ((string-skip s criterion start end) =>
+	     (lambda (i) (%substring/shared s i end)))
+	    (else "")))))
 
-	    ((< n len) (substringx s start (+ start n)))	; Trim.
+(define (string-trim-right s . criterion+start+end)	; Result is drawn from S[start,end) only.
+  (let-optionals* criterion+start+end ((criterion char-set:whitespace) rest)
+    (let-string-start+end (start end) string-trim-right s rest
+      (cond ((string-skip-right s criterion start end) =>	; => I, rightmost char to keep.
+	     (lambda (i) (%substring/shared s start (max start (+ 1 i)))))	; MAX: never end left of START.
+	    (else "")))))	; Every char in the span satisfied CRITERION.
 
-	    (else (let ((ans (make-string n char)))
-		    (string-copy! ans 0 s start end)
-		    ans))))))
+(define (string-trim-both s . criterion+start+end)
+  (let-optionals* criterion+start+end ((criterion char-set:whitespace) rest)
+    (let-string-start+end (start end) string-trim-both s rest
+      (cond ((string-skip s criterion start end) =>
+	     (lambda (i)
+	       (%substring/shared s i (+ 1 (string-skip-right s criterion i end)))))
+	    (else "")))))
 
-(define (string-pad s n . args)
-  (let-optionals args ((char #\space) (start 0) (end (string-length s)))
-    (check-substring-spec string-pad s start end)
-    (let ((len (- end start)))
-      (cond ((= n len)						; No pad.
-	     (if (zero? start) s (substringx s start end)))
 
-	    ((< n len) (substringx s  (- end n) end))		; Trim.
+(define (string-pad-right s n . char+start+end)
+  (let-optionals* char+start+end ((char #\space (char? char)) rest)
+    (let-string-start+end (start end) string-pad-right s rest
+      (check-arg (lambda (n) (and (integer? n) (exact? n) (<= 0 n)))
+		 n string-pad-right)
+      (let ((len (- end start)))
+	(if (<= n len)
+	    (%substring/shared s start (+ start n))
+	    (let ((ans (make-string n char)))
+	      (%string-copy! ans 0 s start end)
+	      ans))))))
 
-	    (else (let ((ans (make-string n char)))
-		    (string-copy! ans (- n len) s start end)
-		    ans))))))
+(define (string-pad s n . char+start+end)
+  (let-optionals* char+start+end ((char #\space (char? char)) rest)
+    (let-string-start+end (start end) string-pad s rest
+      (check-arg (lambda (n) (and (integer? n) (exact? n) (<= 0 n)))
+		 n string-pad)
+      (let ((len (- end start)))
+	(if (<= n len)
+	    (%substring/shared s (- end n) end)
+	    (let ((ans (make-string n char)))
+	      (%string-copy! ans (- n len) s start end)
+	      ans))))))
 
 
 
@@ -802,30 +1058,30 @@
 ;;; string-delete char/char-set/pred string [start end]
 ;;; string-filter char/char-set/pred string [start end]
 ;;;
-;;; If the filter criteria is a char or char-set, we scan the string twice
-;;;   with string-fold -- once to determine the length of the result string, 
+;;; If the criterion is a char or char-set, we scan the string twice with
+;;;   string-fold -- once to determine the length of the result string, 
 ;;;   and once to do the filtered copy.
-;;; If the filter criteria is a predicate, we don't do this double-scan
-;;;   strategy, because the predicate might have side-effects or be very
-;;;   expensive to compute. So we preallocate a temp buffer pessimistically,
-;;;   and only do one scan over S. This is likely to be faster and more
-;;;   space-efficient than consing a list.
+;;; If the criterion is a predicate, we don't do this double-scan strategy, 
+;;;   because the predicate might have side-effects or be very expensive to
+;;;   compute. So we preallocate a temp buffer pessimistically, and only do
+;;;   one scan over S. This is likely to be faster and more space-efficient
+;;;   than consing a list.
 
-(define (string-delete criteria s . maybe-start+end)
-  (let-start+end (start end) string-delete s maybe-start+end
-    (if (procedure? criteria)
+(define (string-delete criterion s . maybe-start+end)
+  (let-string-start+end (start end) string-delete s maybe-start+end
+    (if (procedure? criterion)
 	(let* ((slen (- end start))
 	       (temp (make-string slen))
 	       (ans-len (string-fold (lambda (c i)
-				       (if (criteria c) i
+				       (if (criterion c) i
 					   (begin (string-set! temp i c)
 						  (+ i 1))))
 				     0 s start end)))
-	  (if (= ans-len slen) temp (substringx temp 0 ans-len)))
+	  (if (= ans-len slen) temp (substring temp 0 ans-len)))
 
-	(let* ((cset (cond ((char-set? criteria) criteria)
-			   ((char? criteria) (char-set criteria))
-			   (else (error "string-delete criteria not predicate, char or char-set" criteria))))
+	(let* ((cset (cond ((char-set? criterion) criterion)
+			   ((char? criterion) (char-set criterion))
+			   (else (error "string-delete criterion not predicate, char or char-set" criterion))))
 	       (len (string-fold (lambda (c i) (if (char-set-contains? cset c)
 						   i
 						   (+ i 1)))
@@ -838,22 +1094,22 @@
 		       0 s start end)
 	  ans))))
 
-(define (string-filter criteria s . maybe-start+end)
-  (let-start+end (start end) string-filter s maybe-start+end
-    (if (procedure? criteria)
+(define (string-filter criterion s . maybe-start+end)
+  (let-string-start+end (start end) string-filter s maybe-start+end
+    (if (procedure? criterion)
 	(let* ((slen (- end start))
 	       (temp (make-string slen))
 	       (ans-len (string-fold (lambda (c i)
-				       (if (criteria c)
+				       (if (criterion c)
 					   (begin (string-set! temp i c)
 						  (+ i 1))
 					   i))
 				     0 s start end)))
-	  (if (= ans-len slen) temp (substringx temp 0 ans-len)))
+	  (if (= ans-len slen) temp (substring temp 0 ans-len)))
 
-	(let* ((cset (cond ((char-set? criteria) criteria)
-			   ((char? criteria) (char-set criteria))
-			   (else (error "string-delete criteria not predicate, char or char-set" criteria))))
+	(let* ((cset (cond ((char-set? criterion) criterion)
+			   ((char? criterion) (char-set criterion))	; Single char => singleton set.
+			   (else (error "string-filter criterion not predicate, char or char-set" criterion))))
 
 	       (len (string-fold (lambda (c i) (if (char-set-contains? cset c)
 						   (+ i 1)
@@ -867,104 +1123,126 @@
 		       0 s start end)
 	  ans))))
 
-
 
 ;;; String search
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 ;;; string-index       string char/char-set/pred [start end]
-;;; string-index-right string char/char-set/pred [end start]
+;;; string-index-right string char/char-set/pred [start end]
 ;;; string-skip        string char/char-set/pred [start end]
-;;; string-skip-right  string char/char-set/pred [end start]
-;;;     Note the odd start/end ordering of index-right and skip-right params.
+;;; string-skip-right  string char/char-set/pred [start end]
+;;; string-count       char/char-set/pred string [start end]
 ;;;     There's a lot of replicated code here for efficiency.
 ;;;     For example, the char/char-set/pred discrimination has
 ;;;     been lifted above the inner loop of each proc.
 
-(define (string-index str criteria . maybe-start+end)
-  (let-start+end (start end) string-index str maybe-start+end
-    (cond ((char? criteria)
+(define (string-index str criterion . maybe-start+end)
+  (let-string-start+end (start end) string-index str maybe-start+end
+    (cond ((char? criterion)
 	   (let lp ((i start))
 	     (and (< i end)
-		  (if (char=? criteria (string-ref str i)) i
+		  (if (char=? criterion (string-ref str i)) i
 		      (lp (+ i 1))))))
-	  ((char-set? criteria)
+	  ((char-set? criterion)
 	   (let lp ((i start))
 	     (and (< i end)
-		  (if (char-set-contains? criteria (string-ref str i)) i
+		  (if (char-set-contains? criterion (string-ref str i)) i
 		      (lp (+ i 1))))))
-	  ((procedure? criteria)
+	  ((procedure? criterion)
 	   (let lp ((i start))
 	     (and (< i end)
-		  (if (criteria (string-ref str i)) i
+		  (if (criterion (string-ref str i)) i
 		      (lp (+ i 1))))))
 	  (else (error "Second param is neither char-set, char, or predicate procedure."
-		       string-index criteria)))))
+		       string-index criterion)))))
 
-(define (string-index-right str criteria . maybe-end+start)
-  (let-optionals maybe-end+start ((start 0) (end (string-length str)))
-    (check-substring-spec string-index-right str start end)
-    (cond ((char? criteria)
+(define (string-index-right str criterion . maybe-start+end)	; Rightmost match in STR[start,end), or #f.
+  (let-string-start+end (start end) string-index-right str maybe-start+end
+    (cond ((char? criterion)
 	   (let lp ((i (- end 1)))
-	     (and (>= i 0)
-		  (if (char=? criteria (string-ref str i)) i
+	     (and (>= i start)	; Scan right-to-left, but never left of START.
+		  (if (char=? criterion (string-ref str i)) i
 		      (lp (- i 1))))))
-	  ((char-set? criteria)
+	  ((char-set? criterion)
 	   (let lp ((i (- end 1)))
-	     (and (>= i 0)
-		  (if (char-set-contains? criteria (string-ref str i)) i
+	     (and (>= i start)	; Same lower bound as the char case.
+		  (if (char-set-contains? criterion (string-ref str i)) i
 		      (lp (- i 1))))))
-	  ((procedure? criteria)
+	  ((procedure? criterion)
 	   (let lp ((i (- end 1)))
-	     (and (>= i 0)
-		  (if (criteria (string-ref str i)) i
+	     (and (>= i start)	; Same lower bound as the char case.
+		  (if (criterion (string-ref str i)) i
 		      (lp (- i 1))))))
 	  (else (error "Second param is neither char-set, char, or predicate procedure."
-		       string-index-right criteria)))))
+		       string-index-right criterion)))))
 
-(define (string-skip str criteria . maybe-start+end)
-  (let-start+end (start end) string-skip str maybe-start+end
-    (cond ((char? criteria)
+(define (string-skip str criterion . maybe-start+end)
+  (let-string-start+end (start end) string-skip str maybe-start+end
+    (cond ((char? criterion)
 	   (let lp ((i start))
 	     (and (< i end)
-		  (if (char=? criteria (string-ref str i))
+		  (if (char=? criterion (string-ref str i))
 		      (lp (+ i 1))
 		      i))))
-	  ((char-set? criteria)
+	  ((char-set? criterion)
 	   (let lp ((i start))
 	     (and (< i end)
-		  (if (char-set-contains? criteria (string-ref str i))
+		  (if (char-set-contains? criterion (string-ref str i))
 		      (lp (+ i 1))
 		      i))))
-	  ((char-set? criteria)
+	  ((procedure? criterion)
 	   (let lp ((i start))
 	     (and (< i end)
-		  (if (criteria (string-ref str i)) (lp (+ i 1))
+		  (if (criterion (string-ref str i)) (lp (+ i 1))
 		      i))))
 	  (else (error "Second param is neither char-set, char, or predicate procedure."
-		       string-skip criteria)))))
+		       string-skip criterion)))))
 
-(define (string-skip-right str criteria . maybe-end+start)
-  (let-optionals maybe-end+start ((start 0) (end (string-length str)))
-    (check-substring-spec string-index-right str start end)
-    (cond ((char? criteria)
+(define (string-skip-right str criterion . maybe-start+end)	; Rightmost non-match in STR[start,end), or #f.
+  (let-string-start+end (start end) string-skip-right str maybe-start+end
+    (cond ((char? criterion)
 	   (let lp ((i (- end 1)))
-	     (and (>= i 0)
-		  (if (char=? criteria (string-ref str i))
+	     (and (>= i start)	; Scan right-to-left, but never left of START.
+		  (if (char=? criterion (string-ref str i))
 		      (lp (- i 1))
 		      i))))
-	  ((char-set? criteria)
+	  ((char-set? criterion)
 	   (let lp ((i (- end 1)))
-	     (and (>= i 0)
-		  (if (char-set-contains? criteria (string-ref str i))
+	     (and (>= i start)	; Same lower bound as the char case.
+		  (if (char-set-contains? criterion (string-ref str i))
 		      (lp (- i 1))
 		      i))))
-	  ((procedure? criteria)
+	  ((procedure? criterion)
 	   (let lp ((i (- end 1)))
-	     (and (>= i 0)
-		  (if (criteria (string-ref str i)) (lp (- i 1))
+	     (and (>= i start)	; Same lower bound as the char case.
+		  (if (criterion (string-ref str i)) (lp (- i 1))
 		      i))))
-	  (else (error "CRITERIA param is neither char-set or char."
-		       string-skip-right criteria)))))
+	  (else (error "CRITERION param is neither char-set or char."
+		       string-skip-right criterion)))))
+
+
+(define (string-count criterion s . maybe-start+end)
+  (let-string-start+end (start end) string-count s maybe-start+end
+    (cond ((char? criterion)
+	   (do ((i start (+ i 1))
+		(count 0 (if (char=? criterion (string-ref s i))
+			     (+ count 1)
+			     count)))
+	       ((>= i end) count)))
+
+	  ((char-set? criterion)
+	   (do ((i start (+ i 1))
+		(count 0 (if (char-set-contains? criterion (string-ref s i))
+			     (+ count 1)
+			     count)))
+	       ((>= i end) count)))
+
+	  ((procedure? criterion)
+	   (do ((i start (+ i 1))
+		(count 0 (if (criterion (string-ref s i)) (+ count 1) count)))
+	       ((>= i end) count)))
+
+	  (else (error "CRITERION param is neither char-set or char."
+		       string-count criterion)))))
 
 
 
@@ -975,146 +1253,251 @@
 ;;; 	Guaranteed to work, even if s1 eq s2.
 
 (define (string-fill! s char . maybe-start+end)
-  (let-start+end (start end) string-fill! s maybe-start+end
+  (check-arg char? char string-fill!)
+  (let-string-start+end (start end) string-fill! s maybe-start+end
     (do ((i (- end 1) (- i 1)))
 	((< i start))
       (string-set! s i char))))
 
 (define (string-copy! to tstart from . maybe-fstart+fend)
-  (let-start+end (fstart fend) string-copy! from maybe-fstart+fend
-    (let ((tend (+ tstart (- fend fstart))))
-      (check-substring-spec string-copy! to tstart tend)
-      (if (> fstart tstart)
-	  (do ((i fstart (+ i 1))
-	       (j tstart (+ j 1)))
-	      ((>= i fend))
-	    (string-set! to j (string-ref from i)))
+  (let-string-start+end (fstart fend) string-copy! from maybe-fstart+fend
+    (check-arg integer? tstart string-copy!)
+    (check-substring-spec string-copy! to tstart (+ tstart (- fend fstart)))
+    (%string-copy! to tstart from fstart fend)))
 
-	  (do ((i (- fend 1) (- i 1))
-	       (j (- tend 1) (- j 1)))
-	      ((< i fstart))
-	    (string-set! to j (string-ref from i)))))))
+;;; Library-internal routine
+(define (%string-copy! to tstart from fstart fend)
+  (if (> fstart tstart)
+      (do ((i fstart (+ i 1))
+	   (j tstart (+ j 1)))
+	  ((>= i fend))
+	(string-set! to j (string-ref from i)))
 
+      (do ((i (- fend 1)                    (- i 1))
+	   (j (+ -1 tstart (- fend fstart)) (- j 1)))
+	  ((< i fstart))
+	(string-set! to j (string-ref from i)))))
 
 
-;;; Returns starting-position or #f if not true.
-;;; This implementation is slow & simple. See below for KMP.
-;;; Boyer-Moore would be nice.
-;(define (substring? substring string . maybe-start+end)
-;  (let-start+end (start end) string substring? maybe-start+end
-;    (if (string-null? substring) start
-;	(let* ((len (string-length substring))
-;	       (i-bound (- end len))
-;	       (char1 (string-ref substring start)))
-;	  (let lp ((i 0))
-;	    (cond ((string-index string char1 i i-bound) =>
-;		   (lambda (i)
-;		     (if (substring= substring 0 len string i (+ i len))
-;			 i
-;			 (lp (+ i 1)))))
-;		  (else #f)))))))
-
 
-;;; Searching for an occurence of a substring
+;;; Returns starting-position in STRING or #f if not true.
+;;; This implementation is slow & simple. It is useful as a "spec" or for
+;;; comparison testing with fancier implementations.
+;;; See below for fast KMP version.
+
+;(define (string-contains string substring . maybe-starts+ends)
+;  (let-string-start+end2 (start1 end1 start2 end2) 
+;                         string-contains string substring maybe-starts+ends
+;    (let* ((len (- end2 start2))
+;	   (i-bound (- end1 len)))
+;      (let lp ((i start1))
+;	(and (<= i i-bound)
+;	     (if (string= string substring i (+ i len) start2 end2)
+;		 i
+;		 (lp (+ i 1))))))))
+
+
+;;; Searching for an occurrence of a substring
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
-;;; This uses the KMP algorithm
-;;;     "Fast Pattern Matching in Strings"
+
+(define (string-contains text pattern . maybe-starts+ends)
+  (let-string-start+end2 (t-start t-end p-start p-end)
+                         string-contains text pattern maybe-starts+ends
+    (%kmp-search pattern text char=? p-start p-end t-start t-end)))
+
+(define (string-contains-ci text pattern . maybe-starts+ends)
+  (let-string-start+end2 (t-start t-end p-start p-end)
+                         string-contains-ci text pattern maybe-starts+ends
+    (%kmp-search pattern text char-ci=? p-start p-end t-start t-end)))
+
+
+;;; Knuth-Morris-Pratt string searching
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; See
+;;;     "Fast pattern matching in strings"
 ;;;     SIAM J. Computing 6(2):323-350 1977
 ;;;     D. E. Knuth, J. H. Morris and V. R. Pratt
 ;;; also described in
-;;;     "Pattern Matching in Strings"
+;;;     "Pattern matching in strings"
 ;;;     Alfred V. Aho
 ;;;     Formal Language Theory - Perspectives and Open Problems
 ;;;     Ronald V. Brook (editor)
 ;;; This algorithm is O(m + n) where m and n are the 
 ;;; lengths of the pattern and string respectively
-;;; Original version of this code by bevan; I have substantially rehacked it.
 
-(define (substring? pattern source . maybe-start+end)
-  (let-start+end (start end) substring? source maybe-start+end
-    (really-substring? char=? pattern source start end)))
+;;; KMP search source[start,end) for PATTERN. Return starting index of
+;;; leftmost match or #f.
 
-(define (substring-ci? pattern source . maybe-start+end)
-  (let-start+end (start end) substring-ci? source maybe-start+end
-    (really-substring? char-ci=? pattern source start end)))
+(define (%kmp-search pattern text c= p-start p-end t-start t-end)
+  (let ((plen (- p-end p-start))
+	(rv (make-kmp-restart-vector pattern c= p-start p-end)))
 
-;;; Compute the Knuth-Morris-Pratt restart vector RV for string PATTERN.  If
+    ;; The search loop. TJ & PJ are redundant state.
+    (let lp ((ti t-start) (pi 0)
+	     (tj (- t-end t-start))	; (- tlen ti) -- how many chars left.
+	     (pj plen))			; (- plen pi) -- how many chars left.
+
+      (if (= pi plen) (- ti plen)			; Win.
+	  
+	  (and (<= pj tj)				; Lose.
+		 
+	       (if (c= (string-ref text ti)		; Search.
+		       (string-ref pattern (+ p-start pi)))
+		   (lp (+ 1 ti) (+ 1 pi) (- tj 1) (- pj 1))	; Advance.
+		   
+		   (let ((pi (vector-ref rv pi)))		; Retreat.
+		     (if (= pi -1)
+			 (lp (+ ti 1)  0   (- tj 1)  plen)	; Punt.
+			 (lp ti        pi  tj        (- plen pi))))))))))
+
+;;; (make-kmp-restart-vector pattern [c= start end]) -> integer-vector
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; Compute the KMP restart vector RV for string PATTERN.  If
 ;;; we have matched chars 0..i-1 of PATTERN against a search string S, and
 ;;; PATTERN[i] doesn't match S[k], then reset i := RV[i], and try again to
 ;;; match S[k].  If RV[i] = -1, then punt S[k] completely, and move on to
-;;; S[k+1] and PATTERN[0].
+;;; S[k+1] and PATTERN[0] -- no possible match of PAT[0..i] contains S[k].
 ;;;
 ;;; In other words, if you have matched the first i chars of PATTERN, but
 ;;; the i+1'th char doesn't match, RV[i] tells you what the next-longest
 ;;; prefix of PATTERN is that you have matched.
 ;;;
-;;; C= is the character comparator -- usefully CHAR= or CHAR-CI=.
+;;; - C= (default CHAR=?) is used to compare characters for equality.
+;;;   Pass in CHAR-CI=? for case-folded string search.
+;;;
+;;; - START & END restrict the pattern to the indicated substring; the
+;;;   returned vector will be of length END - START. The numbers stored
+;;;   in the vector will be values in the range [0,END-START) -- that is,
+;;;   they are valid indices into the restart vector; you have to add START
+;;;   to them to use them as indices into PATTERN.
 ;;;
 ;;; I've split this out as a separate function in case other constant-string
 ;;; searchers might want to use it.
+;;;
+;;; E.g.:
+;;;    a b d  a b x
+;;; #(-1 0 0 -1 1 2)
 
-(define (make-kmp-restart-vector pattern c=)
-  (let* ((plen (string-length pattern))
-	 (rv (make-vector plen)))
-    (if (> plen 0)
-	(let ((plen-1 (- plen 1)))
-	  (vector-set! rv 0 -1)
-	  (let lp ((i 0) (j -1))
-	    (if (< i plen-1)
-		(if (or (= j -1)
-			(c= (string-ref pattern i)
-			    (string-ref pattern j)))
-		    (let ((i (+ 1 i))
-			  (j (+ 1 j)))
-		      (vector-set! rv i j)
-		      (lp i j))
-		    (lp i (vector-ref rv j)))))))
-    rv))
+(define (make-kmp-restart-vector pattern . maybe-c=+start+end)
+  (let-optionals* maybe-c=+start+end
+                  ((c= char=? (procedure? c=))
+		   ((start end) (lambda (args)
+				  (string-parse-start+end make-kmp-restart-vector
+							  pattern args))))
+    (let* ((rvlen (- end start))
+	   (rv (make-vector rvlen -1)))
+      (if (> rvlen 0)
+	  (let ((rvlen-1 (- rvlen 1))
+		(c0 (string-ref pattern start)))
 
-(define (really-substring? c= pattern source start end)
-  (let ((plen (string-length pattern))
-	(rv (make-kmp-restart-vector pattern c=)))
+	    ;; Here's the main loop. We have set rv[0] ... rv[i].
+	    ;; K = I + START -- it is the corresponding index into PATTERN.
+	    (let lp1 ((i 0) (j -1) (k start))	
+	      (if (< i rvlen-1)
 
-    ;; The search loop. SJ & PJ are redundant state.
-    (let lp ((si start) (pi 0)
-	     (sj (- end start))	; (- end si)  -- how many chars left.
-	     (pj plen))		; (- plen pi) -- how many chars left.
+		  (let ((ck (string-ref pattern k)))
+		    ;; lp2 invariant:
+		    ;;   pat[(k-j) .. k-1] matches pat[start .. start+j-1]
+		    ;;   or j = -1.
+		    (let lp2 ((j j))
 
-      (if (= pi plen) (- si plen)			; Win.
+		      (cond ((= j -1)	; No prefix to fall back on: rv[i+1] depends on pat[k+1].
+			     (let ((i1 (+ i 1)))	; -1 if pat[k+1] = pat[start] (a mismatch there can't restart at 0).
+			       (vector-set! rv i1 (if (c= (string-ref pattern (+ k 1)) c0) -1 0))
+			       (lp1 i1 0 (+ k 1))))
 
-	  (and (<= pj sj)				; Lose.
-		     
-	       (if (c= (string-ref source si)		; Search.
-		       (string-ref pattern pi))
-		   (lp (+ 1 si) (+ 1 pi) (- sj 1) (- pj 1))	; Advance.
-			 
-		   (let ((pi (vector-ref rv pi)))		; Retreat.
-		     (if (= pi -1)
-			 (lp (+ si 1)  0   (- sj 1)  plen)	; Punt.
-			 (lp si        pi  sj        (- plen pi))))))))))
+			    ;; pat[(k-j) .. k] matches pat[start..start+j].
+			    ((c= ck (string-ref pattern (+ j start)))
+			     (let* ((i1 (+ 1 i))
+				    (j1 (+ 1 j)))
+			       (vector-set! rv i1 j1)
+			       (lp1 i1 j1 (+ k 1))))
 
+			    (else (lp2 (vector-ref rv j))))))))))
+      rv)))
+
+
+;;; We've matched I chars from PAT. C is the next char from the search string.
+;;; Return the new I after handling C. 
+;;;
+;;; The pattern is (VECTOR-LENGTH RV) chars long, beginning at index PAT-START
+;;; in PAT (PAT-START is usually 0). The I chars of the pattern we've matched
+;;; are 
+;;;     PAT[PAT-START .. PAT-START + I - 1].
+;;;
+;;; It's *not* an oversight that there is no friendly error checking or
+;;; defaulting of arguments. This is a low-level, inner-loop procedure
+;;; that we want integrated/inlined into the point of call.
+
+(define (kmp-step pat rv c i c= p-start)
+  (let lp ((i i))
+    (if (c= c (string-ref pat (+ i p-start)))	; Match =>
+	(+ i 1)					;   Done.
+	(let ((i (vector-ref rv i)))		; Back up in PAT.
+	  (if (= i -1) 0			; Can't back up further.
+	      (lp i))))))			; Keep trying for match.
+
+;;; Zip through S[start,end), looking for a match of PAT. Assume we've
+;;; already matched the first I chars of PAT when we commence at S[start].
+;;; - <0:  If we find a match *ending* at index J, return -J.
+;;; - >=0: If we get to the end of the S[start,end) span without finding
+;;;   a complete match, return the number of chars from PAT we'd matched
+;;;   when we ran off the end.
+;;;
+;;; This is useful for searching *across* buffers -- that is, when your
+;;; input comes in chunks of text. We hand-integrate the KMP-STEP loop
+;;; for speed.
+
+(define (string-kmp-partial-search pat rv s i . c=+p-start+s-start+s-end)
+  (check-arg vector? rv string-kmp-partial-search)
+  (let-optionals* c=+p-start+s-start+s-end
+		  ((c=      char=? (procedure? c=))
+		   (p-start 0 (and (integer? p-start) (exact? p-start) (<= 0 p-start)))
+		   ((s-start s-end) (lambda (args)
+				      (string-parse-start+end string-kmp-partial-search
+							      s args))))
+    (let ((patlen (vector-length rv)))
+      (check-arg (lambda (i) (and (integer? i) (exact? i) (<= 0 i) (< i patlen)))
+		 i string-kmp-partial-search)
+
+      ;; Enough prelude. Here's the actual code.
+      (let lp ((si s-start)		; An index into S.
+	       (vi i))			; An index into RV.
+	(cond ((= vi patlen) (- si))	; Win.
+	      ((= si s-end) vi)		; Ran off the end.
+	      (else			; Match s[si] & loop.
+	       (let ((c (string-ref s si)))
+		 (lp (+ si 1)	
+		     (let lp2 ((vi vi))	; This is just KMP-STEP.
+		       (if (c= c (string-ref pat (+ vi p-start)))
+			   (+ vi 1)
+			   (let ((vi (vector-ref rv vi)))
+			     (if (= vi -1) 0
+				 (lp2 vi)))))))))))))
 
 
 ;;; Misc
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; (string-null? s)
 ;;; (string-reverse  s [start end])
 ;;; (string-reverse! s [start end])
-;;; (string-null? s)
+;;; (reverse-list->string clist)
+;;; (string->list s [start end])
 
 (define (string-null? s) (zero? (string-length s)))
 
 (define (string-reverse s . maybe-start+end)
-  (let-start+end (start end) string-reverse s maybe-start+end
-    (let ((ans (make-string (- end start))))
-      (do ((i (- end 1) (- i 1))
-	   (j start (+ j 1)))
-	  ((< i j))
-	(string-set! ans i (string-ref s j))
+  (let-string-start+end (start end) string-reverse s maybe-start+end
+    (let* ((len (- end start))
+	   (ans (make-string len)))
+      (do ((i start (+ i 1))
+	   (j (- len 1) (- j 1)))
+	  ((< j 0))
 	(string-set! ans j (string-ref s i)))
       ans)))
 
 (define (string-reverse! s . maybe-start+end)
-  (let-start+end (start end) string-reverse! s maybe-start+end
+  (let-string-start+end (start end) string-reverse! s maybe-start+end
     (do ((i (- end 1) (- i 1))
 	 (j start (+ j 1)))
 	((<= i j))
@@ -1133,18 +1516,20 @@
 
 
 ;(define (string->list s . maybe-start+end)
-;  (let-start+end (start end) string->list s maybe-start+end
-;    (do ((i (- end 1) (- i 1))
-;	 (ans '() (cons (string-ref s i) ans)))
-;	((< i start) ans))))
+;  (apply string-fold-right cons '() s maybe-start+end))
 
 (define (string->list s . maybe-start+end)
-  (apply string-fold-right cons '() s maybe-start+end))
+  (let-string-start+end (start end) string->list s maybe-start+end
+    (do ((i (- end 1) (- i 1))
+	 (ans '() (cons (string-ref s i) ans)))
+	((< i start) ans))))
+
+;;; Defined by R5RS, so commented out here.
+;(define (list->string lis) (string-unfold null? car cdr lis))
 
 
-
-;;; string-concat        string-list -> string
-;;; string-concat/shared string-list -> string
+;;; string-concatenate        string-list -> string
+;;; string-concatenate/shared string-list -> string
 ;;; string-append/shared s ... -> string
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 ;;; STRING-APPEND/SHARED has license to return a string that shares storage
@@ -1152,52 +1537,162 @@
 ;;; string amongst its parameters, it is permitted to return that string as
 ;;; its result. STRING-APPEND, by contrast, always allocates new storage.
 ;;;
-;;; STRING-CONCAT & STRING-CONCAT/SHARED are passed a list of strings,
-;;; which they concatenate into a result string. STRING-CONCAT always
-;;; allocates a fresh string; STRING-CONCAT/SHARED may (or may not) return
-;;; a result that shares storage with any of its arguments. In particular,
-;;; if it is applied to a singleton list, it is permitted to return the
-;;; car of that list as its value.
-;;;
-;;; This is portable code, but could be much more efficient w/compiler
-;;; support. Especially the n-ary guys.
+;;; STRING-CONCATENATE & STRING-CONCATENATE/SHARED are passed a list of
+;;; strings, which they concatenate into a result string. STRING-CONCATENATE
+;;; always allocates a fresh string; STRING-CONCATENATE/SHARED may (or may
+;;; not) return a result that shares storage with any of its arguments. In
+;;; particular, if it is applied to a singleton list, it is permitted to
+;;; return the car of that list as its value.
 
-;;; We delete the empty strings from the parameter list before handing
-;;; off to string-concat/shared. I wrote the recursion out by hand instead
-;;; of using list-lib's FILTER or FILTER! to minimize non-R5RS dependencies.
+(define (string-append/shared . strings) (string-concatenate/shared strings))
 
-(define (string-append/shared . strings) (string-concat/shared strings))
+(define (string-concatenate/shared strings)
+  (let lp ((strings strings) (nchars 0) (first #f))
+    (cond ((pair? strings)			; Scan the args, add up total
+	   (let* ((string  (car strings))	; length, remember 1st 
+		  (tail (cdr strings))		; non-empty string.
+		  (slen (string-length string)))
+	     (if (zero? slen)
+		 (lp tail nchars first)
+		 (lp tail (+ nchars slen) (or first strings)))))
 
-(define (string-concat/shared strings)
-  (let ((strings (let recur ((strings strings))		; Delete empty strings.
-		   (if (pair? strings)
-		       (let ((s (car strings))
-			     (tail (recur (cdr strings))))
-			 (if (string-null? s) tail (cons s tail)))
-		       '()))))
+	  ((zero? nchars) "")
 
-    (cond ((not (pair? strings)) "")			; () => "".
-	  ((not (pair? (cdr strings))) (car strings))	; (s) => s.
-	  (else (string-concat strings)))))		; Allocate & concat.
+	  ;; Just one non-empty string! Return it.
+	  ((= nchars (string-length (car first))) (car first))
+
+	  (else (let ((ans (make-string nchars)))
+		  (let lp ((strings first) (i 0))
+		    (if (pair? strings)
+			(let* ((s (car strings))
+			       (slen (string-length s)))
+			  (%string-copy! ans i s 0 slen)
+			  (lp (cdr strings) (+ i slen)))))
+		  ans)))))
+			
 
 ; Alas, Scheme 48's APPLY blows up if you have many, many arguments.
-;(define (string-concat strings) (apply string-append strings))
+;(define (string-concatenate strings) (apply string-append strings))
 
 ;;; Here it is written out. I avoid using REDUCE to add up string lengths
 ;;; to avoid non-R5RS dependencies.
-(define (string-concat strings)
+(define (string-concatenate strings)
   (let* ((total (do ((strings strings (cdr strings))
 		     (i 0 (+ i (string-length (car strings)))))
 		    ((not (pair? strings)) i)))
 	 (ans (make-string total)))
     (let lp ((i 0) (strings strings))
       (if (pair? strings)
-	  (let ((s (car strings)))
-	    (string-copy! ans i s)
-	    (lp (+ i (string-length s)) (cdr strings)))))
+	  (let* ((s (car strings))
+		 (slen (string-length s)))
+	    (%string-copy! ans i s 0 slen)
+	    (lp (+ i slen) (cdr strings)))))
     ans))
 	  
 
+;;; Defined by R5RS, so commented out here.
+;(define (string-append . strings) (string-concatenate strings))
+
+;;; string-concatenate-reverse        string-list [final-string end] -> string
+;;; string-concatenate-reverse/shared string-list [final-string end] -> string
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; Return
+;;;   (string-concatenate 
+;;;     (reverse
+;;;       (cons (substring final-string 0 end) string-list)))
+
+(define (string-concatenate-reverse string-list . maybe-final+end)
+  (let-optionals* maybe-final+end ((final "" (string? final))
+				   (end (string-length final)
+					(and (integer? end)
+					     (exact? end)
+					     (<= 0 end (string-length final)))))
+    ;; Total up the lengths of the strings in STRING-LIST, then hand off to
+    ;; the allocate-&-fill helper shared with the /SHARED variant.
+    (let ((nchars (do ((rest string-list (cdr rest))
+		       (total 0 (+ total (string-length (car rest)))))
+		      ((not (pair? rest)) total))))
+      (%finish-string-concatenate-reverse nchars string-list final end))))
+
+(define (string-concatenate-reverse/shared string-list . maybe-final+end)
+  (let-optionals* maybe-final+end ((final "" (string? final))
+				   (end (string-length final)
+					(and (integer? end)
+					     (exact? end)
+					     (<= 0 end (string-length final)))))
+    ;; Add up the lengths of all the strings in STRING-LIST; also get a
+    ;; pointer NZLIST into STRING-LIST showing where the first non-zero-length
+    ;; string starts.
+    (let lp ((len 0) (nzlist #f) (lis string-list))
+      (if (pair? lis)
+	  (let ((slen (string-length (car lis))))	; Measure the *current* elt.
+	    (lp (+ len slen)
+		(if (or nzlist (zero? slen)) nzlist lis)
+		(cdr lis)))
+	  ;; List exhausted. Share storage with an argument where possible.
+	  (cond ((zero? len) (substring/shared final 0 end))	; Only FINAL contributes.
+
+		;; LEN > 0, so NZLIST is non-empty. If nothing comes from FINAL
+		;; and exactly one string is non-empty, return that string itself.
+		((and (zero? end) (= len (string-length (car nzlist))))
+		 (car nzlist))
+
+		(else (%finish-string-concatenate-reverse len nzlist final end)))))))
+
+(define (%finish-string-concatenate-reverse len string-list final end)
+  ;; FINAL[0,END) goes at the tail of the answer; the elements of STRING-LIST
+  ;; are then laid down right-to-left in front of it, so the list's first
+  ;; string ends up immediately before the FINAL text.
+  (let ((result (make-string (+ end len))))
+    (%string-copy! result len final 0 end)
+    (do ((rest string-list (cdr rest))
+	 (hi len (- hi (string-length (car rest)))))	; HI = end of next slot.
+	((not (pair? rest)) result)
+      (let* ((str (car rest))
+	     (n (string-length str)))
+	(%string-copy! result (- hi n) str 0 n)))))
+
+
+
+
+;;; string-replace s1 s2 start1 end1 [start2 end2] -> string
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; Replace S1[START1,END1) with S2[START2,END2).
+
+(define (string-replace s1 s2 start1 end1 . maybe-start+end)
+  (check-substring-spec string-replace s1 start1 end1)
+  (let-string-start+end (start2 end2) string-replace s2 maybe-start+end
+    (let* ((len1    (string-length s1))
+	   (inslen  (- end2 start2))		; # chars spliced in from S2.
+	   (tail-at (+ start1 inslen))		; Where S1's tail lands in answer.
+	   (result  (make-string (+ tail-at (- len1 end1)))))
+      (%string-copy! result 0 s1 0 start1)		; S1[0,START1)
+      (%string-copy! result start1 s2 start2 end2)	; S2[START2,END2)
+      (%string-copy! result tail-at s1 end1 len1)	; S1[END1,len)
+      result)))
+
+
+;;; string-tokenize s [token-set start end] -> list
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; Break S up into a list of token strings, where a token is a maximal
+;;; non-empty contiguous sequence of chars belonging to TOKEN-SET (default:
+;;; CHAR-SET:GRAPHIC). (string-tokenize "hello, world") => ("hello," "world")
+
+(define (string-tokenize s . token-chars+start+end)
+  (let-optionals* token-chars+start+end
+                  ((token-chars char-set:graphic (char-set? token-chars)) rest)
+    (let-string-start+end (start end) string-tokenize s rest
+      (let lp ((i end) (ans '()))	; Scan S[START,I) from the right; ANS is consed front-first.
+	(cond ((and (< start i) (string-index-right s token-chars start i)) =>
+	       (lambda (tend-1)		; Index returned by the rightward token-char search.
+		 (let ((tend (+ 1 tend-1)))	; Exclusive end of this token.
+		   (cond ((string-skip-right s token-chars start tend-1) =>
+			  (lambda (tstart-1)	; Index just left of the token's first char.
+			    (lp tstart-1
+				(cons (substring s (+ 1 tstart-1) tend)
+				      ans))))
+			 (else (cons (substring s start tend) ans))))))	; Token reaches back to START.
+	      (else ans))))))		; Nothing (more) to scan: done.
 
 
 ;;; xsubstring s from [to start end] -> string
@@ -1228,33 +1723,36 @@
 ;;; dispensation when FROM=TO.
 
 (define (xsubstring s from . maybe-to+start+end)
+  (check-arg (lambda (val) (and (integer? val) (exact? val)))
+	     from xsubstring)
   (receive (to start end)
            (if (pair? maybe-to+start+end)
-	       (let-start+end (start end) xsubstring s (cdr maybe-to+start+end)
-		 (values (car maybe-to+start+end) start end))
-	       (let ((slen (string-length s)))
+	       (let-string-start+end (start end) xsubstring s (cdr maybe-to+start+end)
+		 (let ((to (car maybe-to+start+end)))
+		   (check-arg (lambda (val) (and (integer? val)
+						 (exact? val)
+						 (<= from val)))
+			      to xsubstring)
+		   (values to start end)))
+	       (let ((slen (string-length (check-arg string? s xsubstring))))
 		 (values (+ from slen) 0 slen)))
     (let ((slen   (- end start))
 	  (anslen (- to  from)))
-      (cond ((< anslen 0)
-	     (error "Illegal FROM/TO spec passed to xsubstring -- FROM > TO."
-		    s from to start end))
-
-	    ((zero? anslen) "")
-	    ((zero? slen) (error "Empty (sub)string passed to xsubstring"
-				  s from to start end))
+      (cond ((zero? anslen) "")
+	    ((zero? slen) (error "Cannot replicate empty (sub)string"
+				  xsubstring s from to start end))
 
 	    ((= 1 slen)		; Fast path for 1-char replication.
 	     (make-string anslen (string-ref s start)))
 
 	    ;; Selected text falls entirely within one span.
 	    ((= (floor (/ from slen)) (floor (/ to slen)))
-	     (substringx s (+ start (modulo from slen))
-			   (+ start (modulo to   slen))))
+	     (substring s (+ start (modulo from slen))
+			  (+ start (modulo to   slen))))
 
 	    ;; Selected text requires multiple spans.
 	    (else (let ((ans (make-string anslen)))
-		    (multispan-repcopy! ans 0 s from to start end)
+		    (%multispan-repcopy! ans 0 s from to start end)
 		    ans))))))
 
 
@@ -1266,10 +1764,15 @@
 ;;; a string on top of itself.
 
 (define (string-xcopy! target tstart s sfrom . maybe-sto+start+end)
+  (check-arg (lambda (val) (and (integer? val) (exact? val)))
+	     sfrom string-xcopy!)
   (receive (sto start end)
            (if (pair? maybe-sto+start+end)
-	       (let-start+end (start end) string-xcopy! s (cdr maybe-sto+start+end)
-		 (values (car maybe-sto+start+end) start end))
+	       (let-string-start+end (start end) string-xcopy! s (cdr maybe-sto+start+end)
+		 (let ((sto (car maybe-sto+start+end)))
+		   (check-arg (lambda (val) (and (integer? val) (exact? val)))
+			      sto string-xcopy!)
+		   (values sto start end)))
 	       (let ((slen (string-length s)))
 		 (values (+ sfrom slen) 0 slen)))
 
@@ -1277,34 +1780,32 @@
 	   (tend (+ tstart tocopy))
 	   (slen (- end start)))
       (check-substring-spec string-xcopy! target tstart tend)
-      (cond ((< tocopy 0)
-	     (error "Illegal FROM/TO spec passed to string-xcopy! -- FROM > TO."
-		    target tstart s sfrom sto start end))
-	    ((zero? tocopy))
-	    ((zero? slen) (error "Empty (sub)string passed to string-xcopy!"
-				  target tstart s sfrom sto start end))
+      (cond ((zero? tocopy))
+	    ((zero? slen) (error "Cannot replicate empty (sub)string"
+				 string-xcopy!
+				 target tstart s sfrom sto start end))
 
 	    ((= 1 slen)			; Fast path for 1-char replication.
 	     (string-fill! target (string-ref s start) tstart tend))
 
 	    ;; Selected text falls entirely within one span.
 	    ((= (floor (/ sfrom slen)) (floor (/ sto slen)))
-	     (string-copy! target tstart s 
-			   (+ start (modulo sfrom slen))
-			   (+ start (modulo sto   slen))))
+	     (%string-copy! target tstart s 
+			    (+ start (modulo sfrom slen))
+			    (+ start (modulo sto   slen))))
 
 	    ;; Multi-span copy.
-	    (else (multispan-repcopy! target tstart s sfrom sto start end))))))
+	    (else (%multispan-repcopy! target tstart s sfrom sto start end))))))
 
 ;;; This is the core copying loop for XSUBSTRING and STRING-XCOPY!
 ;;; Internal -- not exported, no careful arg checking.
-(define (multispan-repcopy! target tstart s sfrom sto start end)
+(define (%multispan-repcopy! target tstart s sfrom sto start end)
   (let* ((slen (- end start))
 	 (i0 (+ start (modulo sfrom slen)))
 	 (total-chars (- sto sfrom)))
 
     ;; Copy the partial span @ the beginning
-    (string-copy! target tstart s i0 end)
+    (%string-copy! target tstart s i0 end)
 		    
     (let* ((ncopied (- end i0))			; We've copied this many.
 	   (nleft (- total-chars ncopied))	; # chars left to copy.
@@ -1315,43 +1816,155 @@
 	   (nspans nspans (- nspans 1)))	; # spans to copy
 	  ((zero? nspans)
 	   ;; Copy the partial-span @ the end & we're done.
-	   (string-copy! target i s start (+ start (- total-chars (- i tstart)))))
+	   (%string-copy! target i s start (+ start (- total-chars (- i tstart)))))
 
-	(string-copy! target i s start end))))) ; Copy a whole span.
+	(%string-copy! target i s start end))))); Copy a whole span.
 
 
 
-;;; (join-strings string-list [delimiter grammar]) => string
+;;; (string-join string-list [delimiter grammar]) => string
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 ;;; Paste strings together using the delimiter string.
 ;;;
 ;;; (join-strings '("foo" "bar" "baz") ":") => "foo:bar:baz"
 ;;;
 ;;; DELIMITER defaults to a single space " "
-;;; GRAMMAR is one of the symbols {infix, suffix} and defaults to 'infix.
+;;; GRAMMAR is one of the symbols {prefix, infix, strict-infix, suffix} 
+;;; and defaults to 'infix.
+;;;
+;;; I could rewrite this more efficiently -- precompute the length of the
+;;; answer string, then allocate & fill it in iteratively. Using 
+;;; STRING-CONCATENATE is less efficient.
 
-;;; (join-strings strings [delim grammar])
+(define (string-join strings . delim+grammar)
+  (let-optionals* delim+grammar ((delim " " (string? delim))
+				 (grammar 'infix))
+    (let ((buildit (lambda (lis final)
+		     (let recur ((lis lis))
+		       (if (pair? lis)
+			   (cons delim (cons (car lis) (recur (cdr lis))))
+			   final)))))
 
-(define (join-strings strings . args)
-  (if (pair? strings)
-      (let-optionals args ((delim " ") (grammar 'infix))
-	(let ((strings (reverse strings)))
-	  (let lp ((strings (cdr strings))
-		   (ans (case grammar
-			  ((infix)  (list (car strings)))
-			  ((suffix) (list (car strings) delim))
-			  (else (error "Illegal join-strings grammar" grammar)))))
-	    (if (pair? strings)
-		(lp (cdr strings)
-		    (cons (car strings) (cons delim ans)))
-	  
-		; All done
-		(string-concat ans)))))
+      (cond ((pair? strings)
+	     (string-concatenate
+	      (case grammar
 
-      ""))	; Special-cased for infix grammar.
+		((infix strict-infix)
+		 (cons (car strings) (buildit (cdr strings) '())))
 
+		((prefix) (buildit strings '()))
+
+		((suffix)
+		 (cons (car strings) (buildit (cdr strings) (list delim))))
+
+		(else (error "Illegal join grammar"
+			     grammar string-join)))))
+
+	     ((not (null? strings))
+	      (error "STRINGS parameter not list." strings string-join))
+
+	     ;; STRINGS is ()
+
+	     ((eq? grammar 'strict-infix)
+	      (error "Empty list cannot be joined with STRICT-INFIX grammar."
+		     string-join))
+
+	     (else "")))))		; Special-cased for infix grammar.
 
 
+;;; Porting & performance-tuning notes
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; See the section at the beginning of this file on external dependencies.
+;;;
+;;; The biggest issue with respect to porting is the LET-OPTIONALS* macro.
+;;; There are many, many optional arguments in this library; the complexity
+;;; of parsing, defaulting & type-testing these parameters is handled with the
+;;; aid of this macro. There are about 15 uses of LET-OPTIONALS*. You can
+;;; rewrite the uses, port the hairy macro definition (which is implemented
+;;; using a Clinger-Rees low-level explicit-renaming macro system), or port
+;;; the simple, high-level definition, which is less efficient.
+;;;
+;;; There is a fair amount of argument checking. This is, strictly speaking,
+;;; unnecessary -- the actual body of the procedures will blow up if, say, a
+;;; START/END index is improper. However, the error message will not be as
+;;; good as if the error were caught at the "higher level." Also, a very, very
+;;; smart Scheme compiler may be able to exploit having the type checks done
+;;; early, so that the actual body of the procedures can assume proper values.
+;;; This isn't likely; this kind of compiler technology isn't common any 
+;;; longer.
+;;; 
+;;; The overhead of optional-argument parsing is irritating. The optional
+;;; arguments must be consed into a rest list on entry, and then parsed out.
+;;; Function call should be a matter of a few register moves and a jump; it
+;;; should not involve heap allocation! Your Scheme system may have a superior
+;;; non-R5RS optional-argument system that can eliminate this overhead. If so,
+;;; then this is a prime candidate for optimising these procedures,
+;;; *especially* the many optional START/END index parameters.
+;;;
+;;; Note that optional arguments are also a barrier to procedure integration.
+;;; If your Scheme system permits you to specify alternate entry points
+;;; for a call when the number of optional arguments is known in a manner
+;;; that enables inlining/integration, this can provide performance 
+;;; improvements.
+;;;
+;;; There is enough *explicit* error checking that *all* string-index
+;;; operations should *never* produce a bounds error. Period. Feel like
+;;; living dangerously? *Big* performance win to be had by replacing
+;;; STRING-REF's and STRING-SET!'s with unsafe equivalents in the loops. 
+;;; Similarly, fixnum-specific operators can speed up the arithmetic done on 
+;;; the index values in the inner loops. The only arguments that are not
+;;; completely error checked are
+;;;   - string lists (complete checking requires time proportional to the
+;;;     length of the list)
+;;;   - procedure arguments, such as char->char maps & predicates.
+;;;     There is no way to check the range & domain of procedures in Scheme.
+;;; Procedures that take these parameters cannot fully check their
+;;; arguments. But all other types to all other procedures are fully
+;;; checked.
+;;;
+;;; This does open up the alternate possibility of simply *removing* these 
+;;; checks, and letting the safe primitives raise the errors. On a dumb
+;;; Scheme system, this would provide speed (by eliminating the redundant
+;;; error checks) at the cost of error-message clarity.
+;;;
+;;; See the comments preceding the hash function code for notes on tuning
+;;; the default bound so that the code never overflows your implementation's
+;;; fixnum size into bignum calculation.
+;;;
+;;; In an interpreted Scheme, some of these procedures, or the internal
+;;; routines with % prefixes, are excellent candidates for being rewritten
+;;; in C. Consider STRING-HASH, %STRING-COMPARE, the 
+;;; %STRING-{SUF,PRE}FIX-LENGTH routines, STRING-COPY!, STRING-INDEX &
+;;; STRING-SKIP (char-set & char cases), SUBSTRING and SUBSTRING/SHARED,
+;;; %KMP-SEARCH, and %MULTISPAN-REPCOPY!.
+;;;
+;;; It would also be nice to have the ability to mark some of these
+;;; routines as candidates for inlining/integration.
+;;; 
+;;; All the %-prefixed routines in this source code are written
+;;; to be called internally to this library. They do *not* perform
+;;; friendly error checks on the inputs; they assume everything is
+;;; proper. They also do not take optional arguments. These two properties
+;;; save calling overhead and enable procedure integration -- but they
+;;; are not appropriate for exported routines.
+
+
+;;; Copyright details
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; The prefix/suffix and comparison routines in this code had (extremely
+;;; distant) origins in MIT Scheme's string lib, and were substantially
+;;; reworked by Olin Shivers (shivers@ai.mit.edu) 9/98. As such, they are
+;;; covered by MIT Scheme's open source copyright. See below for details.
+;;; 
+;;; The KMP string-search code was influenced by implementations written
+;;; by Stephen Bevan, Brian Dehneyer and Will Fitzgerald. However, this
+;;; version was written from scratch by myself.
+;;;
+;;; The remainder of this code was written from scratch by myself for scsh.
+;;; The scsh copyright is a BSD-style open source copyright. See below for
+;;; details.
+;;;     -Olin Shivers
+
 ;;; MIT Scheme copyright terms
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 ;;; This material was developed by the Scheme project at the Massachusetts
@@ -1382,3 +1995,29 @@
 ;;; Technology nor of any adaptation thereof in any advertising,
 ;;; promotional, or sales literature without prior written consent from
 ;;; MIT in each case.
+
+;;; Scsh copyright terms
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; All rights reserved.
+;;; 
+;;; Redistribution and use in source and binary forms, with or without
+;;; modification, are permitted provided that the following conditions
+;;; are met:
+;;; 1. Redistributions of source code must retain the above copyright
+;;;    notice, this list of conditions and the following disclaimer.
+;;; 2. Redistributions in binary form must reproduce the above copyright
+;;;    notice, this list of conditions and the following disclaimer in the
+;;;    documentation and/or other materials provided with the distribution.
+;;; 3. The name of the authors may not be used to endorse or promote products
+;;;    derived from this software without specific prior written permission.
+;;; 
+;;; THIS SOFTWARE IS PROVIDED BY THE AUTHORS ``AS IS'' AND ANY EXPRESS OR
+;;; IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+;;; OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+;;; IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY DIRECT, INDIRECT,
+;;; INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+;;; NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+;;; DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+;;; THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+;;; (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+;;; THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
diff --git a/scsh/lib/string-package.scm b/scsh/lib/string-package.scm
new file mode 100644
index 0000000..e29dc50
--- /dev/null
+++ b/scsh/lib/string-package.scm
@@ -0,0 +1,350 @@
+;;; Complete interface spec for the SRFI-13 string-lib and 	-*- Scheme -*-
+;;; string-lib-internals libraries in the Scheme48 interface
+;;; and module language. The interfaces are fully typed, in
+;;; the Scheme48 type notation. The structure definitions also
+;;; provide a formal description of the external dependencies
+;;; of the source code.
+
+;;; string-lib
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; string-map string-map!
+;;; string-fold       string-unfold
+;;; string-fold-right string-unfold-right 
+;;; string-tabulate string-for-each string-for-each-index
+;;; string-every string-any
+;;; string-hash string-hash-ci
+;;; string-compare string-compare-ci
+;;; string=    string<    string>    string<=    string>=    string<>
+;;; string-ci= string-ci< string-ci> string-ci<= string-ci>= string-ci<> 
+;;; string-downcase  string-upcase  string-titlecase  
+;;; string-downcase! string-upcase! string-titlecase! 
+;;; string-take string-take-right
+;;; string-drop string-drop-right
+;;; string-pad string-pad-right
+;;; string-trim string-trim-right string-trim-both
+;;; string-filter string-delete
+;;; string-index string-index-right 
+;;; string-skip  string-skip-right
+;;; string-count
+;;; string-prefix-length string-prefix-length-ci
+;;; string-suffix-length string-suffix-length-ci
+;;; string-prefix? string-prefix-ci?
+;;; string-suffix? string-suffix-ci?
+;;; string-contains string-contains-ci
+;;; string-fill! string-copy! 
+;;; string-copy substring/shared
+;;; string-reverse string-reverse! reverse-list->string
+;;; string->list
+;;; string-concatenate string-concatenate/shared
+;;; string-concatenate-reverse string-concatenate-reverse/shared
+;;; string-append/shared
+;;; xsubstring string-xcopy!
+;;; string-null?
+;;; string-join
+;;; string-tokenize
+;;; string-replace
+;;; 
+;;; string? make-string string string-length string-ref string-set! 
+;;; string-append list->string
+;;;
+;;; make-kmp-restart-vector string-kmp-partial-search kmp-step
+;;; string-parse-start+end
+;;; string-parse-final-start+end
+;;; let-string-start+end
+;;; check-substring-spec
+;;; substring-spec-ok?
+
+(define-interface string-lib-interface
+  (export
+   ;; string-map proc s [start end] -> s
+   (string-map (proc ((proc (:char) :char)
+		      :string
+		      &opt :exact-integer :exact-integer)
+		     :string))
+
+   ;; string-map! proc s [start end] -> unspecific
+   (string-map! (proc ((proc (:char) :values)
+		       :string
+		       &opt :exact-integer :exact-integer)
+		      :unspecific))
+
+   ;; string-fold       kons knil s [start end] -> value
+   ;; string-fold-right kons knil s [start end] -> value
+   ((string-fold string-fold-right)
+    (proc ((proc (:char :value) :value)
+	   :value :string
+	   &opt :exact-integer :exact-integer)
+	  :value))
+
+   ;; string-unfold       p f g seed [base make-final] -> string
+   ;; string-unfold-right p f g seed [base make-final] -> string
+   ((string-unfold string-unfold-right)	; Export both directions.
+    (proc ((proc (:value) :boolean)	; p: seed -> boolean
+	   (proc (:value) :char)	; f: seed -> char
+	   (proc (:value) :value)	; g: seed -> next seed
+	   :value			; seed
+	   &opt :string (proc (:value) :string))	; base, make-final
+	  :string))
+
+;   Enough is enough.
+;   ;; string-unfoldn p f g seed ... -> string
+;   (string-unfoldn (proc ((procedure :values :boolean)
+;                          (procedure :values :char)
+;                          (procedure :values :values)
+;                          &rest :value)
+;                         :string))
+
+   ;; string-tabulate proc len -> string
+   (string-tabulate (proc ((proc (:exact-integer) :char) :exact-integer)
+			  :string))
+
+   ;; string-for-each       proc s [start end] -> unspecific
+   ;; string-for-each-index proc s [start end] -> unspecific
+   ((string-for-each string-for-each-index)
+    (proc ((proc (:char) :values) :string &opt :exact-integer :exact-integer)
+	  :unspecific))
+
+   ;; string-every pred s [start end]
+   ;; string-any   pred s [start end]
+   (string-every
+    (proc ((proc (:char) :boolean) :string &opt :exact-integer :exact-integer)
+	  :boolean))
+   (string-any
+    (proc ((proc (:char) :boolean) :string &opt :exact-integer :exact-integer)
+	  :value))
+
+   ;; string-hash    s [bound start end]
+   ;; string-hash-ci s [bound start end]
+   ((string-hash string-hash-ci)
+    (proc (:string &opt :exact-integer :exact-integer :exact-integer)
+	  :exact-integer))
+
+   ;; string-compare    string1 string2 lt-proc eq-proc gt-proc [start end]
+   ;; string-compare-ci string1 string2 lt-proc eq-proc gt-proc [start end]
+   ((string-compare string-compare-ci)
+    (proc (:string :string (proc (:exact-integer) :values)
+		           (proc (:exact-integer) :values)
+			   (proc (:exact-integer) :values)
+			   &opt :exact-integer :exact-integer)
+	  :values))
+
+   ;; string< string1 string2 [start1 end1 start2 end2]
+   ((string= string< string> string<= string>= string<>
+     string-ci= string-ci< string-ci> string-ci<= string-ci>= string-ci<>)
+    (proc (:string :string &opt :exact-integer :exact-integer
+		                :exact-integer :exact-integer)
+	  :boolean))
+
+   ;; string-titlecase  string [start end]
+   ;; string-upcase     string [start end]
+   ;; string-downcase   string [start end]
+   ;; string-titlecase! string [start end]
+   ;; string-upcase!    string [start end]
+   ;; string-downcase!  string [start end]
+   ((string-titlecase  string-upcase  string-downcase)
+    (proc (:string &opt :exact-integer :exact-integer) :string))
+   ((string-titlecase! string-upcase! string-downcase!)
+    (proc (:string &opt :exact-integer :exact-integer) :unspecific))
+
+   ;; string-take       string nchars
+   ;; string-drop       string nchars
+   ;; string-take-right string nchars
+   ;; string-drop-right string nchars
+   ((string-take string-drop string-take-right string-drop-right)
+    (proc (:string :exact-integer) :string))
+
+   ;; string-pad       string k [char start end] 
+   ;; string-pad-right string k [char start end] 
+   ((string-pad string-pad-right)
+    (proc (:string :exact-integer &opt :char :exact-integer :exact-integer)
+	  :string))
+
+   ;; string-trim       string [char/char-set/pred start end] 
+   ;; string-trim-right string [char/char-set/pred start end] 
+   ;; string-trim-both  string [char/char-set/pred start end] 
+   ((string-trim string-trim-right string-trim-both)
+    (proc (:string &opt :value :exact-integer :exact-integer)
+	  :string))
+
+   ;; string-filter char/char-set/pred string [start end]
+   ;; string-delete char/char-set/pred string [start end]
+   ((string-filter string-delete)
+    (proc (:value :string &opt :exact-integer :exact-integer) :string))
+
+   ;; string-index       string char/char-set/pred [start end]
+   ;; string-index-right string char/char-set/pred [start end]
+   ;; string-skip        string char/char-set/pred [start end]
+   ;; string-skip-right  string char/char-set/pred [start end]
+   ((string-index string-index-right string-skip string-skip-right)
+    (proc (:string :value &opt :exact-integer :exact-integer)
+	  :value))
+
+   ;; string-count string char/char-set/pred [start end]
+   (string-count (proc (:string :value &opt :exact-integer :exact-integer)
+		       :exact-integer))
+
+   ;; string-prefix-length    string1 string2 [start1 end1 start2 end2]
+   ;; string-suffix-length    string1 string2 [start1 end1 start2 end2]
+   ;; string-prefix-length-ci string1 string2 [start1 end1 start2 end2]
+   ;; string-suffix-length-ci string1 string2 [start1 end1 start2 end2]
+   ((string-prefix-length string-prefix-length-ci
+     string-suffix-length string-suffix-length-ci)
+    (proc (:string :string &opt
+		   :exact-integer :exact-integer :exact-integer :exact-integer)
+	  :exact-integer))
+
+   ;; string-prefix?    string1 string2 [start1 end1 start2 end2]
+   ;; string-suffix?    string1 string2 [start1 end1 start2 end2]
+   ;; string-prefix-ci? string1 string2 [start1 end1 start2 end2]
+   ;; string-suffix-ci? string1 string2 [start1 end1 start2 end2]
+   ((string-prefix? string-prefix-ci?
+     string-suffix? string-suffix-ci?)
+    (proc (:string :string &opt
+		   :exact-integer :exact-integer :exact-integer :exact-integer)
+	  :boolean))
+
+   ;; string-contains    string pattern [s-start s-end p-start p-end]
+   ;; string-contains-ci string pattern [s-start s-end p-start p-end]
+   ((string-contains string-contains-ci)
+    (proc (:string :string &opt :exact-integer :exact-integer
+		                :exact-integer :exact-integer)
+	  :value))
+
+   ;; string-fill! string char [start end]
+   (string-fill! (proc (:string :char &opt :exact-integer :exact-integer)
+		       :unspecific))
+
+   ;; string-copy! to tstart from [fstart fend]
+   (string-copy! (proc (:string :exact-integer :string
+				&opt :exact-integer :exact-integer)
+		       :unspecific))
+
+   ;; string-copy        s [start end] -> string
+   ;; substring/shared   s start [end] -> string
+   (string-copy      (proc (:string &opt :exact-integer :exact-integer) :string))
+   (substring/shared (proc (:string :exact-integer &opt :exact-integer) :string))
+
+   ;; string-reverse  s [start end]
+   ;; string-reverse! s [start end]
+   (string-reverse  (proc (:string &opt :exact-integer :exact-integer) :string))
+   (string-reverse! (proc (:string &opt :exact-integer :exact-integer) :unspecific))
+
+   ;; reverse-list->string char-list
+   ;; string->list s [start end]
+   ;; string-concatenate        string-list
+   ;; string-concatenate/shared string-list
+   ;; string-append/shared s ...
+   (reverse-list->string (proc (:value) :string))
+   (string->list (proc (:string &opt :exact-integer :exact-integer) :value))
+   ((string-concatenate string-concatenate/shared) (proc (:value) :string))
+   (string-append/shared (proc (&rest :string) :string))
+
+   ;; string-concatenate-reverse        string-list [final-string end]
+   ;; string-concatenate-reverse/shared string-list [final-string end]
+   ((string-concatenate-reverse string-concatenate-reverse/shared)
+    (proc (:value &opt :string :exact-integer) :string))
+
+   ;; xsubstring s from [to start end]
+   ;; string-xcopy! target tstart s from [to start end]
+   (xsubstring (proc (:string :exact-integer &opt
+			      :exact-integer :exact-integer :exact-integer)
+		     :string))
+   (string-xcopy! (proc (:string :exact-integer :string :exact-integer &opt
+				 :exact-integer :exact-integer :exact-integer)
+			:unspecific))
+
+   ;; string-null? s
+   (string-null? (proc (:string) :boolean))
+
+   ;; string-join string-list [delim grammar]
+   (string-join (proc (:value &opt :string :symbol) :string))
+
+   ;; string-tokenize string [token-chars start end]
+   (string-tokenize (proc (:string &opt :value :exact-integer :exact-integer)
+			  :value))
+
+   ;; string-replace s1 s2 start1 end1 [start2 end2]
+   (string-replace (proc (:string :string :exact-integer :exact-integer
+				  &opt :exact-integer :exact-integer)
+			 :string))
+
+   ;; Here are the R4RS/R5RS procs
+   (string? (proc (:value) :boolean))
+   (make-string (proc (:exact-integer &opt :char) :string))
+   (string (proc (&rest :char) :string))
+   (string-length (proc (:string) :exact-integer))
+   (string-ref (proc (:string :exact-integer) :char))
+   (string-set! (proc (:string :exact-integer :char) :unspecific))
+   (string-append (proc (&rest :string) :string))
+   (list->string (proc (:value) :string))
+
+   ;; These are the R4RS types for STRING-COPY, STRING-FILL!, and
+   ;; STRING->LIST. The string-lib types are different -- extended.
+   ;(string-copy (proc (:string) :string))
+   ;(string-fill! (proc (:string :char) :unspecific))
+   ;(string->list (proc (:string) :value))
+
+   ))
+
+
+;;; Internals interface: the lower-level SRFI-13 utilities, exported
+;;; separately from STRING-LIB-INTERFACE. Exports, grouped by apparent role:
+;;;   let-string-start+end (syntax), string-parse-start+end,
+;;;   string-parse-final-start+end   -- start/end argument handling
+;;;   check-substring-spec, substring-spec-ok?  -- substring-spec checks
+;;;   make-kmp-restart-vector, string-kmp-partial-search, kmp-step
+;;;                                  -- KMP string-search primitives
+;;; (Roles are inferred from names and signatures; see string-lib.scm.)
+
+(define-interface string-lib-internals-interface
+  (export
+   (let-string-start+end :syntax)
+   (string-parse-start+end (proc ((procedure :values :values) :string :value)
+				 (some-values :exact-integer :exact-integer :value)))
+   (string-parse-final-start+end (proc ((procedure :values :values) :string :value)
+				       (some-values :exact-integer :exact-integer)))
+   (check-substring-spec (proc ((procedure :values :values) :string :exact-integer :exact-integer)
+			       :unspecific))
+   (substring-spec-ok? (proc ((procedure :values :values) :string :exact-integer :exact-integer)
+			     :boolean))
+
+   ;; string-kmp-partial-search pat rv s i [c= p-start s-start s-end] -> integer
+   (string-kmp-partial-search (proc (:string :vector :string :exact-integer
+				     &opt (proc (:char :char) :boolean)
+				          :exact-integer :exact-integer :exact-integer)
+				    :exact-integer))
+
+   ;; make-kmp-restart-vector s [c= start end] -> vector
+   (make-kmp-restart-vector (proc (:string &opt (proc (:char :char) :boolean)
+					        :exact-integer :exact-integer)
+				  :vector))
+
+   ;; kmp-step pat rv c i c= p-start -> integer
+   (kmp-step (proc (:string :vector :char :exact-integer
+			    (proc (:char :char) :boolean)
+			    :exact-integer)
+		   :exact-integer))
+   ))
+
+
+(define-structures ((string-lib string-lib-interface)
+		    (string-lib-internals string-lib-internals-interface))
+  (access scheme)	; Get at R5RS SUBSTRING
+  (open receiving	; RECEIVE
+	char-set-lib	; Various
+	bitwise		; BITWISE-AND for hashing
+	error-package	; ERROR
+	let-opt		; LET-OPTIONALS* :OPTIONAL
+	scheme)
+  ;; A few cheesy S48/scsh definitions for string-lib dependencies.
+  ;; CHECK-ARG returns VAL if (PRED VAL) holds, else retries on ERROR's value.
+  (begin (define (check-arg pred val caller)
+	   (let lp ((val val))
+	     (if (pred val) val (lp (error "Bad argument" val pred caller)))))
+
+	 ;; CHAR-CASED? is membership in CHAR-SET:LETTER; CHAR-TITLECASE is just
+	 ;; CHAR-UPCASE. Correct for ASCII or Latin-1, *not* for Unicode.
+	 (define (char-cased? c) (char-set-contains? char-set:letter c))
+	 (define (char-titlecase c) (char-upcase c)))
+
+  (files string-lib))
diff --git a/scsh/meta-arg.scm b/scsh/meta-arg.scm
index 06add40..ee57b1e 100644
--- a/scsh/meta-arg.scm
+++ b/scsh/meta-arg.scm
@@ -52,7 +52,7 @@
 ;;; line two. Return these as a list of strings.
 
 (define read-files-secondary-args
-  (let ((non-newline (char-set-invert (char-set #\newline))))
+  (let ((non-newline (char-set-complement! (char-set #\newline))))
     (lambda (fname)
       (call-with-input-file fname
 	(lambda (port)
diff --git a/scsh/rx/packages.scm b/scsh/rx/packages.scm
index 1ef520e..45d2907 100644
--- a/scsh/rx/packages.scm
+++ b/scsh/rx/packages.scm
@@ -198,7 +198,7 @@
 	define-record-types
 	defrec-package
 	receiving
-	char-set-package
+	char-set-lib
 	error-package
 	ascii
 	string-lib		; string-fold
@@ -234,7 +234,7 @@
   (open re-internals
 	conditionals
 	re-level-0
-	char-set-package
+	char-set-lib
 	scsh-utilities	; fold
 	error-package
 	ascii
@@ -249,7 +249,7 @@
 
 (define-structure rx-syntax rx-syntax-interface
   (open re-level-0
-	char-set-package
+	char-set-lib
 	rx-lib
 	scheme)
   (for-syntax (open sre-internal-syntax-tools scheme))
diff --git a/scsh/rx/parse.scm b/scsh/rx/parse.scm
index fed54e0..e75ccc2 100644
--- a/scsh/rx/parse.scm
+++ b/scsh/rx/parse.scm
@@ -74,8 +74,8 @@
                
 
 ;;; Two useful standard char sets
-(define nonl-chars (char-set-invert (char-set #\newline)))
-(define word-chars (char-set-union (char-set #\_) char-set:alphanumeric))
+(define nonl-chars (char-set-complement (char-set #\newline)))
+(define word-chars (char-set-union (char-set #\_) char-set:letter+digit))
 
 ;;; Little utility that should be moved to scsh's utilities.scm
 (define (partition pred lis)
@@ -232,8 +232,8 @@
 					   (map parse-char-class (cdr sre))
 					   r))
 			(cs (if (char-set? cs)
-				(char-set-invert cs)
-				`(,(r 'char-set-invert) ,cs))))
+				(char-set-complement cs)
+				`(,(r 'char-set-complement) ,cs))))
 		   (if cset? cs (make-re-char-set cs))))
 
 	    ((&) (let ((cs (assoc-cset-op char-set-intersection 'char-set-intersection
@@ -281,15 +281,15 @@
 			   ((nonl)			nonl-chars)
 			   ((lower-case lower)		char-set:lower-case)
 			   ((upper-case upper)		char-set:upper-case)
-			   ((alphabetic alpha)		char-set:alphabetic)
-			   ((numeric digit num)	char-set:numeric)
-			   ((alphanumeric alnum alphanum) char-set:alphanumeric)
+			   ((alphabetic alpha)		char-set:letter)
+			   ((numeric digit num)	char-set:digit)
+			   ((alphanumeric alnum alphanum) char-set:letter+digit)
 			   ((punctuation punct)	char-set:punctuation)
 			   ((graphic graph)		char-set:graphic)
 			   ((blank)			char-set:blank)
 			   ((whitespace space white)	char-set:whitespace)
 			   ((printing print)		char-set:printing)
-			   ((control cntrl)		char-set:control)
+			   ((control cntrl)		char-set:iso-control)
 			   ((hex-digit xdigit hex)	char-set:hex-digit)
 			   ((ascii)			char-set:ascii)
 			   (else (error "Illegal regular expression" sre)))))
@@ -346,10 +346,9 @@
 	  (if (< i 0)
 	      (if cs? cset (uncase-char-set cset)) ; Case fold if necessary.
 	      (lp (- i 2)
-		  (char-set-union!
-		      cset
-		      (ascii-range->char-set (char->ascii (string-ref specs (- i 1)))
-					     (+ 1 (char->ascii (string-ref specs i)))))))))))
+		  (ucs-range->char-set! (char->ascii (string-ref specs (- i 1)))
+					(+ 1 (char->ascii (string-ref specs i)))
+					#f cset)))))))
 
 ;;; (regexp->scheme re r)
 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
@@ -451,17 +450,17 @@
 			   (else #f)))
 		(if one
 		    (switch char-set= cs
-		      ((char-set:alphanumeric)	alphanum)
+		      ((char-set:letter+digit)	alphanum)
 		      ((char-set:graphic)	graph)
 		      ((char-set:hex-digit)	hex)
 		      (else #f))
-		    (and (char-set= cs char-set:alphabetic) alpha)))
+		    (and (char-set= cs char-set:letter) alpha)))
 	    (and (char-set= cs char-set:lower-case) lower)) ; a, not A
 
 	(if biga
 	    (and (not space) (char-set= cs char-set:upper-case) upper)
 	    (if one
-		(and (not space) (char-set= cs char-set:numeric) num)
+		(and (not space) (char-set= cs char-set:digit) num)
 		(if space
 		    (switch char-set= cs
 		      ((char-set:whitespace) white)
@@ -469,7 +468,7 @@
 		      (else #f))
 		    (switch char-set= cs
 		      ((char-set:punctuation)	punct)
-		      ((char-set:control)	ctl)
+		      ((char-set:iso-control)	ctl)
 		      (else #f))))))))
 		
 
@@ -478,21 +477,21 @@
 	       (try-classify-char-set cs
 				      'char-set:full         'nonl-chars
 				      'char-set:lower-case   'char-set:upper-case
-				      'char-set:alphabetic   'char-set:numeric
-				      'char-set:alphanumeric 'char-set:punctuation
+				      'char-set:letter       'char-set:digit
+				      'char-set:letter+digit 'char-set:punctuation
 				      'char-set:graphic      'char-set:whitespace
-				      'char-set:printing     'char-set:control
+				      'char-set:printing     'char-set:iso-control
 				      'char-set:hex-digit    'char-set:blank
 				      'char-set:ascii))))
     (? ((not (char-set? cs)) cs) ; Dynamic -- *already* Scheme code.
        ((char-set-empty? cs) (r 'char-set:empty))
        ((try cs) => r)
-       ((try (char-set-invert cs)) =>
-	(lambda (name) `(,(r 'char-set-invert) ,name)))
+       ((try (char-set-complement cs)) =>
+	(lambda (name) `(,(r 'char-set-complement) ,name)))
 
        (else
 	(receive (loose+ ranges+) (char-set->in-pair cs)
-	  (receive (loose- ranges-) (char-set->in-pair (char-set-invert cs))
+	  (receive (loose- ranges-) (char-set->in-pair (char-set-complement cs))
 	    (let ((makeit (r 'spec->char-set)))
 	      (if (< (+ (length loose-) (* 12 (length ranges-)))
 		     (+ (length loose+) (* 12 (length ranges+))))
@@ -517,9 +516,9 @@
 					  'ascii)))
 	    (nchars (char-set-size cs)))
 	(? ((zero? nchars) `(,(r '|)))
-	   ((= 1 nchars) (apply string (char-set-members cs)))
+	   ((= 1 nchars) (apply string (char-set->list cs)))
 	   ((try cs) => r)
-	   ((try (char-set-invert cs)) =>
+	   ((try (char-set-complement cs)) =>
 	    (lambda (name) `(,(r '~) ,name)))
 	   (else (receive (cs rp comp?) (char-set->in-sexp-spec cs)
 		   (let ((args (append (? ((string=? cs "") '())
@@ -619,7 +618,7 @@
 						      `(,(car r) ,(cdr r) . ,lis))
 						    '() ranges)))))))
     (receive (cs+ rp+) (->sexp-pair cset)
-      (receive (cs- rp-) (->sexp-pair (char-set-invert cset))
+      (receive (cs- rp-) (->sexp-pair (char-set-complement cset))
 	(if (< (+ (string-length cs-) (string-length rp-))
 	       (+ (string-length cs+) (string-length rp+)))
 	    (values cs- rp- #t)
diff --git a/scsh/rx/posixstr.scm b/scsh/rx/posixstr.scm
index bbd06e5..9c9628b 100644
--- a/scsh/rx/posixstr.scm
+++ b/scsh/rx/posixstr.scm
@@ -375,11 +375,11 @@
 	(? ((= 0 nchars) (values "[^\000-\177]" 1 0 '#()))	; Empty set
 	     
 	   ((= 1 nchars)					; Singleton set
-	    (translate-string (string (car (char-set-members cset)))))
+	    (translate-string (string (car (char-set->list cset)))))
 
 	   ;; General case. Try both [...] and [^...].
 	   (else (let ((s- (->bracket-string cset #t))
-		       (s+ (->bracket-string (char-set-invert cset) #f)))
+		       (s+ (->bracket-string (char-set-complement cset) #f)))
 		   (values (if (< (string-length s-) (string-length s+))
 			       s- s+)
 			   1 0 '#())))))))
diff --git a/scsh/rx/re.scm b/scsh/rx/re.scm
index 263a259..fd32c26 100644
--- a/scsh/rx/re.scm
+++ b/scsh/rx/re.scm
@@ -162,7 +162,7 @@
 				      (string->char-set (re-string:chars elt))))
 				res))))
 	  (if (= 1 (char-set-size cset))
-	      (make-re-string (apply string (char-set-members cset)))
+	      (make-re-string (apply string (char-set->list cset)))
 	      (make-re-char-set cset)))
 
 	(if (pair? res)
@@ -387,7 +387,7 @@
 	      (char-set-full? cs)))))
 
 (define re-nonl
-  (make-re-char-set/posix (char-set-invert (char-set #\newline))
+  (make-re-char-set/posix (char-set-complement (char-set #\newline))
 			  "[^\n]"
 			  '#()))
 
@@ -414,7 +414,7 @@
 
 
 (define re-word
-  (let ((wcs (char-set-union char-set:alphanumeric	; Word chars
+  (let ((wcs (char-set-union char-set:letter+digit	; Word chars
 			     (char-set #\_))))
     (make-re-seq (list re-bow
 		       (make-re-repeat 1 #f (make-re-char-set wcs))
diff --git a/scsh/rx/rx-lib.scm b/scsh/rx/rx-lib.scm
index 9bb245b..07c3fe6 100644
--- a/scsh/rx/rx-lib.scm
+++ b/scsh/rx/rx-lib.scm
@@ -36,5 +36,5 @@
 		      ranges))))
     (if in?
 	(doit loose ranges)
-	(char-set-invert! (doit loose ranges)))))
+	(char-set-complement! (doit loose ranges)))))
 
diff --git a/scsh/rx/simp.scm b/scsh/rx/simp.scm
index 8d15347..d8656fe 100644
--- a/scsh/rx/simp.scm
+++ b/scsh/rx/simp.scm
@@ -47,7 +47,7 @@
       (values (let ((cs (re-char-set:cset re)))
 		(if (and (char-set? cs)
 			 (= 1 (char-set-size cs)))
-		    (make-re-string (string (car (char-set-members cs))))
+		    (make-re-string (string (car (char-set->list cs))))
 		    re))
 	      0))
 
@@ -243,7 +243,7 @@
 	 (tail (if (and bos? (not prev-bos?)) (cons re-bos tail) tail))
 	 (tail (? ((zero? numchars) tail)	; Drop empty char set.
 		  ((= 1 numchars)		; {c} => "c"
-		   (cons (make-re-string (string (car (char-set-members cset))))
+		   (cons (make-re-string (string (car (char-set->list cset))))
 			 tail))
 		  (else (cons (make-re-char-set cset) tail)))))
     tail))
diff --git a/scsh/rx/spencer.scm b/scsh/rx/spencer.scm
index 2b4368f..e61c904 100644
--- a/scsh/rx/spencer.scm
+++ b/scsh/rx/spencer.scm
@@ -128,7 +128,7 @@
 		    ((#\]) (if (= i i0)
 			       (lp i1 (char-set-adjoin! cset #\]))
 			       (let ((cset (if negate?
-					       (char-set-invert! cset)
+					       (char-set-complement! cset)
 					       cset)))
 				 (values (make-re-char-set cset) i1))))
 
diff --git a/scsh/scsh-interfaces.scm b/scsh/scsh-interfaces.scm
index 5342108..0cad09c 100644
--- a/scsh/scsh-interfaces.scm
+++ b/scsh/scsh-interfaces.scm
@@ -684,82 +684,8 @@
 	  ))
 
 
-(define-interface char-set-interface
-  (export char:newline char:tab char:page char:return char:space char:vtab
-	  char-ascii?
-
-	  char-set?
-	  char-set-copy
-	  char-set=
-	  char-set<=
-	  char-set-size
-
-	  char-set-adjoin  char-set-delete
-	  char-set-adjoin! char-set-delete!
-	  char-set-for-each
-	  char-set-fold reduce-char-set
-
-	  char-set
-	  chars->char-set
-	  string->char-set
-	  ascii-range->char-set
-	  predicate->char-set
-	  ->char-set
-
-	  char-set-members
-	  char-set-contains?
-
-	  char-set-every?
-	  char-set-any
-
-	  char-set-invert
-	  char-set-union
-	  char-set-intersection
-	  char-set-difference
-
-	  char-set-invert!
-	  char-set-union!
-	  char-set-intersection!
-	  char-set-difference!
-
-	  char-set:lower-case
-	  char-set:upper-case
-	  char-set:alphabetic
-	  char-set:numeric
-	  char-set:alphanumeric
-	  char-set:graphic
-	  char-set:printing
-	  char-set:whitespace
-	  char-set:blank
-	  char-set:control
-	  char-set:punctuation
-	  char-set:hex-digit
-	  char-set:ascii
-	  char-set:empty
-	  char-set:full
-
-	  char-lower-case?
-	  char-upper-case?
-	  char-alphabetic?
-	  char-numeric?
-	  char-alphanumeric?
-	  char-graphic?
-	  char-printing?
-	  char-whitespace?
-	  char-blank?
-	  char-control?
-	  char-punctuation?
-	  char-hex-digit?
-	  char-ascii?
-
-	  ;; This is not properly part of the interface,
-	  ;; and should be moved to an internals interface --
-	  ;; it is used by rdelim.scm code.
-	  char-set:s))
-
-
 (define-interface scsh-field-reader-interface
-  (export join-strings
+  (export join-strings	; Obsolete. Has become SRFI-13's STRING-JOIN.
 	  field-splitter infix-splitter suffix-splitter sloppy-suffix-splitter
 	  record-reader
 	  field-reader
diff --git a/scsh/scsh-package.scm b/scsh/scsh-package.scm
index ca74362..6d20b9f 100644
--- a/scsh/scsh-package.scm
+++ b/scsh/scsh-package.scm
@@ -61,17 +61,6 @@
   )
 
 
-(define-structure char-set-package char-set-interface  
-  (open error-package
-	ascii
-	define-record-types	; JAR's record macro.
-	scsh-utilities		; For DEPRECATED-PROC
-	scheme)
-  (files char-set)
-  (optimize auto-integrate)
-  )
-
-
 (define-structures ((tty-flags tty-flags-interface)
 		    (scsh-internal-tty-flags scsh-internal-tty-flags-interface))
   (open scheme ascii bitwise)
@@ -166,9 +155,10 @@
 	fluids
 	weak
 
+	scsh-char-set-low-level-lib	    ; rdelim.scm needs it.
 ;	scsh-regexp-package
 ;	scsh-regexp-internals
-	char-set-package
+	char-set-lib
 	scsh-version
 	tty-flags
 	scsh-internal-tty-flags             ; Not exported
@@ -181,7 +171,8 @@
 
 	string-lib
 
-	loopholes                    ; For my bogus CALL-TERMINALLY implementation.
+	fluids			; For exec-path-list
+	loopholes		; For my bogus CALL-TERMINALLY implementation.
 
 	scheme
 	)
@@ -288,17 +279,19 @@
 
 (define-structure field-reader-package scsh-field-reader-interface
   (open receiving		; receive
-	char-set-package
-	scsh-utilities		; nth
+	scsh-utilities		; nth & deprecated-proc (for join-strings)
 	error-package		; error
+	string-lib		; string-join for obsolete join-strings
 	scsh-level-0		; delimited readers
 ;	scsh-regexp-package
 	re-exports
-	string-lib		; join-strings
 	let-opt			; optional-arg parsing & defaulting
 	scheme
 	)
   (files fr)
+  ;; Handle a little bit of backwards compatibility.
+  (begin (define join-strings (deprecated-proc string-join 'join-strings
+					       "Use SRFI-13 STRING-JOIN.")))
   (optimize auto-integrate)
   )
 
@@ -364,9 +357,12 @@
 		      (export repl)
 		      awk-interface
 		      odbc-interface
+		      char-set-predicates-interface; Urk -- Some of this is R5RS!
+		      obsolete-char-set-interface
 		      )
 
   (open structure-refs
+	obsolete-char-set-lib
 	scsh-level-0
 	scsh-level-0-internals
 	re-exports
@@ -377,6 +373,7 @@
 	awk-package
 	odbc-package
 	field-reader-package
+	char-set-predicates-lib	; Urk -- Some of this is R5RS!
 	scheme)
 
   (access scsh-top-package)
diff --git a/scsh/scsh.scm b/scsh/scsh.scm
index 7d9fbad..08621a1 100644
--- a/scsh/scsh.scm
+++ b/scsh/scsh.scm
@@ -664,7 +664,7 @@
   (%exec prog (cons prog arglist) env))
 
 ;(define (exec-path/env prog env . arglist)
-;  (cond ((exec-path-search (stringify prog) exec-path-list) =>
+;  (cond ((exec-path-search (stringify prog) (fluid exec-path-list)) =>
 ;	 (lambda (binary)
 ;	   (apply exec/env binary env arglist)))
 ;	(else (error "No executable found." prog arglist))))
@@ -686,7 +686,7 @@
 	  (for-each (lambda (dir)
 		      (let ((binary (string-append dir "/" prog)))
 			(%%exec/errno binary argv env)))
-		    exec-path-list))))
+		    (fluid exec-path-list)))))
 
     (error "No executable found." prog arglist))
 	 
@@ -746,7 +746,7 @@
 
 ;;; Some globals:
 (define home-directory "")
-(define exec-path-list '())
+(define exec-path-list (make-fluid '()))
 
 (define (init-scsh-vars quietly?)
   (set! home-directory
@@ -754,11 +754,11 @@
 	      (else (if (not quietly?)
 			(warn "Starting up with no home directory ($HOME)."))
 		    "/")))
-  (set! exec-path-list
-	(cond ((getenv "PATH") => split-colon-list)
-	      (else (if (not quietly?)
-			(warn "Starting up with no path ($PATH)."))
-		    '()))))
+  (set-fluid! exec-path-list
+	      (cond ((getenv "PATH") => split-colon-list)
+		    (else (if (not quietly?)
+			      (warn "Starting up with no path ($PATH)."))
+			  '()))))
 
 
 ; SIGTSTP blows s48 away. ???

`char-set:lower-case`	Lower-case letters
`char-set:upper-case`	Upper-case letters
`char-set:title-case`	Title-case letters
`char-set:letter`	Letters
`char-set:digit`	Digits
`char-set:letter+digit`	Letters and digits
`char-set:graphic`	Printing characters except spaces
`char-set:printing`	Printing characters including spaces
`char-set:whitespace`	Whitespace characters
`char-set:iso-control`	The ISO control characters
`char-set:punctuation`	Punctuation characters
`char-set:symbol`	Symbol characters
`char-set:hex-digit`	A hexadecimal digit: 0-9, A-F, a-f
`char-set:blank`	Blank characters -- horizontal whitespace
`char-set:ascii`	All characters in the ASCII set.
`char-set:empty`	Empty set
`char-set:full`	All characters
00B5	MICRO SIGN
00DF	LATIN SMALL LETTER SHARP S
00E0	LATIN SMALL LETTER A WITH GRAVE
00E1	LATIN SMALL LETTER A WITH ACUTE
00E2	LATIN SMALL LETTER A WITH CIRCUMFLEX
00E3	LATIN SMALL LETTER A WITH TILDE
00E4	LATIN SMALL LETTER A WITH DIAERESIS
00E5	LATIN SMALL LETTER A WITH RING ABOVE
00E6	LATIN SMALL LETTER AE
00E7	LATIN SMALL LETTER C WITH CEDILLA
00E8	LATIN SMALL LETTER E WITH GRAVE
00E9	LATIN SMALL LETTER E WITH ACUTE
00EA	LATIN SMALL LETTER E WITH CIRCUMFLEX
00EB	LATIN SMALL LETTER E WITH DIAERESIS
00EC	LATIN SMALL LETTER I WITH GRAVE
00ED	LATIN SMALL LETTER I WITH ACUTE
00EE	LATIN SMALL LETTER I WITH CIRCUMFLEX
00EF	LATIN SMALL LETTER I WITH DIAERESIS
00F0	LATIN SMALL LETTER ETH
00F1	LATIN SMALL LETTER N WITH TILDE
00F2	LATIN SMALL LETTER O WITH GRAVE
00F3	LATIN SMALL LETTER O WITH ACUTE
00F4	LATIN SMALL LETTER O WITH CIRCUMFLEX
00F5	LATIN SMALL LETTER O WITH TILDE
00F6	LATIN SMALL LETTER O WITH DIAERESIS
00F8	LATIN SMALL LETTER O WITH STROKE
00F9	LATIN SMALL LETTER U WITH GRAVE
00FA	LATIN SMALL LETTER U WITH ACUTE
00FB	LATIN SMALL LETTER U WITH CIRCUMFLEX
00FC	LATIN SMALL LETTER U WITH DIAERESIS
00FD	LATIN SMALL LETTER Y WITH ACUTE
00FE	LATIN SMALL LETTER THORN
00FF	LATIN SMALL LETTER Y WITH DIAERESIS
00C0	LATIN CAPITAL LETTER A WITH GRAVE
00C1	LATIN CAPITAL LETTER A WITH ACUTE
00C2	LATIN CAPITAL LETTER A WITH CIRCUMFLEX
00C3	LATIN CAPITAL LETTER A WITH TILDE
00C4	LATIN CAPITAL LETTER A WITH DIAERESIS
00C5	LATIN CAPITAL LETTER A WITH RING ABOVE
00C6	LATIN CAPITAL LETTER AE
00C7	LATIN CAPITAL LETTER C WITH CEDILLA
00C8	LATIN CAPITAL LETTER E WITH GRAVE
00C9	LATIN CAPITAL LETTER E WITH ACUTE
00CA	LATIN CAPITAL LETTER E WITH CIRCUMFLEX
00CB	LATIN CAPITAL LETTER E WITH DIAERESIS
00CC	LATIN CAPITAL LETTER I WITH GRAVE
00CD	LATIN CAPITAL LETTER I WITH ACUTE
00CE	LATIN CAPITAL LETTER I WITH CIRCUMFLEX
00CF	LATIN CAPITAL LETTER I WITH DIAERESIS
00D0	LATIN CAPITAL LETTER ETH
00D1	LATIN CAPITAL LETTER N WITH TILDE
00D2	LATIN CAPITAL LETTER O WITH GRAVE
00D3	LATIN CAPITAL LETTER O WITH ACUTE
00D4	LATIN CAPITAL LETTER O WITH CIRCUMFLEX
00D5	LATIN CAPITAL LETTER O WITH TILDE
00D6	LATIN CAPITAL LETTER O WITH DIAERESIS
00D8	LATIN CAPITAL LETTER O WITH STROKE
00D9	LATIN CAPITAL LETTER U WITH GRAVE
00DA	LATIN CAPITAL LETTER U WITH ACUTE
00DB	LATIN CAPITAL LETTER U WITH CIRCUMFLEX
00DC	LATIN CAPITAL LETTER U WITH DIAERESIS
00DD	LATIN CAPITAL LETTER Y WITH ACUTE
00DE	LATIN CAPITAL LETTER THORN
01C5	LATIN CAPITAL LETTER D WITH SMALL LETTER Z WITH CARON +
01C8	LATIN CAPITAL LETTER L WITH SMALL LETTER J +
01CB	LATIN CAPITAL LETTER N WITH SMALL LETTER J +
01F2	LATIN CAPITAL LETTER D WITH SMALL LETTER Z +
1F88	GREEK CAPITAL LETTER ALPHA WITH PSILI AND PROSGEGRAMMENI +
1F89	GREEK CAPITAL LETTER ALPHA WITH DASIA AND PROSGEGRAMMENI +
1F8A	GREEK CAPITAL LETTER ALPHA WITH PSILI AND VARIA AND PROSGEGRAMMENI +
1F8B	GREEK CAPITAL LETTER ALPHA WITH DASIA AND VARIA AND PROSGEGRAMMENI +
1F8C	GREEK CAPITAL LETTER ALPHA WITH PSILI AND OXIA AND PROSGEGRAMMENI +
1F8D	GREEK CAPITAL LETTER ALPHA WITH DASIA AND OXIA AND PROSGEGRAMMENI +
1F8E	GREEK CAPITAL LETTER ALPHA WITH PSILI AND PERISPOMENI AND PROSGEGRAMMENI +
1F8F	GREEK CAPITAL LETTER ALPHA WITH DASIA AND PERISPOMENI AND PROSGEGRAMMENI +
1F98	GREEK CAPITAL LETTER ETA WITH PSILI AND PROSGEGRAMMENI +
1F99	GREEK CAPITAL LETTER ETA WITH DASIA AND PROSGEGRAMMENI +
1F9A	GREEK CAPITAL LETTER ETA WITH PSILI AND VARIA AND PROSGEGRAMMENI +
1F9B	GREEK CAPITAL LETTER ETA WITH DASIA AND VARIA AND PROSGEGRAMMENI +
1F9C	GREEK CAPITAL LETTER ETA WITH PSILI AND OXIA AND PROSGEGRAMMENI +
1F9D	GREEK CAPITAL LETTER ETA WITH DASIA AND OXIA AND PROSGEGRAMMENI +
1F9E	GREEK CAPITAL LETTER ETA WITH PSILI AND PERISPOMENI AND PROSGEGRAMMENI +
1F9F	GREEK CAPITAL LETTER ETA WITH DASIA AND PERISPOMENI AND PROSGEGRAMMENI +
1FA8	GREEK CAPITAL LETTER OMEGA WITH PSILI AND PROSGEGRAMMENI +
1FA9	GREEK CAPITAL LETTER OMEGA WITH DASIA AND PROSGEGRAMMENI +
1FAA	GREEK CAPITAL LETTER OMEGA WITH PSILI AND VARIA AND PROSGEGRAMMENI +
1FAB	GREEK CAPITAL LETTER OMEGA WITH DASIA AND VARIA AND PROSGEGRAMMENI +
1FAC	GREEK CAPITAL LETTER OMEGA WITH PSILI AND OXIA AND PROSGEGRAMMENI +
1FAD	GREEK CAPITAL LETTER OMEGA WITH DASIA AND OXIA AND PROSGEGRAMMENI +
1FAE	GREEK CAPITAL LETTER OMEGA WITH PSILI AND PERISPOMENI AND PROSGEGRAMMENI +
1FAF	GREEK CAPITAL LETTER OMEGA WITH DASIA AND PERISPOMENI AND PROSGEGRAMMENI +
1FBC	GREEK CAPITAL LETTER ALPHA WITH PROSGEGRAMMENI +
1FCC	GREEK CAPITAL LETTER ETA WITH PROSGEGRAMMENI +
1FFC	GREEK CAPITAL LETTER OMEGA WITH PROSGEGRAMMENI +
00AA	FEMININE ORDINAL INDICATOR
00BA	MASCULINE ORDINAL INDICATOR
0009	HORIZONTAL TABULATION	\t control-I
000A	LINE FEED	\n control-J
000B	VERTICAL TABULATION	\v control-K
000C	FORM FEED	\f control-L
000D	CARRIAGE RETURN	\r control-M
0020	SPACE	Zs
00A0	NO-BREAK SPACE	Zs
1680	OGHAM SPACE MARK	Zs
2000	EN QUAD	Zs
2001	EM QUAD	Zs
2002	EN SPACE	Zs
2003	EM SPACE	Zs
2004	THREE-PER-EM SPACE	Zs
2005	FOUR-PER-EM SPACE	Zs
2006	SIX-PER-EM SPACE	Zs
2007	FIGURE SPACE	Zs
2008	PUNCTUATION SPACE	Zs
2009	THIN SPACE	Zs
200A	HAIR SPACE	Zs
200B	ZERO WIDTH SPACE	Zs
2028	LINE SEPARATOR	Zl
2029	PARAGRAPH SEPARATOR	Zp
202F	NARROW NO-BREAK SPACE	Zs
3000	IDEOGRAPHIC SPACE	Zs
0009	HORIZONTAL TABULATION	(\t control-I)
001C	FILE SEPARATOR	(control-\)
001D	GROUP SEPARATOR	(control-])
001E	RECORD SEPARATOR	(control-^)
001F	UNIT SEPARATOR	(control-_)
00A1	INVERTED EXCLAMATION MARK +
00AB	LEFT-POINTING DOUBLE ANGLE QUOTATION MARK +
00AD	SOFT HYPHEN +
00B7	MIDDLE DOT +
00BB	RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK +
00BF	INVERTED QUESTION MARK +
00A2	CENT SIGN
00A3	POUND SIGN
00A4	CURRENCY SIGN
00A5	YEN SIGN
00A6	BROKEN BAR
00A7	SECTION SIGN
00A8	DIAERESIS
00A9	COPYRIGHT SIGN
00AC	NOT SIGN
00AE	REGISTERED SIGN
00AF	MACRON
00B0	DEGREE SIGN
00B1	PLUS-MINUS SIGN
00B4	ACUTE ACCENT
00B6	PILCROW SIGN
00B8	CEDILLA
00D7	MULTIPLICATION SIGN
00F7	DIVISION SIGN