stk/Src/read.c

353 lines
8.9 KiB
C

/*
* r e a d . c -- reading stuff
*
* Copyright © 1993-1999 Erick Gallesio - I3S-CNRS/ESSI <eg@unice.fr>
*
*
* Permission to use, copy, modify, distribute,and license this
* software and its documentation for any purpose is hereby granted,
* provided that existing copyright notices are retained in all
* copies and that this notice is included verbatim in any
* distributions. No written agreement, license, or royalty fee is
* required for any of the authorized uses.
* This software is provided ``AS IS'' without express or implied
* warranty.
*
* Author: Erick Gallesio [eg@unice.fr]
* Creation date: ??-Oct-1993 ??:??
* Last file update: 3-Sep-1999 20:22 (eg)
*
*/
#include <ctype.h>
#include "stk.h"
#include "module.h"
/* Association list of (label . object) pairs built while reading: read_cycle
 * pushes an entry for each "#n=" label and looks labels up for "#n#"
 * references. STk_readf resets it to NIL at the start of every read; the
 * initial NULL tells STk_readf that the variable has not yet been handed
 * to STk_gc_protect.
 */
static SCM cycles = NULL; /* used for reading circular data */
/* Name picked up by the Serror macro when it reports an error from this file. */
static char *proc_name = "read"; /* for Serror macro */
/* Forward declaration: read_list and read_cycle call read_rec, which in turn
 * calls them.
 */
static SCM read_rec(SCM port, int case_significant);
/*
 * flush_ws -- skip white space and `;' comments on `port'.
 *
 * Returns the first character that is neither white space nor part of a
 * comment. Each newline that is skipped increments STk_line_counter.
 *
 * On end of file: if `message' is non-NULL it is reported through Serror
 * (which is relied upon not to return); otherwise EOF is returned.
 */
static int flush_ws(SCM port, char *message)
{
  int ch;

  for (ch = Getc(port); ; ch = Getc(port)) {
    if (ch == ';') {
      /* Comment: discard up to (not including) the end of line or EOF,
       * then let the tests below deal with whichever one stopped us. */
      do
        ch = Getc(port);
      while (ch != '\n' && ch != EOF);
    }

    if (ch == EOF) {
      if (!message) return(ch);
      Serror(message, NIL);
    }
    else if (ch == '\n') {
      STk_line_counter += 1;
    }
    else if (!isspace(ch)) {
      return(ch);
    }
  }
}
/*
 * read_list -- read the remainder of a list whose opening bracket has
 * already been consumed; the list ends at the `delim' character.
 *
 * Returns NIL when `delim' is the next significant character. Otherwise one
 * item is read with read_rec: if it is the dot symbol, the following item is
 * returned as the tail (and `delim' must come right after it); if not, the
 * item is consed onto the result of reading the rest of the list.
 *
 * End of file before `delim' is an error ("End of file inside list").
 */
static SCM read_list(SCM port, char delim, int case_significant)
{
  SCM item, rest;
  int ch;

  ch = flush_ws(port, "End of file inside list");
  if (ch == delim) {
    return(NIL);
  }

  /* Not the closing delimiter: give the char back and read one datum */
  Ungetc(ch, port);
  item = read_rec(port, case_significant);

  if (EQ(item, Sym_dot)) {
    /* Dotted tail: exactly one datum, then the closing delimiter */
    item = read_rec(port, case_significant);
    ch   = flush_ws(port, "End of file inside list");
    if (ch != delim) Serror("missing close parenthesis", NIL);
    return(item);
  }

  /* Ordinary element: the recursion depth grows with the list length */
  rest = read_list(port, delim, case_significant);
  return(Cons(item, rest));
}
/*
 * read_word -- accumulate a token in STk_tkbuffer; its first character is
 * already in `c'.
 *
 * A `|' toggles "verbatim" mode and is not stored itself. While in verbatim
 * mode every character is stored unchanged and delimiters are ignored.
 * Outside verbatim mode characters are lower-cased unless `case_significant'
 * is set, and the token ends at EOF, at white space (consumed) or at one of
 * ( ) [ ] ' ` , ; " newline (pushed back on the port).
 *
 * The buffer is NUL-terminated on exit. A token that fills the buffer is
 * reported with "token too large".
 */
static void read_word(SCM port, int c, int case_significant)
{
  int len      = 0;     /* characters stored so far           */
  int verbatim = 0;     /* non-zero between a pair of `|'     */

  while (1) {
    if (c == '|')
      verbatim = !verbatim;
    else
      STk_tkbuffer[len++] = (verbatim || case_significant) ? c : tolower(c);

    c = Getc(port);
    if (c == EOF) break;

    if (!verbatim) {
      if (strchr("()[]'`,;\"\n", c) != NULL) {
        Ungetc(c, port);        /* the delimiter belongs to the caller */
        break;
      }
      if (isspace(c)) break;
    }

    if (len >= TKBUFFERN-1) Serror("token too large", NIL);
  }

  STk_tkbuffer[len] = '\0';
}
/*
 * read_char -- accumulate a character literal (a single char or a char
 * name) in STk_tkbuffer; its first character is already in `c' and is
 * always stored, whatever it is.
 *
 * Reading stops at EOF, at white space (consumed) or at one of
 * ( ) [ ] ' ` , ; " (pushed back on the port). The buffer is NUL-terminated
 * on exit. A token that fills the buffer is reported with "token too large".
 *
 * NOTE(review): a newline that ends the token is consumed here without
 * incrementing STk_line_counter, whereas read_word pushes it back --
 * confirm whether this difference is intended.
 */
static void read_char(SCM port, int c)
{
  int len = 0;

  do {
    STk_tkbuffer[len++] = c;

    c = Getc(port);
    if (c == EOF || isspace(c)) break;

    if (strchr("()[]'`,;\"", c) != NULL) {
      Ungetc(c, port);          /* the delimiter belongs to the caller */
      break;
    }

    if (len >= TKBUFFERN-1) Serror("token too large", NIL);
  } while (1);

  STk_tkbuffer[len] = '\0';
}
/*
 * read_token -- read a word starting with `c' and turn it into an object.
 *
 * The word is first tried as a base-10 number with STk_Cstr2number. When
 * that yields Ntruth the word is not a number and its first character
 * decides:
 *    `:'        a keyword is built with STk_makekey
 *    `#'        error "bad # syntax"
 *    otherwise  the word is interned as a symbol
 */
static SCM read_token(SCM port, int c, int case_significant)
{
  SCM number;

  read_word(port, c, case_significant);

  number = STk_Cstr2number(STk_tkbuffer, 10L);
  if (number != Ntruth)
    return number;

  /* Not a number */
  if (STk_tkbuffer[0] == ':')
    return STk_makekey(STk_tkbuffer);

  if (STk_tkbuffer[0] == '#')
    Serror("bad # syntax", STk_makestring(STk_tkbuffer));

  return Intern(STk_tkbuffer);
}
static SCM read_cycle(SCM port, int c, int case_significant)
/* Read a datum label: either a reference "#n#" or a definition "#n=<datum>".
 * The leading "#" has been consumed by the caller and the first digit of n
 * is in c. The digits are collected in STk_tkbuffer; the character that
 * follows them selects the form:
 *    '#'  return the object recorded for label n in `cycles', or signal
 *         an error if n has not been defined;
 *    '='  read the following datum, record it under label n and return it,
 *         or signal an error if n is already defined;
 *    else push the character back and signal "bad # syntax".
 */
{
register int j = 0;
/* Collect the decimal digits of the label */
for( ; ; ) {
STk_tkbuffer[j++] = c;
c = Getc(port);
if (c == EOF || !isdigit(c)) break;
if (j >= TKBUFFERN-1) Serror("token too large", NIL);
}
STk_tkbuffer[j] = '\0';
/* NOTE(review): the label is converted with atoi below. atoi has undefined
 * behavior when the value does not fit in an int, and nothing here limits
 * the number of digits below the buffer size -- consider strtol plus a
 * range check.
 */
switch (c) {
case '#': {
/* Reference: look the label up in the association list */
SCM tmp, k = STk_makeinteger(atoi(STk_tkbuffer));
if ((tmp = STk_assv(k, cycles)) != Ntruth) {
return CDR(tmp);
}
else {
char buffer[70];
sprintf(buffer, "key ``#%d='' not defined", atoi(STk_tkbuffer));
Serror(buffer, NIL);
}
}
/* No break above: this relies on Serror not returning, otherwise control
 * would fall into the '=' case.
 */
case '=': {
/* Definition: the label must not be known yet */
SCM val, tmp, k = STk_makeinteger(atoi(STk_tkbuffer));
if ((tmp = STk_assv(k, cycles)) == Ntruth) {
/* This is a little bit tricky: we create a fake cell that can be
 * referenced (through #n#) while the labelled datum is being read.
 * Once that read is finished, the fake cell is overwritten with the
 * contents of the value it returned, so the fake cell becomes the
 * real result and every reference made to it now sees the datum.
 * ATTENTION: the value returned by the read can be of any type
 * (e.g. '(1 2 #0="ab" #0#) ). But all our cells have the same
 * size => no problem.
 * NOTE(review): the copy dereferences val, i.e. it presumes read_rec
 * returned a pointer to a real cell -- confirm this holds for every
 * kind of value the reader can produce.
 */
tmp = Cons(UNBOUND, UNBOUND); /* The fake cell */
/* Must be registered before the recursive read so that #n# can find it */
cycles = Cons(Cons(k, tmp), cycles); /* For next read */
val = read_rec(port, case_significant);/* Read item */
*tmp = *val; /* Overwrite the fake cell */
return tmp;
}
else {
char buffer[70];
sprintf(buffer, "key ``#%d='' already defined",
atoi(STk_tkbuffer))
;
Serror(buffer, NIL);
}
}
/* As above, falling into `default' is only prevented by Serror not returning */
default: Ungetc(c, port); Serror("bad # syntax", STk_makestring(STk_tkbuffer));
}
return UNBOUND; /* for the compiler */
}
/*
 * read_string -- read a string literal; the opening `"' has already been
 * consumed. Returns the string object built by STk_makestrg.
 *
 * Characters are gathered in a scratch buffer that grows by half its size
 * whenever it is about to become full. Recognized escapes:
 *    \b \e \n \r \t      backspace, escape (0x1b), linefeed, return, tab
 *    \<newline>          line continuation: nothing is stored
 *    \0ddd               up to three octal digits after the 0; the value
 *                        is truncated to 8 bits
 *    \<other>            the character itself (e.g. \" and \\)
 * Every newline read increments STk_line_counter.
 *
 * Errors (end of file inside the string or inside an escape) are signalled
 * with Serror. Serror does not come back here, so the scratch buffer is
 * released *before* each call; otherwise it would be leaked every time a
 * malformed string is read.
 */
static SCM read_string(SCM port)
{
  int k, c, n;
  size_t j, len;
  char *p, *buffer;
  SCM z;

  j = 0;
  len = 100;
  p = buffer = must_malloc(len);

  while (((c = Getc(port)) != '"') && (c != EOF)) {
    if (c == '\\') {
      c = Getc(port);
      if (c == EOF) {
        free(buffer);
        Serror("eof encountered after \\", NIL);
      }
      switch (c) {
        case 'b' : c = '\b'; break;			/* Bs  */
        case 'e' : c = 0x1b; break;			/* Esc */
        case 'n' : c = '\n'; break;			/* Lf  */
        case 'r' : c = '\r'; break;			/* Cr  */
        case 't' : c = '\t'; break;			/* Tab */
        case '\n': STk_line_counter += 1; continue;	/* line continuation */
        case '0' : for (k = n = 0; ; k++) {
                     c = Getc(port);
                     if (c == EOF) {
                       free(buffer);
                       Serror("eof encountered after \\0", NIL);
                     }
                     if (isdigit(c) && (c < '8') && k < 3) /* Max = 3 digits */
                       n = n * 8 + c - '0';
                     else {
                       Ungetc(c, port);
                       break;
                     }
                   }
                   c = n & 0xff;
                   break;
        default  : break;		/* any other char stands for itself */
      }
    }
    else
      if (c == '\n') STk_line_counter += 1;

    /* Keep room for this character and for the final '\0' */
    if ((j + 1) >= len) {
      len = len + len / 2;
      buffer = must_realloc(buffer, len);
      p = buffer + j;
    }
    j++;
    *p++ = c;
  }

  if (c == EOF) {
    free(buffer);
    Serror("end of file while reading a string", NIL);
  }

  *p = '\0';
  z = STk_makestrg(j, buffer);
  free(buffer);
  return z;
}
/*
 * skip_block_comment -- consume the body of a "#| ... |#" comment whose
 * opening "#|" has already been read.
 *
 * Reading stops right after the first `|' immediately followed by `#', or
 * at end of file. The previous character is remembered so that a
 * terminator preceded by extra bars (as in "||#") is recognized too.
 * The `|' of the opening "#|" does not count, so "#|#" does not close the
 * comment. Comments do not nest. Every newline skipped increments
 * STk_line_counter.
 */
static void skip_block_comment(SCM port)
{
  int prev = 0;			/* previous char of the body (0 = none yet) */
  int c;

  for ( ; ; ) {
    c = Getc(port);
    if (c == EOF) return;
    if (c == '\n') STk_line_counter += 1;
    if (c == '#' && prev == '|') return;
    prev = c;
  }
}

/*
 * read_rec -- read one datum from `port' and return it.
 *
 * Leading white space and `;' comments are skipped; end of file at that
 * point is an error ("end of file inside read encountered"). The first
 * significant character selects what is read:
 *    ( [        a list closed by ) or ] respectively
 *    ) ]        a warning is written on STk_curr_eport and reading goes on
 *    ' ` , ,@   the next datum wrapped in a two-element list headed by
 *               Sym_quote, Sym_quasiquote, Sym_unquote or Sym_unq_splicing
 *    "          a string
 *    #t #f      (either case) Truth / Ntruth
 *    #\         a character
 *    #(         a vector
 *    #!         the rest of the line is ignored
 *    #| ... |#  a block comment, ignored
 *    #p #P      a word passed to STk_address2object
 *    #.         the next datum is read and evaluated in the environment of
 *               the selected module
 *    #<digit>   a datum label (see read_cycle)
 *    #<other>   handed to read_token with '#' as first character
 *    otherwise  a number, keyword or symbol (see read_token)
 *
 * STk_eof_object is returned when the input ends inside a #! line or
 * right after a block comment.
 */
static SCM read_rec(SCM port, int case_significant)
{
  int c;

  for ( ; ; ) {
    c = flush_ws(port, "end of file inside read encountered");

    switch (c) {
      case '(':
        return(read_list(port, ')', case_significant));

      case '[':
        return(read_list(port, ']', case_significant));

      case ')':
      case ']':
        /* Stray closing bracket: complain, then try again with what follows */
        Puts("\nread: unexpected close parenthesis", STk_curr_eport);
        if (STk_current_filename != UNBOUND)
          Fprintf(STk_curr_eport, " at line %d in file %s",
                  STk_line_counter, CHARS(STk_current_filename));
        Putc('\n', STk_curr_eport);
        Flush(STk_curr_eport);
        break;

      case '\'':
        return LIST2(Sym_quote, read_rec(port, case_significant));

      case '`':
        return LIST2(Sym_quasiquote, read_rec(port, case_significant));

      case '#':
        /* Every branch below returns or restarts the loop, so control
         * never falls into the `,' case. */
        switch(c=Getc(port)) {
          case 't':
          case 'T': return Truth;
          case 'f':
          case 'F': return Ntruth;
          case '\\': read_char(port, Getc(port));
                     return STk_makechar(STk_string2char(STk_tkbuffer));
          case '(' : {
                       SCM l = read_list(port, ')', case_significant);
                       return STk_vector(l, STk_llength(l));
                     }
          case '!' : /* Ignore the line; the newline is pushed back so
                      * that flush_ws counts it */
                     while ((c=Getc(port)) != '\n')
                       if (c == EOF) return STk_eof_object;
                     Ungetc(c, port);
                     continue;
          case '|':  skip_block_comment(port);
                     c = flush_ws(port, (char *) NULL);
                     if (c == EOF) return STk_eof_object;
                     Ungetc(c,port);
                     continue;
          case 'p':
          case 'P': read_word(port, Getc(port), TRUE);
                    return STk_address2object(STk_tkbuffer);
          case '.': return STk_eval(read_rec(port, case_significant),
                                    MOD_ENV(STk_selected_module));
          case '0':
          case '1':
          case '2':
          case '3':
          case '4':
          case '5':
          case '6':
          case '7':
          case '8':
          case '9': return read_cycle(port, c, case_significant);
          default:  Ungetc(c, port); return read_token(port, '#', FALSE);
        }

      case ',': {
        SCM symb;

        c = Getc(port);
        if (c == '@')
          symb = Sym_unq_splicing;
        else {
          symb = Sym_unquote;
          Ungetc(c, port);
        }
        return LIST2(symb, read_rec(port, case_significant));
      }

      case '"':
        return read_string(port);

      default:
        return read_token(port, c, case_significant);
    }
  }
}
/*
 * STk_readf -- entry point of the reader: read one datum from `port'.
 *
 * `case_significant' is passed down to the token reader, which lower-cases
 * words when it is zero. The table of datum labels (`cycles') is emptied
 * before each read; while it still holds its initial NULL it is first
 * registered with STk_gc_protect.
 *
 * Returns STk_eof_object when only white space and comments remain on the
 * port, otherwise the object read.
 */
SCM STk_readf(SCM port, int case_significant)
{
  int first;

  if (cycles == NULL) {
    STk_gc_protect(&cycles);
  }
  cycles = NIL;

  first = flush_ws(port, (char *) NULL);
  if (first != EOF) {
    /* Something to read: give the char back and parse a full datum */
    Ungetc(first, port);
    return read_rec(port, case_significant);
  }
  return(STk_eof_object);
}