ref: e75314f9ae9f23f1bf38317673ba1c5dea52f1c0
parent: 415ef9f83bfad5d57697c0a4d9b0983fb8d2db18
author: Sigrid Solveig Haflínudóttir <sigrid@ftrv.se>
date: Tue Mar 25 13:28:21 EDT 2025
read: better whitespace handling
--- a/boot/sl.boot
+++ b/boot/sl.boot
@@ -426,8 +426,8 @@
#fn(del!)) remprop)
repl #fn("n0IIb4b5705042172514238424_5142385258485>2_51485<5047660:" #(*prompt* #fn(io-flush)
*io-out* #0#
- #fn("n02021{227351S;3q047484517585513M07584513@076504277851@30q@=079855147:5047;85w<61:" #(#fn("n02071D62:" #(#fn(read)
- *io-in*)) #fn("n1207151422061:" #(#fn(io-discardbuffer) *io-in* #fn(raise)))
+ #fn("n02021{227351S;3q047484517585513M07584513@076504277851@30q@=079855147:5047;85w<61:" #(#fn("n0207122D63:" #(#fn(read)
+ *io-in* :whitespace)) #fn("n1207151422061:" #(#fn(io-discardbuffer) *io-in* #fn(raise)))
#fn(io-eof?) *io-in* load-process void? *prompt* #fn(io-flush) *io-out* print newline void that) prompt)
#fn("n020A>121{370F<60:q:" #(#fn("n0A<60:")
#fn("n1700514D:" #(top-level-exception-handler))) reploop) newline) repl)
--- a/src/io.c
+++ b/src/io.c
@@ -6,7 +6,7 @@
#include "io.h"
static sl_v sl_linesym, sl_blocksym, sl_memorysym, sl_nonesym;
-static sl_v sl_ioinsym;
+static sl_v sl_ioinsym, sl_whitespace;
sl_v sl_iooutsym;
sl_type *sl_iotype;
@@ -146,11 +146,20 @@
BUILTIN("read", read)
{
- if(nargs > 1)
- argcount(nargs, 2);
+ bool ws = false;
+ if(nargs >= 2 && nargs <= 3){
+ int i;
+ if(args[i = 0] == sl_whitespace || (nargs > 2 && args[i = 1] == sl_whitespace)){
+ ws = args[++i] != sl_nil;
+ if(i < 2) // (read :whitespace T io)
+ args[0] = args[2];
+ nargs -= 2;
+ }
+ }
+ argcount(nargs, 1);
sl_v a = nargs == 0 ? sym_value(sl_ioinsym) : args[0];
sl_gc_handle(&a);
- sl_v v = sl_read_sexpr(a, nargs > 1 && args[1] == sl_t);
+ sl_v v = sl_read_sexpr(a, ws);
sl_free_gc_handles(1);
return ios_eof(toio(a)) ? sl_eof : v;
}
@@ -469,6 +478,7 @@
sl_linesym = mk_csym(":line");
sl_blocksym = mk_csym(":block");
sl_memorysym = mk_csym(":memory");
+ sl_whitespace = mk_csym(":whitespace");
sl_ioinsym = mk_csym("*io-in*");
sl_iooutsym = mk_csym("*io-out*");
sl_iotype = define_opaque_type(sl_iosym, sizeof(sl_ios), &io_vtable, nil);
--- a/src/read.c
+++ b/src/read.c
@@ -204,13 +204,16 @@
sl_fx x;
int ch, base;
- if(ctx->toktype != TOK_NONE)
+ if(ctx->toktype != TOK_NONE){
+ ctx->ws = false;
return ctx->toktype;
+ }
c = nextchar(ctx);
ctx->loc = RS->loc;
- ctx->ws = false;
- if(ios_eof(RS) || isspace(c))
+ if(ios_eof(RS) || isspace(c)){
+ ctx->ws = false;
return TOK_NONE;
+ }
if(c == '(')
ctx->toktype = TOK_OPEN;
else if(c == ')')
@@ -346,6 +349,7 @@
(c == 'x' && (base = 16))) && (isdigit_base(ctx->buf[1], base) || ctx->buf[1] == '-')){
if(!sl_read_numtok(&ctx->buf[1], &ctx->tokval, base))
parse_error(&ctx->loc, "invalid base %d constant", base);
+ ctx->ws = false;
return (ctx->toktype = TOK_NUM);
}
@@ -363,17 +367,23 @@
ctx->toktype = TOK_COMMAAT;
else if(ch == '.')
ctx->toktype = TOK_COMMADOT;
- else
+ else{
+ ctx->ws = false;
return ctx->toktype;
+ }
ios_getc(RS);
}else{
bool ok = read_token(ctx, c, 0);
const char *s = ctx->buf;
if(!ok){
- if(s[0] == '.' && s[1] == '\0')
+ if(s[0] == '.' && s[1] == '\0'){
+ ctx->ws = false;
return (ctx->toktype = TOK_DOT);
- if(sl_read_numtok(s, &ctx->tokval, 0))
+ }
+ if(sl_read_numtok(s, &ctx->tokval, 0)){
+ ctx->ws = false;
return (ctx->toktype = TOK_NUM);
+ }
}
ctx->toktype = TOK_SYM;
if(strcasecmp(s, "nil") == 0)
@@ -388,6 +398,7 @@
ctx->toktype = TOK_GENSYM;
}
}
+ ctx->ws = false;
return ctx->toktype;
}
--- a/src/system.sl
+++ b/src/system.sl
@@ -1346,7 +1346,7 @@
(*prompt*)
(io-flush *io-out*)
(def (prompt)
- (let ((v (trycatch (read *io-in* T)
+ (let ((v (trycatch (read *io-in* :whitespace T)
(λ (e) (io-discardbuffer *io-in*)
(raise e)))))
(and (not (io-eof? *io-in*))