parser: fix problems at EOF involving #; syntax.

This patch addresses a problem whereby if a TXR Lisp file ends with an erased object notation such as #;(a b c), there is a syntax error. The strategy is to simplify the grammar so that a single yyparse primed with SECRET_ESCAPE_E or SECRET_ESCAPE_I will read either an object, or just one instance of the #; notation. If #;OBJ is read, then the parse tree is returned as the nao value. The caller knows that #;OBJ must have occurred because there are no errors and the parser isn't at EOF, yet there is no parse tree. Then in lisp_parse we can loop on this situation, and make adjustments elsewhere also. So that iread continues to work, we must separate the parser_eof condition from the lookahead token. Under iread, we were clearing the token in prime_parser_post, but that was having the side effect of making the parser look like it is in EOF. We now preserve the EOF indication in a flag, so we can manipulate the token. * parser.h (struct parser): new member, eof. * parser.c (parser_common_init): Initialize new eof flag in parser structure to zero. (prime_parser_post): Set the eof flag if the parser's most recent token is zero. (lisp_parse_impl): Call the parser repeatedly while there are no errors, and no EOF, yet no object has been produced. This indicates that a #; erasure has been processed. (read_eval_stream): Restructure the logic here for clarity. Do not break the loop if error_val was returned from the parser, but there are no errors, and the parser isn't at EOF. This behavior is probably redundant with respect to the loop in lisp_parse_impl. (read_eval_ret_last): Bugfixes here. Pass an error-indicating value down to lisp_parse, like in read_eval_stream and make the logic similar. (parser_eof): Just return an indication based on the eof flag. * parser.y (hash_semis_n_expr, hash_semis_i_expr, ignored_i_exprs, ignored_n_exprs): Grammar rules removed. (hash_semi_or_n_expr, hash_semi_or_i_expr): New grammar rules. 
(spec): Retarget SECRET_ESCAPE_E and SECRET_ESCAPE_I cases to new rules. (parse): Clear eof flag to zero.
author: Kaz Kylheku <kaz@kylheku.com> 2016-12-06 21:56:25 -0800
committer: Kaz Kylheku <kaz@kylheku.com> 2016-12-06 21:56:25 -0800
commit: 600f1bda2366b82d1492eb04a7419d12f199349b (patch)
tree: 7fac52f0b0d3462ef8954b481133351a77ff17e0 /parser.c
parent: 5eaf38e345aafce2f09cafb2195608333cc6f92a (diff)
download: txr-600f1bda2366b82d1492eb04a7419d12f199349b.tar.gz
txr-600f1bda2366b82d1492eb04a7419d12f199349b.tar.bz2
txr-600f1bda2366b82d1492eb04a7419d12f199349b.zip
1 files changed, 29 insertions, 10 deletions
diff --git a/parser.c b/parser.c
index f4f1c1ce..f2a7e310 100644
--- a/parser.c
+++ b/parser.c
@@ -109,6 +109,7 @@ void parser_common_init(parser_t *p)
   p->parser = nil;
   p->lineno = 1;
   p->errors = 0;
+  p->eof = 0;
   p->stream = nil;
   p->name = nil;
   p->prepared_msg = nil;
@@ -201,6 +202,7 @@ void prime_parser(parser_t *p, val name, enum prime_parser prim)
 
 void prime_parser_post(parser_t *p, enum prime_parser prim)
 {
+  p->eof = (p->recent_tok.yy_char == 0);
   if (prim == prime_interactive)
     p->recent_tok.yy_char = 0;
 }
@@ -524,14 +526,20 @@ static val lisp_parse_impl(val interactive, val source_in, val error_stream,
 
   env_vbind(dyn_env, stderr_s, error_stream);
 
-  {
+  for (;;) {
     int gc = gc_state(0);
     enum prime_parser prime = if3(interactive, prime_interactive, prime_lisp);
     parse(pi, if3(std_error != std_null, name, lit("")), prime);
     gc_state(gc);
-    parsed = t;
+
+    if (pi->syntax_tree == nao && pi->errors == 0 && !parser_eof(parser))
+      continue;
+
+    break;
   }
 
+  parsed = t;
+
   uw_unwind {
     dyn_env = saved_dyn;
     if (!parsed) {
@@ -587,12 +595,15 @@ val read_eval_stream(val stream, val error_stream, val hash_bang_support)
     val parser = get_parser(stream);
 
     if (form == error_val) {
-      if (parser_errors(parser) == zero)
+      if (parser_errors(parser) != zero)
+        return nil;
+      if (parser_eof(parser))
         break;
-      return nil;
+      continue;
     }
 
     (void) eval_intrinsic(form, nil);
+
     if (parser_eof(parser))
       break;
   }
@@ -858,19 +869,27 @@ static val read_eval_ret_last(val env, val counter,
                               val in_stream, val out_stream)
 {
   val lineno = one;
+  val error_val = gensym(nil);
   val name = format(nil, lit("paste-~a"), counter, nao);
+  val value = nil;
 
   for (;; lineno = succ(lineno)) {
-    val form = lisp_parse(in_stream, out_stream, colon_k, name, lineno);
+    val form = lisp_parse(in_stream, out_stream, error_val, name, lineno);
     val parser = get_parser(in_stream);
-    val value = eval_intrinsic(form, nil);
 
-    if (parser_eof(parser)) {
-      prinl(value, out_stream);
-      break;
+    if (form == error_val) {
+      if (parser_errors(parser) != zero || parser_eof(parser))
+        break;
+      continue;
     }
+
+    value = eval_intrinsic(form, nil);
+
+    if (parser_eof(parser))
+      break;
   }
 
+  prinl(value, out_stream);
   return t;
 }
 
@@ -1071,7 +1090,7 @@ val parser_errors(val parser)
 val parser_eof(val parser)
 {
   parser_t *p = coerce(parser_t *, cobj_handle(parser, parser_s));
-  return tnil(p->recent_tok.yy_char == 0);
+  return tnil(p->eof);
 }
 
 static val circref(val n)
author	Kaz Kylheku <kaz@kylheku.com>	2016-12-06 21:56:25 -0800
committer	Kaz Kylheku <kaz@kylheku.com>	2016-12-06 21:56:25 -0800
commit	600f1bda2366b82d1492eb04a7419d12f199349b (patch)
tree	7fac52f0b0d3462ef8954b481133351a77ff17e0 /parser.c
parent	5eaf38e345aafce2f09cafb2195608333cc6f92a (diff)
download	txr-600f1bda2366b82d1492eb04a7419d12f199349b.tar.gz txr-600f1bda2366b82d1492eb04a7419d12f199349b.tar.bz2 txr-600f1bda2366b82d1492eb04a7419d12f199349b.zip