diff options
author | Kaz Kylheku <kaz@kylheku.com> | 2017-03-06 20:53:48 -0800 |
---|---|---|
committer | Kaz Kylheku <kaz@kylheku.com> | 2017-03-06 20:53:48 -0800 |
commit | fd87267eb4802d1e3ec3c22a48e09a86f76810ad (patch) | |
tree | 8760a2fb325d259e5e86983b20f690ee08da93c4 /parser.y | |
parent | 266e28cb7129d175ad4af5af5cb45fbbd3054862 (diff) | |
download | txr-fd87267eb4802d1e3ec3c22a48e09a86f76810ad.tar.gz txr-fd87267eb4802d1e3ec3c22a48e09a86f76810ad.tar.bz2 txr-fd87267eb4802d1e3ec3c22a48e09a86f76810ad.zip |
uref: the a.b.c syntax extended to .a.b.c
Now it is possible to use a leading dot on the referencing
dot syntax. This is the is the "unbound reference dot". It
expands to the uref macro, which denotes an unbound-reference:
it produces a function which takes an object as the argument,
and curries the reference implied by the remaining arguments.
* eval.c (uref_s): New global symbol variable.
(eval_init): Intern uref symbol and init uref_s.
* eval.h (uref_s): Declared.
* lib.c (simple_qref_args_p): A qref expression is now
also not simple if it contains an embedded uref, meaning
that it cannot be rendered into the dot notation without
ambiguity.
(obj_print_impl): Support printing (uref a b c) as .a.b.c.
* lisplib.c (struct_set_entries): Add uref to the list of
autoload triggers for struct.tl.
* parser.l (DOTDOT): Consume any leading whitespace as part
of recognizing the DOTDOT token. Otherwise the new rule
for UREFDOT, which matches (mandatory) leading space
will take precedence, causing " .." to be scanned wrong.
(UREFDOT): Rule for new kind of dot token, which is
preceded by mandatory whitespace, and isn't consing
dot (which has mandatory trailing whitespace too,
matched by an earlier rule).
* parser.y (UREFDOT): New token type.
(i_dot_expr, n_dot_expr): New grammar rules.
(list): Handle a leading dot on the first element of a list as
a special case. Things are done this way because trying to
work a UREFDOT into the grammar otherwise causes intractable
conflicts.
(i_expr): The ^, ' and , punctuators are now followed by
an i_dot_expr, so that the expression can be an unbound
dot.
(n_expr): Same change as in i_expr, but using n_dot_expr.
Plus new UREFDOT n_expr production.
* share/txr/stdlib/struct.tl (uref): New macro.
* txr.1: Documented.
Diffstat (limited to 'parser.y')
-rw-r--r-- | parser.y | 67 |
1 files changed, 54 insertions, 13 deletions
@@ -123,7 +123,7 @@ INLINE val expand_form_ver(val form, int ver) %token <val> NUMBER METANUM %token <val> HASH_N_EQUALS HASH_N_HASH -%token <chr> REGCHAR REGTOKEN LITCHAR SPLICE CONSDOT LAMBDOT +%token <chr> REGCHAR REGTOKEN LITCHAR SPLICE CONSDOT LAMBDOT UREFDOT %type <val> spec hash_semi_or_n_expr hash_semi_or_i_expr %type <val> clauses_rev clauses_opt clause @@ -135,7 +135,8 @@ INLINE val expand_form_ver(val form, int ver) %type <val> if_clause elif_clauses_opt else_clause_opt %type <val> line elems_opt elems clause_parts_h additional_parts_h %type <val> text texts elem var var_op modifiers vector hash struct range -%type <val> list exprs exprs_opt n_exprs r_exprs i_expr n_expr n_exprs_opt +%type <val> list exprs exprs_opt n_exprs r_exprs i_expr i_dot_expr +%type <val> n_expr n_exprs_opt n_dot_expr %type <val> out_clauses out_clauses_opt out_clause %type <val> repeat_clause repeat_parts_opt o_line %type <val> o_elems_opt o_elems o_elem o_var q_var rep_elem rep_parts_opt @@ -157,7 +158,7 @@ INLINE val expand_form_ver(val form, int ver) %left '|' '/' %left '&' %right '~' '*' '?' '+' '%' -%right '.' CONSDOT LAMBDOT REGCHAR REGTOKEN LITCHAR +%right '.' CONSDOT LAMBDOT UREFDOT REGCHAR REGTOKEN LITCHAR %right DOTDOT %% @@ -833,6 +834,23 @@ range : HASH_R list { if (length($2) != two) ; list : '(' n_exprs ')' { $$ = rl($2, num($1)); } + | '(' '.' n_exprs ')' { val a = car($3); + if (consp(a) && car(a) == qref_s) { + rplaca(a, uref_s); + $$ = $3; + } else { + $$ = cons(rl(rlcp(list(uref_s, a, nao), a), + num(parser->lineno)), cdr($3)); + } } + | '[' '.' n_exprs ']' { val a = car($3); + if (consp(a) && car(a) == qref_s) { + rplaca(a, uref_s); + $$ = rl(cons(dwim_s, $3), num($1)); + } else { + val ur = cons(rl(rlcp(list(uref_s, a, nao), a), + num(parser->lineno)), cdr($3)); + $$ = rl(cons(dwim_s, ur), num($1)); + } } | '(' ')' { $$ = nil; } | '(' LAMBDOT n_expr ')' { $$ = $3; } | '(' CONSDOT n_expr ')' { $$ = $3; } @@ -923,20 +941,28 @@ i_expr : SYMTOK { $$ = symhlpr($1, t); } | quasilit { $$ = $1; } | WORDS wordslit { $$ = rl($2, num($1)); } | QWORDS wordsqlit { $$ = rl(cons(quasilist_s, $2), num($1)); } - | '\'' i_expr { $$ = rl(rlcp(list(quote_s, $2, nao), $2), + | '\'' i_dot_expr { $$ = rl(rlcp(list(quote_s, $2, nao), $2), num(parser->lineno)); } - | '^' i_expr { $$ = rl(rlcp(list(sys_qquote_s, $2, nao), $2), + | '^' i_dot_expr { $$ = rl(rlcp(list(sys_qquote_s, $2, nao), $2), num(parser->lineno)); } - | ',' i_expr { $$ = rl(rlcp(list(sys_unquote_s, $2, nao), $2), + | ',' i_dot_expr { $$ = rl(rlcp(list(sys_unquote_s, $2, nao), $2), num(parser->lineno)); } - | SPLICE i_expr { $$ = rl(rlcp(list(sys_splice_s, $2, nao), $2), + | SPLICE i_dot_expr { $$ = rl(rlcp(list(sys_splice_s, $2, nao), $2), num(parser->lineno)); } | HASH_N_EQUALS { parser_circ_def(parser, $1, unique_s); } - i_expr { parser_circ_def(parser, $1, $3); + i_dot_expr { parser_circ_def(parser, $1, $3); $$ = $3; } | HASH_N_HASH { $$ = parser_circ_ref(parser, $1); } ; +i_dot_expr : '.' i_expr { if (consp($2) && car($2) == qref_s) { + $$ = rplaca($2, uref_s); + } else { + $$ = rl(rlcp(list(uref_s, $2, nao), $2), + num(parser->lineno)); + } } + | i_expr %prec LOW { $$ = $1; } + ; n_expr : SYMTOK { $$ = symhlpr($1, t); } | METANUM { $$ = cons(var_s, cons($1, nil)); rl($$, num(parser->lineno)); } @@ -952,13 +978,13 @@ n_expr : SYMTOK { $$ = symhlpr($1, t); } | quasilit { $$ = $1; } | WORDS wordslit { $$ = rl($2, num($1)); } | QWORDS wordsqlit { $$ = rl(cons(quasilist_s, $2), num($1)); } - | '\'' n_expr { $$ = rl(rlcp(list(quote_s, $2, nao), $2), + | '\'' n_dot_expr { $$ = rl(rlcp(list(quote_s, $2, nao), $2), num(parser->lineno)); } - | '^' n_expr { $$ = rl(rlcp(list(sys_qquote_s, $2, nao), $2), + | '^' n_dot_expr { $$ = rl(rlcp(list(sys_qquote_s, $2, nao), $2), num(parser->lineno)); } - | ',' n_expr { $$ = rl(rlcp(list(sys_unquote_s, $2, nao), $2), + | ',' n_dot_expr { $$ = rl(rlcp(list(sys_unquote_s, $2, nao), $2), num(parser->lineno)); } - | SPLICE n_expr { $$ = rl(rlcp(list(sys_splice_s, $2, nao), $2), + | SPLICE n_dot_expr { $$ = rl(rlcp(list(sys_splice_s, $2, nao), $2), num(parser->lineno)); } | n_expr DOTDOT n_expr { uses_or2; $$ = rlcp(list(rcons_s, $1, $3, nao), @@ -973,8 +999,14 @@ n_expr : SYMTOK { $$ = symhlpr($1, t); } or2($1, $3)), num(parser->lineno)); } } + | UREFDOT n_expr { if (consp($2) && car($2) == qref_s) { + $$ = rplaca($2, uref_s); + } else { + $$ = rl(rlcp(list(uref_s, $2, nao), $2), + num(parser->lineno)); + } } | HASH_N_EQUALS { parser_circ_def(parser, $1, unique_s); } - n_expr { parser_circ_def(parser, $1, $3); + n_dot_expr { parser_circ_def(parser, $1, $3); $$ = $3; } | HASH_N_HASH { $$ = parser_circ_ref(parser, $1); } ; @@ -983,6 +1015,15 @@ n_exprs_opt : n_exprs { $$ = $1; } | /* empty */ { $$ = nil; } ; +n_dot_expr : '.' n_expr { if (consp($2) && car($2) == qref_s) { + $$ = rplaca($2, uref_s); + } else { + $$ = rl(rlcp(list(uref_s, $2, nao), $2), + num(parser->lineno)); + } } + | n_expr %prec LOW { $$ = $1; } + ; + regex : '/' regexpr '/' { $$ = regex_compile($2, nil); end_of_regex(scnr); rl($$, num(parser->lineno)); } |