diff options
author | Kaz Kylheku <kaz@kylheku.com> | 2015-04-19 10:34:28 -0700 |
---|---|---|
committer | Kaz Kylheku <kaz@kylheku.com> | 2015-04-19 10:34:28 -0700 |
commit | e68b978b40c53b7fef21056c2d1c1dff0b6bb729 (patch) | |
tree | 840e5567f64ca21add4b26871383f72b0898c5ce /parser.l | |
parent | f6d7a2ebaad679ff8db23b3e9aa6f5a724259f1b (diff) | |
download | txr-e68b978b40c53b7fef21056c2d1c1dff0b6bb729.tar.gz txr-e68b978b40c53b7fef21056c2d1c1dff0b6bb729.tar.bz2 txr-e68b978b40c53b7fef21056c2d1c1dff0b6bb729.zip |
Do not allow unrecognized escapes in regex.
* parser.l (REGOP): New regex alias for matching all regex
special characters.
(grammar): Several rules for regex special characters merged
together. New rule introduced to match a special character
after a backslash, making it literal. The old rule which makes
literal any character after a backslash now throws an error,
unless version 105 comaptibility is selected.
* txr.1: Documented this behavior change.
Diffstat (limited to 'parser.l')
-rw-r--r-- | parser.l | 25 |
1 files changed, 14 insertions, 11 deletions
@@ -49,6 +49,7 @@ #include "hash.h" #include "parser.h" #include "eval.h" +#include "txr.h" #include "y.tab.h" #define YY_INPUT(buf, result, max_size) \ @@ -198,6 +199,8 @@ WS [\t ]* HEX [0-9A-Fa-f] OCT [0-7] +REGOP [/()|.*?+~&%\[\]\-] + ASC [\x00-\x7f] ASCN [\x00-\t\v-\x7f] U [\x80-\xbf] @@ -741,24 +744,24 @@ UONLY {U2}{U}|{U3}{U}{U}|{U4}{U}{U}{U} return ERRTOK; } -<REGEX>[.*?+~&%] { +<REGEX>{REGOP} { yylval->chr = yytext[0]; return yytext[0]; } -<REGEX>[\[\]\-] { - yylval->chr = yytext[0]; - return yytext[0]; -} - -<REGEX>[()|] { - yylval->chr = yytext[0]; - return yytext[0]; +<REGEX>[\\]{REGOP} { + yylval->chr = yytext[1]; + return REGCHAR; } <REGEX>[\\]. { - yylval->chr = yytext[1]; - return REGCHAR; + if (opt_compat && opt_compat <= 105) { + yylval->chr = yytext[1]; + return REGCHAR; + } + + yyerrprepf(yyg, lit("unrecognized escape in regex"), nao); + return ERRTOK; } <REGEX>[\\] { |