From 1c42c18e9601ee1416d61663f5a91874954c524d Mon Sep 17 00:00:00 2001 From: Brian Foley Date: Sun, 6 Jan 2019 18:32:59 -0800 Subject: awk: Fix overly permissive func arg list parsing It allows things like 'func f(a b)' and 'func f(a,)' which GNU awk forbids. function old new delta parse_program 327 367 +40 chain_expr 40 67 +27 parse_expr 891 915 +24 EMSG_TOO_FEW_ARGS 30 18 -12 ------------------------------------------------------------------------------ (add/remove: 0/0 grow/shrink: 3/1 up/down: 91/-12) Total: 79 bytes Signed-off-by: Brian Foley Signed-off-by: Denys Vlasenko --- editors/awk.c | 15 ++++++++++++++- 1 file changed, 14 insertions(+), 1 deletion(-) (limited to 'editors') diff --git a/editors/awk.c b/editors/awk.c index 90edec8..d25508e 100644 --- a/editors/awk.c +++ b/editors/awk.c @@ -1613,12 +1613,25 @@ static void parse_program(char *p) f = newfunc(t_string); f->body.first = NULL; f->nargs = 0; - while (next_token(TC_VARIABLE | TC_SEQTERM) & TC_VARIABLE) { + /* Match func arg list: a comma sep list of >= 0 args, and a close paren */ + while (next_token(TC_VARIABLE | TC_SEQTERM | TC_COMMA)) { + /* Either an empty arg list, or trailing comma from prev iter + * must be followed by an arg */ + if (f->nargs == 0 && t_tclass == TC_SEQTERM) + break; + + /* TC_SEQSTART/TC_COMMA must be followed by TC_VARIABLE */ + if (t_tclass != TC_VARIABLE) + syntax_error(EMSG_UNEXP_TOKEN); + v = findvar(ahash, t_string); v->x.aidx = f->nargs++; + /* Arg followed either by end of arg list or 1 comma */ if (next_token(TC_COMMA | TC_SEQTERM) & TC_SEQTERM) break; + if (t_tclass != TC_COMMA) + syntax_error(EMSG_UNEXP_TOKEN); } seq = &f->body; chain_group(); -- cgit v1.1