diff options
author | Brian Foley <bpfoley@google.com> | 2019-01-06 18:32:59 -0800 |
---|---|---|
committer | Denys Vlasenko <vda.linux@googlemail.com> | 2019-01-21 12:59:19 +0100 |
commit | 1c42c18e9601ee1416d61663f5a91874954c524d (patch) | |
tree | 3ee100f9d73c739daa1effca974666a52d81c271 | |
parent | 08a514c097f1451678940a3178a9565b9d65a193 (diff) | |
download | busybox-w32-1c42c18e9601ee1416d61663f5a91874954c524d.tar.gz busybox-w32-1c42c18e9601ee1416d61663f5a91874954c524d.tar.bz2 busybox-w32-1c42c18e9601ee1416d61663f5a91874954c524d.zip |
awk: Fix overly permissive func arg list parsing
It allows things like 'func f(a b)' and 'func f(a,)' which GNU awk forbids.
function old new delta
parse_program 327 367 +40
chain_expr 40 67 +27
parse_expr 891 915 +24
EMSG_TOO_FEW_ARGS 30 18 -12
------------------------------------------------------------------------------
(add/remove: 0/0 grow/shrink: 3/1 up/down: 91/-12) Total: 79 bytes
Signed-off-by: Brian Foley <bpfoley@google.com>
Signed-off-by: Denys Vlasenko <vda.linux@googlemail.com>
-rw-r--r-- | editors/awk.c | 15 | ||||
-rwxr-xr-x | testsuite/awk.tests | 12 |
2 files changed, 26 insertions, 1 deletions
diff --git a/editors/awk.c b/editors/awk.c index 90edec82c..d25508e5d 100644 --- a/editors/awk.c +++ b/editors/awk.c | |||
@@ -1613,12 +1613,25 @@ static void parse_program(char *p) | |||
1613 | f = newfunc(t_string); | 1613 | f = newfunc(t_string); |
1614 | f->body.first = NULL; | 1614 | f->body.first = NULL; |
1615 | f->nargs = 0; | 1615 | f->nargs = 0; |
1616 | while (next_token(TC_VARIABLE | TC_SEQTERM) & TC_VARIABLE) { | 1616 | /* Match func arg list: a comma sep list of >= 0 args, and a close paren */ |
1617 | while (next_token(TC_VARIABLE | TC_SEQTERM | TC_COMMA)) { | ||
1618 | /* Either an empty arg list, or trailing comma from prev iter | ||
1619 | * must be followed by an arg */ | ||
1620 | if (f->nargs == 0 && t_tclass == TC_SEQTERM) | ||
1621 | break; | ||
1622 | |||
1623 | /* TC_SEQSTART/TC_COMMA must be followed by TC_VARIABLE */ | ||
1624 | if (t_tclass != TC_VARIABLE) | ||
1625 | syntax_error(EMSG_UNEXP_TOKEN); | ||
1626 | |||
1617 | v = findvar(ahash, t_string); | 1627 | v = findvar(ahash, t_string); |
1618 | v->x.aidx = f->nargs++; | 1628 | v->x.aidx = f->nargs++; |
1619 | 1629 | ||
1630 | /* Arg followed either by end of arg list or 1 comma */ | ||
1620 | if (next_token(TC_COMMA | TC_SEQTERM) & TC_SEQTERM) | 1631 | if (next_token(TC_COMMA | TC_SEQTERM) & TC_SEQTERM) |
1621 | break; | 1632 | break; |
1633 | if (t_tclass != TC_COMMA) | ||
1634 | syntax_error(EMSG_UNEXP_TOKEN); | ||
1622 | } | 1635 | } |
1623 | seq = &f->body; | 1636 | seq = &f->body; |
1624 | chain_group(); | 1637 | chain_group(); |
diff --git a/testsuite/awk.tests b/testsuite/awk.tests index 03fedf771..0db6a26e4 100755 --- a/testsuite/awk.tests +++ b/testsuite/awk.tests | |||
@@ -280,6 +280,18 @@ testing "awk 'delete a[v--]' evaluates v-- once" \ | |||
280 | " \ | 280 | " \ |
281 | "" "" | 281 | "" "" |
282 | 282 | ||
283 | testing "awk func arg parsing 1" \ | ||
284 | "awk 'func f(,) { }' 2>&1" "awk: cmd. line:1: Unexpected token\n" "" "" | ||
285 | |||
286 | testing "awk func arg parsing 2" \ | ||
287 | "awk 'func f(a,,b) { }' 2>&1" "awk: cmd. line:1: Unexpected token\n" "" "" | ||
288 | |||
289 | testing "awk func arg parsing 3" \ | ||
290 | "awk 'func f(a,) { }' 2>&1" "awk: cmd. line:1: Unexpected token\n" "" "" | ||
291 | |||
292 | testing "awk func arg parsing 4" \ | ||
293 | "awk 'func f(a b) { }' 2>&1" "awk: cmd. line:1: Unexpected token\n" "" "" | ||
294 | |||
283 | testing "awk handles empty ()" \ | 295 | testing "awk handles empty ()" \ |
284 | "awk 'BEGIN {print()}' 2>&1" "awk: cmd. line:1: Empty sequence\n" "" "" | 296 | "awk 'BEGIN {print()}' 2>&1" "awk: cmd. line:1: Empty sequence\n" "" "" |
285 | 297 | ||