diff options
-rw-r--r-- | lpcode.c | 43 | ||||
-rw-r--r-- | lpprint.c | 8 | ||||
-rw-r--r-- | lptree.c | 27 | ||||
-rw-r--r-- | lptree.h | 2 | ||||
-rw-r--r-- | lpvm.c | 26 | ||||
-rw-r--r-- | lpvm.h | 3 | ||||
-rw-r--r-- | testlabel.lua | 36 |
7 files changed, 123 insertions, 22 deletions
@@ -196,8 +196,8 @@ int checkaux (TTree *tree, int pred) { | |||
196 | if (checkaux(sib2(tree), pred)) return 1; | 196 | if (checkaux(sib2(tree), pred)) return 1; |
197 | /* else return checkaux(sib1(tree), pred); */ | 197 | /* else return checkaux(sib1(tree), pred); */ |
198 | tree = sib1(tree); goto tailcall; | 198 | tree = sib1(tree); goto tailcall; |
199 | case TLabChoice: /* labeled failure */ | 199 | case TLabChoice: case TRecov: /* labeled failure */ |
200 | /* in a labeled ordered choice we do not know whether sib2 will be evaluated */ | 200 | /* we do not know whether sib2 will be evaluated */ |
201 | tree = sib1(tree); goto tailcall; | 201 | tree = sib1(tree); goto tailcall; |
202 | case TCapture: case TGrammar: case TRule: | 202 | case TCapture: case TGrammar: case TRule: |
203 | /* return checkaux(sib1(tree), pred); */ | 203 | /* return checkaux(sib1(tree), pred); */ |
@@ -231,7 +231,7 @@ int fixedlenx (TTree *tree, int count, int len) { | |||
231 | return -1; /* may be a loop */ | 231 | return -1; /* may be a loop */ |
232 | /* else return fixedlenx(sib2(tree), count); */ | 232 | /* else return fixedlenx(sib2(tree), count); */ |
233 | tree = sib2(tree); goto tailcall; | 233 | tree = sib2(tree); goto tailcall; |
234 | case TSeq: { | 234 | case TSeq: case TRecov: { /* labeled failure */ |
235 | len = fixedlenx(sib1(tree), count, len); | 235 | len = fixedlenx(sib1(tree), count, len); |
236 | if (len < 0) return -1; | 236 | if (len < 0) return -1; |
237 | /* else return fixedlenx(sib2(tree), count, len); */ | 237 | /* else return fixedlenx(sib2(tree), count, len); */ |
@@ -294,6 +294,12 @@ static int getfirst (TTree *tree, const Charset *follow, Charset *firstset) { | |||
294 | loopset(i, firstset->cs[i] |= csaux.cs[i]); | 294 | loopset(i, firstset->cs[i] |= csaux.cs[i]); |
295 | return e1 | e2; | 295 | return e1 | e2; |
296 | } | 296 | } |
297 | case TRecov: { /* labeled failure */ | ||
298 | /* when p1 is not nullable, p2 has nothing to contribute; | ||
299 | and when p1 is nullable, then p2 will not match | ||
300 | return getfirst(sib1(tree), fullset, firstset); */ | ||
301 | tree = sib1(tree); follow = fullset; goto tailcall; | ||
302 | } | ||
297 | case TSeq: { | 303 | case TSeq: { |
298 | if (!nullable(sib1(tree))) { | 304 | if (!nullable(sib1(tree))) { |
299 | /* when p1 is not nullable, p2 has nothing to contribute; | 305 | /* when p1 is not nullable, p2 has nothing to contribute; |
@@ -372,7 +378,7 @@ static int headfail (TTree *tree) { | |||
372 | if (!nofail(sib2(tree))) return 0; | 378 | if (!nofail(sib2(tree))) return 0; |
373 | /* else return headfail(sib1(tree)); */ | 379 | /* else return headfail(sib1(tree)); */ |
374 | tree = sib1(tree); goto tailcall; | 380 | tree = sib1(tree); goto tailcall; |
375 | case TChoice: case TLabChoice: /* labeled failure */ | 381 | case TChoice: case TLabChoice: case TRecov: /* labeled failure */ |
376 | if (!headfail(sib1(tree))) return 0; | 382 | if (!headfail(sib1(tree))) return 0; |
377 | /* else return headfail(sib2(tree)); */ | 383 | /* else return headfail(sib2(tree)); */ |
378 | tree = sib2(tree); goto tailcall; | 384 | tree = sib2(tree); goto tailcall; |
@@ -392,7 +398,7 @@ static int needfollow (TTree *tree) { | |||
392 | case TChar: case TSet: case TAny: | 398 | case TChar: case TSet: case TAny: |
393 | case TFalse: case TTrue: case TAnd: case TNot: | 399 | case TFalse: case TTrue: case TAnd: case TNot: |
394 | case TRunTime: case TGrammar: case TCall: case TBehind: | 400 | case TRunTime: case TGrammar: case TCall: case TBehind: |
395 | case TThrow: case TLabChoice: /* (?)labeled failure */ | 401 | case TThrow: case TLabChoice: case TRecov: /* (?)labeled failure */ |
396 | return 0; | 402 | return 0; |
397 | case TChoice: case TRep: | 403 | case TChoice: case TRep: |
398 | return 1; | 404 | return 1; |
@@ -427,7 +433,7 @@ int sizei (const Instruction *i) { | |||
427 | return 2; | 433 | return 2; |
428 | case IThrow: /* labeled failure */ | 434 | case IThrow: /* labeled failure */ |
429 | return 1; | 435 | return 1; |
430 | case ILabChoice: | 436 | case ILabChoice: case IRecov: |
431 | return (CHARSETINSTSIZE - 1) + 2; /* labeled failure */ | 437 | return (CHARSETINSTSIZE - 1) + 2; /* labeled failure */ |
432 | default: return 1; | 438 | default: return 1; |
433 | } | 439 | } |
@@ -492,7 +498,8 @@ static int addinstruction (CompileState *compst, Opcode op, int aux) { | |||
492 | static int addoffsetinst (CompileState *compst, Opcode op) { | 498 | static int addoffsetinst (CompileState *compst, Opcode op) { |
493 | int i = addinstruction(compst, op, 0); /* instruction */ | 499 | int i = addinstruction(compst, op, 0); /* instruction */ |
494 | addinstruction(compst, (Opcode)0, 0); /* open space for offset */ | 500 | addinstruction(compst, (Opcode)0, 0); /* open space for offset */ |
495 | assert(op == ITestSet || sizei(&getinstr(compst, i)) == 2); | 501 | assert(op == ITestSet || sizei(&getinstr(compst, i)) == 2 || |
502 | op == IRecov || op == ILabChoice); /* labeled failure */ | ||
496 | return i; | 503 | return i; |
497 | } | 504 | } |
498 | 505 | ||
@@ -714,6 +721,21 @@ static void codelabchoice (CompileState *compst, TTree *p1, TTree *p2, int opt, | |||
714 | codegen(compst, p2, opt, NOINST, fl); | 721 | codegen(compst, p2, opt, NOINST, fl); |
715 | jumptohere(compst, pcommit); | 722 | jumptohere(compst, pcommit); |
716 | } | 723 | } |
724 | |||
725 | static void coderecovery (CompileState *compst, TTree *p1, TTree *p2, int opt, | ||
726 | const Charset *fl, const byte *cs) { | ||
727 | int emptyp2 = (p2->tag == TTrue); | ||
728 | int pcommit; | ||
729 | int test = NOINST; | ||
730 | int precovery = addoffsetinst(compst, IRecov); | ||
731 | addcharset(compst, cs); | ||
732 | codegen(compst, p1, emptyp2, test, fullset); | ||
733 | pcommit = addoffsetinst(compst, ICommit); | ||
734 | jumptohere(compst, precovery); | ||
735 | jumptohere(compst, test); | ||
736 | codegen(compst, p2, opt, NOINST, fl); | ||
737 | jumptohere(compst, pcommit); | ||
738 | } | ||
717 | /* labeled failure end */ | 739 | /* labeled failure end */ |
718 | 740 | ||
719 | 741 | ||
@@ -951,6 +973,10 @@ static void codegen (CompileState *compst, TTree *tree, int opt, int tt, | |||
951 | codelabchoice(compst, sib1(tree), sib2(tree), opt, fl, treelabelset(tree)); | 973 | codelabchoice(compst, sib1(tree), sib2(tree), opt, fl, treelabelset(tree)); |
952 | break; | 974 | break; |
953 | } | 975 | } |
976 | case TRecov: { /* labeled failure */ | ||
977 | coderecovery(compst, sib1(tree), sib2(tree), opt, fl, treelabelset(tree)); | ||
978 | break; | ||
979 | } | ||
954 | default: assert(0); | 980 | default: assert(0); |
955 | } | 981 | } |
956 | } | 982 | } |
@@ -972,7 +998,8 @@ static void peephole (CompileState *compst) { | |||
972 | redo: | 998 | redo: |
973 | switch (code[i].i.code) { | 999 | switch (code[i].i.code) { |
974 | case IChoice: case ICall: case ICommit: case IPartialCommit: | 1000 | case IChoice: case ICall: case ICommit: case IPartialCommit: |
975 | case IBackCommit: case ITestChar: case ITestSet: case ILabChoice: /* labeled failure */ | 1001 | case IBackCommit: case ITestChar: case ITestSet: |
1002 | case ILabChoice: case IRecov: /* labeled failure */ | ||
976 | case ITestAny: { /* instructions with labels */ | 1003 | case ITestAny: { /* instructions with labels */ |
977 | jumptothere(compst, i, finallabel(code, i)); /* optimize label */ | 1004 | jumptothere(compst, i, finallabel(code, i)); /* optimize label */ |
978 | break; | 1005 | break; |
@@ -61,7 +61,7 @@ void printinst (const Instruction *op, const Instruction *p) { | |||
61 | "choice", "jmp", "call", "open_call", | 61 | "choice", "jmp", "call", "open_call", |
62 | "commit", "partial_commit", "back_commit", "failtwice", "fail", "giveup", | 62 | "commit", "partial_commit", "back_commit", "failtwice", "fail", "giveup", |
63 | "fullcapture", "opencapture", "closecapture", "closeruntime", | 63 | "fullcapture", "opencapture", "closecapture", "closeruntime", |
64 | "throw", "labeled_choice" /* labeled failure */ | 64 | "throw", "labeled_choice", "recovery" /* labeled failure */ |
65 | }; | 65 | }; |
66 | printf("%02ld: %s ", (long)(p - op), names[p->i.code]); | 66 | printf("%02ld: %s ", (long)(p - op), names[p->i.code]); |
67 | switch ((Opcode)p->i.code) { | 67 | switch ((Opcode)p->i.code) { |
@@ -112,7 +112,7 @@ void printinst (const Instruction *op, const Instruction *p) { | |||
112 | printf("%d", p->i.aux); | 112 | printf("%d", p->i.aux); |
113 | break; | 113 | break; |
114 | } | 114 | } |
115 | case ILabChoice: { /* labeled failure */ | 115 | case ILabChoice: case IRecov: { /* labeled failure */ |
116 | printjmp(op, p); | 116 | printjmp(op, p); |
117 | printcharset((p+2)->buff); | 117 | printcharset((p+2)->buff); |
118 | break; | 118 | break; |
@@ -165,7 +165,7 @@ static const char *tagnames[] = { | |||
165 | "call", "opencall", "rule", "grammar", | 165 | "call", "opencall", "rule", "grammar", |
166 | "behind", | 166 | "behind", |
167 | "capture", "run-time", | 167 | "capture", "run-time", |
168 | "throw", "labeled-choice" /* labeled failure */ | 168 | "throw", "labeled-choice", "recov" /* labeled failure */ |
169 | }; | 169 | }; |
170 | 170 | ||
171 | 171 | ||
@@ -223,7 +223,7 @@ void printtree (TTree *tree, int ident) { | |||
223 | default: { | 223 | default: { |
224 | int sibs = numsiblings[tree->tag]; | 224 | int sibs = numsiblings[tree->tag]; |
225 | printf("\n"); | 225 | printf("\n"); |
226 | if (tree->tag == TLabChoice) { /* labeled failure */ | 226 | if (tree->tag == TLabChoice || tree->tag == TRecov) { /* labeled failure */ |
227 | printcharset(treelabelset(tree)); | 227 | printcharset(treelabelset(tree)); |
228 | printf("\n"); | 228 | printf("\n"); |
229 | } | 229 | } |
@@ -28,7 +28,7 @@ const byte numsiblings[] = { | |||
28 | 0, 0, 2, 1, /* call, opencall, rule, grammar */ | 28 | 0, 0, 2, 1, /* call, opencall, rule, grammar */ |
29 | 1, /* behind */ | 29 | 1, /* behind */ |
30 | 1, 1, /* capture, runtime capture */ | 30 | 1, 1, /* capture, runtime capture */ |
31 | 0, 2 /* labeled failure throw, labeled choice */ | 31 | 0, 2, 2 /* labeled failure throw, labeled choice, recovery */ |
32 | }; | 32 | }; |
33 | 33 | ||
34 | 34 | ||
@@ -525,12 +525,12 @@ static TTree *newthrowleaf (lua_State *L, int lab) { | |||
525 | return tree; | 525 | return tree; |
526 | } | 526 | } |
527 | 527 | ||
528 | static TTree *newlabchoice (lua_State *L) { | 528 | static TTree *newrootlab2sib (lua_State *L, int tag) { |
529 | int s1, s2; | 529 | int s1, s2; |
530 | TTree *tree1 = getpatt(L, 1, &s1); | 530 | TTree *tree1 = getpatt(L, 1, &s1); |
531 | TTree *tree2 = getpatt(L, 2, &s2); | 531 | TTree *tree2 = getpatt(L, 2, &s2); |
532 | TTree *tree = newtree(L, bytes2slots(LABELSETSIZE) + 1 + s1 + s2); /* create new tree */ | 532 | TTree *tree = newtree(L, bytes2slots(LABELSETSIZE) + 1 + s1 + s2); /* create new tree */ |
533 | tree->tag = TLabChoice; | 533 | tree->tag = tag; |
534 | tree->u.s.ps = 1 + s1; | 534 | tree->u.s.ps = 1 + s1; |
535 | tree->u.s.plab = 1 + s1 + s2; | 535 | tree->u.s.plab = 1 + s1 + s2; |
536 | memcpy(sib1(tree), tree1, s1 * sizeof(TTree)); | 536 | memcpy(sib1(tree), tree1, s1 * sizeof(TTree)); |
@@ -733,7 +733,7 @@ static int lp_throw (lua_State *L) { | |||
733 | */ | 733 | */ |
734 | static int lp_labchoice (lua_State *L) { | 734 | static int lp_labchoice (lua_State *L) { |
735 | int n = lua_gettop(L); | 735 | int n = lua_gettop(L); |
736 | TTree *tree = newlabchoice(L); | 736 | TTree *tree = newrootlab2sib(L, TLabChoice); |
737 | int i; | 737 | int i; |
738 | for (i = 3; i <= n; i++) { | 738 | for (i = 3; i <= n; i++) { |
739 | int d = luaL_checkinteger(L, i); | 739 | int d = luaL_checkinteger(L, i); |
@@ -742,6 +742,24 @@ static int lp_labchoice (lua_State *L) { | |||
742 | } | 742 | } |
743 | return 1; | 743 | return 1; |
744 | } | 744 | } |
745 | |||
746 | |||
747 | static int lp_recovery (lua_State *L) { | ||
748 | int n = lua_gettop(L); | ||
749 | TTree *tree = newrootlab2sib(L, TRecov); | ||
750 | if (n == 2) { /* catches fail as default */ | ||
751 | setlabel(treelabelset(tree), LFAIL); | ||
752 | } else { | ||
753 | int i; | ||
754 | for (i = 3; i <= n; i++) { | ||
755 | int d = luaL_checkinteger(L, i); | ||
756 | luaL_argcheck(L, d >= 0 && d < MAXLABELS, i, "the number of a label must be between 0 and 255"); | ||
757 | setlabel(treelabelset(tree), (byte)d); | ||
758 | } | ||
759 | } | ||
760 | return 1; | ||
761 | } | ||
762 | |||
745 | /* labeled failure end */ | 763 | /* labeled failure end */ |
746 | 764 | ||
747 | 765 | ||
@@ -1325,6 +1343,7 @@ static struct luaL_Reg pattreg[] = { | |||
1325 | {"type", lp_type}, | 1343 | {"type", lp_type}, |
1326 | {"T", lp_throw}, /* labeled failure throw */ | 1344 | {"T", lp_throw}, /* labeled failure throw */ |
1327 | {"Lc", lp_labchoice}, /* labeled failure choice */ | 1345 | {"Lc", lp_labchoice}, /* labeled failure choice */ |
1346 | {"Rec", lp_recovery}, /* labeled failure choice */ | ||
1328 | {NULL, NULL} | 1347 | {NULL, NULL} |
1329 | }; | 1348 | }; |
1330 | 1349 | ||
@@ -25,7 +25,7 @@ typedef enum TTag { | |||
25 | TBehind, /* match behind */ | 25 | TBehind, /* match behind */ |
26 | TCapture, /* regular capture */ | 26 | TCapture, /* regular capture */ |
27 | TRunTime, /* run-time capture */ | 27 | TRunTime, /* run-time capture */ |
28 | TThrow, TLabChoice /* labeled failure */ | 28 | TThrow, TLabChoice, TRecov /* labeled failure */ |
29 | } TTag; | 29 | } TTag; |
30 | 30 | ||
31 | /* number of siblings for each tree */ | 31 | /* number of siblings for each tree */ |
@@ -164,7 +164,7 @@ const char *match (lua_State *L, const char *o, const char *s, const char *e, | |||
164 | const Instruction *p = op; /* current instruction */ | 164 | const Instruction *p = op; /* current instruction */ |
165 | Labelset lsfail; | 165 | Labelset lsfail; |
166 | setlabelfail(&lsfail); | 166 | setlabelfail(&lsfail); |
167 | stack->p = &giveup; stack->s = s; stack->caplevel = 0; stack++; | 167 | stack->p = &giveup; stack->s = s; stack->ls = &lsfail; stack->caplevel = 0; stack++; /* labeled failure */ |
168 | lua_pushlightuserdata(L, stackbase); | 168 | lua_pushlightuserdata(L, stackbase); |
169 | for (;;) { | 169 | for (;;) { |
170 | #if defined(DEBUG) | 170 | #if defined(DEBUG) |
@@ -280,17 +280,31 @@ const char *match (lua_State *L, const char *o, const char *s, const char *e, | |||
280 | p += (CHARSETINSTSIZE - 1) + 2; | 280 | p += (CHARSETINSTSIZE - 1) + 2; |
281 | continue; | 281 | continue; |
282 | } | 282 | } |
283 | case IRecov: { /* labeled failure */ | ||
284 | if (stack == stacklimit) | ||
285 | stack = doublestack(L, &stacklimit, ptop); | ||
286 | stack->p = p + getoffset(p); | ||
287 | stack->s = NULL; | ||
288 | stack->ls = (const Labelset *) ((p + 2)->buff); | ||
289 | stack->caplevel = captop; | ||
290 | stack++; | ||
291 | p += (CHARSETINSTSIZE - 1) + 2; | ||
292 | continue; | ||
293 | } | ||
294 | |||
283 | case ICall: { | 295 | case ICall: { |
284 | if (stack == stacklimit) | 296 | if (stack == stacklimit) |
285 | stack = doublestack(L, &stacklimit, ptop); | 297 | stack = doublestack(L, &stacklimit, ptop); |
286 | stack->s = NULL; | 298 | stack->s = NULL; |
287 | stack->p = p + 2; /* save return address */ | 299 | stack->p = p + 2; /* save return address */ |
300 | stack->ls = NULL; | ||
288 | stack++; | 301 | stack++; |
289 | p += getoffset(p); | 302 | p += getoffset(p); |
290 | continue; | 303 | continue; |
291 | } | 304 | } |
292 | case ICommit: { | 305 | case ICommit: { |
293 | assert(stack > getstackbase(L, ptop) && (stack - 1)->s != NULL); | 306 | assert(stack > getstackbase(L, ptop) && (stack - 1)->ls != NULL); /* labeled failure */ |
307 | /* assert((stack - 1)->s != NULL); labeled failure: IRecov does not push s onto the stack */ | ||
294 | stack--; | 308 | stack--; |
295 | p += getoffset(p); | 309 | p += getoffset(p); |
296 | continue; | 310 | continue; |
@@ -322,10 +336,14 @@ const char *match (lua_State *L, const char *o, const char *s, const char *e, | |||
322 | *labelf = LFAIL; /* labeled failure */ | 336 | *labelf = LFAIL; /* labeled failure */ |
323 | *sfail = s; | 337 | *sfail = s; |
324 | fail: { /* pattern failed: try to backtrack */ | 338 | fail: { /* pattern failed: try to backtrack */ |
339 | const Labelset *auxlab = NULL; | ||
325 | do { /* remove pending calls */ | 340 | do { /* remove pending calls */ |
326 | assert(stack > getstackbase(L, ptop)); | 341 | assert(stack > getstackbase(L, ptop)); |
327 | s = (--stack)->s; | 342 | auxlab = (--stack)->ls; |
328 | } while (s == NULL || (stack->p != &giveup && !testlabel(stack->ls->cs, *labelf))); | 343 | } while (auxlab == NULL || (stack->p != &giveup && !testlabel(stack->ls->cs, *labelf))); |
344 | if (stack->p == &giveup || stack->s != NULL) { /* labeled failure */ | ||
345 | s = stack->s; | ||
346 | } | ||
329 | if (ndyncap > 0) /* is there matchtime captures? */ | 347 | if (ndyncap > 0) /* is there matchtime captures? */ |
330 | ndyncap -= removedyncap(L, capture, stack->caplevel, captop); | 348 | ndyncap -= removedyncap(L, capture, stack->caplevel, captop); |
331 | captop = stack->caplevel; | 349 | captop = stack->caplevel; |
@@ -35,7 +35,8 @@ typedef enum Opcode { | |||
35 | ICloseCapture, | 35 | ICloseCapture, |
36 | ICloseRunTime, | 36 | ICloseRunTime, |
37 | IThrow, /* "fails" with a specific label labeled failure */ | 37 | IThrow, /* "fails" with a specific label labeled failure */ |
38 | ILabChoice /* labeled choice */ | 38 | ILabChoice, /* labeled choice */ |
39 | IRecov /* stack a recovery; next fail with label 'f' will jump to 'offset' */ | ||
39 | } Opcode; | 40 | } Opcode; |
40 | 41 | ||
41 | 42 | ||
diff --git a/testlabel.lua b/testlabel.lua index 4f0768d..6ae184f 100644 --- a/testlabel.lua +++ b/testlabel.lua | |||
@@ -2,6 +2,15 @@ local m = require 'lpeglabel' | |||
2 | 2 | ||
3 | local p, r, l, s, serror | 3 | local p, r, l, s, serror |
4 | 4 | ||
5 | local function checkeqlab (x, ...) | ||
6 | y = { ... } | ||
7 | assert(type(x) == "table") | ||
8 | assert(#x == #y) | ||
9 | for i = 1, 3 do | ||
10 | assert(x[i] == y[i]) | ||
11 | end | ||
12 | end | ||
13 | |||
5 | -- throws a label | 14 | -- throws a label |
6 | p = m.T(1) | 15 | p = m.T(1) |
7 | s = "abc" | 16 | s = "abc" |
@@ -538,4 +547,31 @@ A := a;]] | |||
538 | assert(g:match(s) == terror['undefined']) | 547 | assert(g:match(s) == terror['undefined']) |
539 | 548 | ||
540 | 549 | ||
550 | print("+") | ||
551 | |||
552 | |||
553 | -- test recovery operator | ||
554 | p = m.Rec("a", "b") | ||
555 | assert(p:match("a") == 2) | ||
556 | assert(p:match("b") == 2) | ||
557 | checkeqlab({nil, 0, "c"}, p:match("c")) | ||
558 | |||
559 | p = m.Rec("a", "b", 3) | ||
560 | assert(p:match("a") == 2) | ||
561 | checkeqlab({nil, 0, "b"}, p:match("b")) | ||
562 | checkeqlab({nil, 0, "c"}, p:match("c")) | ||
563 | |||
564 | p = m.Rec(m.T(3), "b") | ||
565 | checkeqlab({nil, 3, "a"}, p:match("a")) | ||
566 | checkeqlab({nil, 3, "b"}, p:match("b")) | ||
567 | |||
568 | p = m.Rec(m.T(3), "b", 3) | ||
569 | p:pcode() | ||
570 | checkeqlab({nil, 0, "a"}, p:match("a")) | ||
571 | assert(p:match("b") == 2) | ||
572 | |||
573 | |||
541 | print("OK") | 574 | print("OK") |
575 | |||
576 | |||
577 | |||