aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--lpcode.c43
-rw-r--r--lpprint.c8
-rw-r--r--lptree.c27
-rw-r--r--lptree.h2
-rw-r--r--lpvm.c26
-rw-r--r--lpvm.h3
-rw-r--r--testlabel.lua36
7 files changed, 123 insertions, 22 deletions
diff --git a/lpcode.c b/lpcode.c
index 50e6764..2987cfc 100644
--- a/lpcode.c
+++ b/lpcode.c
@@ -196,8 +196,8 @@ int checkaux (TTree *tree, int pred) {
196 if (checkaux(sib2(tree), pred)) return 1; 196 if (checkaux(sib2(tree), pred)) return 1;
197 /* else return checkaux(sib1(tree), pred); */ 197 /* else return checkaux(sib1(tree), pred); */
198 tree = sib1(tree); goto tailcall; 198 tree = sib1(tree); goto tailcall;
199 case TLabChoice: /* labeled failure */ 199 case TLabChoice: case TRecov: /* labeled failure */
200 /* in a labeled ordered choice we do not know whether sib2 will be evaluated */ 200 /* we do not know whether sib2 will be evaluated */
201 tree = sib1(tree); goto tailcall; 201 tree = sib1(tree); goto tailcall;
202 case TCapture: case TGrammar: case TRule: 202 case TCapture: case TGrammar: case TRule:
203 /* return checkaux(sib1(tree), pred); */ 203 /* return checkaux(sib1(tree), pred); */
@@ -231,7 +231,7 @@ int fixedlenx (TTree *tree, int count, int len) {
231 return -1; /* may be a loop */ 231 return -1; /* may be a loop */
232 /* else return fixedlenx(sib2(tree), count); */ 232 /* else return fixedlenx(sib2(tree), count); */
233 tree = sib2(tree); goto tailcall; 233 tree = sib2(tree); goto tailcall;
234 case TSeq: { 234 case TSeq: case TRecov: { /* labeled failure */
235 len = fixedlenx(sib1(tree), count, len); 235 len = fixedlenx(sib1(tree), count, len);
236 if (len < 0) return -1; 236 if (len < 0) return -1;
237 /* else return fixedlenx(sib2(tree), count, len); */ 237 /* else return fixedlenx(sib2(tree), count, len); */
@@ -294,6 +294,12 @@ static int getfirst (TTree *tree, const Charset *follow, Charset *firstset) {
294 loopset(i, firstset->cs[i] |= csaux.cs[i]); 294 loopset(i, firstset->cs[i] |= csaux.cs[i]);
295 return e1 | e2; 295 return e1 | e2;
296 } 296 }
297 case TRecov: { /* labeled failure */
298 /* when p1 is not nullable, p2 has nothing to contribute;
299 and when p1 is nullable, then p2 will not match
300 return getfirst(sib1(tree), fullset, firstset); */
301 tree = sib1(tree); follow = fullset; goto tailcall;
302 }
297 case TSeq: { 303 case TSeq: {
298 if (!nullable(sib1(tree))) { 304 if (!nullable(sib1(tree))) {
299 /* when p1 is not nullable, p2 has nothing to contribute; 305 /* when p1 is not nullable, p2 has nothing to contribute;
@@ -372,7 +378,7 @@ static int headfail (TTree *tree) {
372 if (!nofail(sib2(tree))) return 0; 378 if (!nofail(sib2(tree))) return 0;
373 /* else return headfail(sib1(tree)); */ 379 /* else return headfail(sib1(tree)); */
374 tree = sib1(tree); goto tailcall; 380 tree = sib1(tree); goto tailcall;
375 case TChoice: case TLabChoice: /* labeled failure */ 381 case TChoice: case TLabChoice: case TRecov: /* labeled failure */
376 if (!headfail(sib1(tree))) return 0; 382 if (!headfail(sib1(tree))) return 0;
377 /* else return headfail(sib2(tree)); */ 383 /* else return headfail(sib2(tree)); */
378 tree = sib2(tree); goto tailcall; 384 tree = sib2(tree); goto tailcall;
@@ -392,7 +398,7 @@ static int needfollow (TTree *tree) {
392 case TChar: case TSet: case TAny: 398 case TChar: case TSet: case TAny:
393 case TFalse: case TTrue: case TAnd: case TNot: 399 case TFalse: case TTrue: case TAnd: case TNot:
394 case TRunTime: case TGrammar: case TCall: case TBehind: 400 case TRunTime: case TGrammar: case TCall: case TBehind:
395 case TThrow: case TLabChoice: /* (?)labeled failure */ 401 case TThrow: case TLabChoice: case TRecov: /* (?)labeled failure */
396 return 0; 402 return 0;
397 case TChoice: case TRep: 403 case TChoice: case TRep:
398 return 1; 404 return 1;
@@ -427,7 +433,7 @@ int sizei (const Instruction *i) {
427 return 2; 433 return 2;
428 case IThrow: /* labeled failure */ 434 case IThrow: /* labeled failure */
429 return 1; 435 return 1;
430 case ILabChoice: 436 case ILabChoice: case IRecov:
431 return (CHARSETINSTSIZE - 1) + 2; /* labeled failure */ 437 return (CHARSETINSTSIZE - 1) + 2; /* labeled failure */
432 default: return 1; 438 default: return 1;
433 } 439 }
@@ -492,7 +498,8 @@ static int addinstruction (CompileState *compst, Opcode op, int aux) {
492static int addoffsetinst (CompileState *compst, Opcode op) { 498static int addoffsetinst (CompileState *compst, Opcode op) {
493 int i = addinstruction(compst, op, 0); /* instruction */ 499 int i = addinstruction(compst, op, 0); /* instruction */
494 addinstruction(compst, (Opcode)0, 0); /* open space for offset */ 500 addinstruction(compst, (Opcode)0, 0); /* open space for offset */
495 assert(op == ITestSet || sizei(&getinstr(compst, i)) == 2); 501 assert(op == ITestSet || sizei(&getinstr(compst, i)) == 2 ||
502 op == IRecov || op == ILabChoice); /* labeled failure */
496 return i; 503 return i;
497} 504}
498 505
@@ -714,6 +721,21 @@ static void codelabchoice (CompileState *compst, TTree *p1, TTree *p2, int opt,
714 codegen(compst, p2, opt, NOINST, fl); 721 codegen(compst, p2, opt, NOINST, fl);
715 jumptohere(compst, pcommit); 722 jumptohere(compst, pcommit);
716} 723}
724
725static void coderecovery (CompileState *compst, TTree *p1, TTree *p2, int opt,
726 const Charset *fl, const byte *cs) {
727 int emptyp2 = (p2->tag == TTrue);
728 int pcommit;
729 int test = NOINST;
730 int precovery = addoffsetinst(compst, IRecov);
731 addcharset(compst, cs);
732 codegen(compst, p1, emptyp2, test, fullset);
733 pcommit = addoffsetinst(compst, ICommit);
734 jumptohere(compst, precovery);
735 jumptohere(compst, test);
736 codegen(compst, p2, opt, NOINST, fl);
737 jumptohere(compst, pcommit);
738}
717/* labeled failure end */ 739/* labeled failure end */
718 740
719 741
@@ -951,6 +973,10 @@ static void codegen (CompileState *compst, TTree *tree, int opt, int tt,
951 codelabchoice(compst, sib1(tree), sib2(tree), opt, fl, treelabelset(tree)); 973 codelabchoice(compst, sib1(tree), sib2(tree), opt, fl, treelabelset(tree));
952 break; 974 break;
953 } 975 }
976 case TRecov: { /* labeled failure */
977 coderecovery(compst, sib1(tree), sib2(tree), opt, fl, treelabelset(tree));
978 break;
979 }
954 default: assert(0); 980 default: assert(0);
955 } 981 }
956} 982}
@@ -972,7 +998,8 @@ static void peephole (CompileState *compst) {
972 redo: 998 redo:
973 switch (code[i].i.code) { 999 switch (code[i].i.code) {
974 case IChoice: case ICall: case ICommit: case IPartialCommit: 1000 case IChoice: case ICall: case ICommit: case IPartialCommit:
975 case IBackCommit: case ITestChar: case ITestSet: case ILabChoice: /* labeled failure */ 1001 case IBackCommit: case ITestChar: case ITestSet:
1002 case ILabChoice: case IRecov: /* labeled failure */
976 case ITestAny: { /* instructions with labels */ 1003 case ITestAny: { /* instructions with labels */
977 jumptothere(compst, i, finallabel(code, i)); /* optimize label */ 1004 jumptothere(compst, i, finallabel(code, i)); /* optimize label */
978 break; 1005 break;
diff --git a/lpprint.c b/lpprint.c
index 0ca0b0e..122d2e5 100644
--- a/lpprint.c
+++ b/lpprint.c
@@ -61,7 +61,7 @@ void printinst (const Instruction *op, const Instruction *p) {
61 "choice", "jmp", "call", "open_call", 61 "choice", "jmp", "call", "open_call",
62 "commit", "partial_commit", "back_commit", "failtwice", "fail", "giveup", 62 "commit", "partial_commit", "back_commit", "failtwice", "fail", "giveup",
63 "fullcapture", "opencapture", "closecapture", "closeruntime", 63 "fullcapture", "opencapture", "closecapture", "closeruntime",
64 "throw", "labeled_choice" /* labeled failure */ 64 "throw", "labeled_choice", "recovery" /* labeled failure */
65 }; 65 };
66 printf("%02ld: %s ", (long)(p - op), names[p->i.code]); 66 printf("%02ld: %s ", (long)(p - op), names[p->i.code]);
67 switch ((Opcode)p->i.code) { 67 switch ((Opcode)p->i.code) {
@@ -112,7 +112,7 @@ void printinst (const Instruction *op, const Instruction *p) {
112 printf("%d", p->i.aux); 112 printf("%d", p->i.aux);
113 break; 113 break;
114 } 114 }
115 case ILabChoice: { /* labeled failure */ 115 case ILabChoice: case IRecov: { /* labeled failure */
116 printjmp(op, p); 116 printjmp(op, p);
117 printcharset((p+2)->buff); 117 printcharset((p+2)->buff);
118 break; 118 break;
@@ -165,7 +165,7 @@ static const char *tagnames[] = {
165 "call", "opencall", "rule", "grammar", 165 "call", "opencall", "rule", "grammar",
166 "behind", 166 "behind",
167 "capture", "run-time", 167 "capture", "run-time",
168 "throw", "labeled-choice" /* labeled failure */ 168 "throw", "labeled-choice", "recov" /* labeled failure */
169}; 169};
170 170
171 171
@@ -223,7 +223,7 @@ void printtree (TTree *tree, int ident) {
223 default: { 223 default: {
224 int sibs = numsiblings[tree->tag]; 224 int sibs = numsiblings[tree->tag];
225 printf("\n"); 225 printf("\n");
226 if (tree->tag == TLabChoice) { /* labeled failure */ 226 if (tree->tag == TLabChoice || tree->tag == TRecov) { /* labeled failure */
227 printcharset(treelabelset(tree)); 227 printcharset(treelabelset(tree));
228 printf("\n"); 228 printf("\n");
229 } 229 }
diff --git a/lptree.c b/lptree.c
index 6d0f78c..c59f443 100644
--- a/lptree.c
+++ b/lptree.c
@@ -28,7 +28,7 @@ const byte numsiblings[] = {
28 0, 0, 2, 1, /* call, opencall, rule, grammar */ 28 0, 0, 2, 1, /* call, opencall, rule, grammar */
29 1, /* behind */ 29 1, /* behind */
30 1, 1, /* capture, runtime capture */ 30 1, 1, /* capture, runtime capture */
31 0, 2 /* labeled failure throw, labeled choice */ 31 0, 2, 2 /* labeled failure throw, labeled choice, recovery */
32}; 32};
33 33
34 34
@@ -525,12 +525,12 @@ static TTree *newthrowleaf (lua_State *L, int lab) {
525 return tree; 525 return tree;
526} 526}
527 527
528static TTree *newlabchoice (lua_State *L) { 528static TTree *newrootlab2sib (lua_State *L, int tag) {
529 int s1, s2; 529 int s1, s2;
530 TTree *tree1 = getpatt(L, 1, &s1); 530 TTree *tree1 = getpatt(L, 1, &s1);
531 TTree *tree2 = getpatt(L, 2, &s2); 531 TTree *tree2 = getpatt(L, 2, &s2);
532 TTree *tree = newtree(L, bytes2slots(LABELSETSIZE) + 1 + s1 + s2); /* create new tree */ 532 TTree *tree = newtree(L, bytes2slots(LABELSETSIZE) + 1 + s1 + s2); /* create new tree */
533 tree->tag = TLabChoice; 533 tree->tag = tag;
534 tree->u.s.ps = 1 + s1; 534 tree->u.s.ps = 1 + s1;
535 tree->u.s.plab = 1 + s1 + s2; 535 tree->u.s.plab = 1 + s1 + s2;
536 memcpy(sib1(tree), tree1, s1 * sizeof(TTree)); 536 memcpy(sib1(tree), tree1, s1 * sizeof(TTree));
@@ -733,7 +733,7 @@ static int lp_throw (lua_State *L) {
733*/ 733*/
734static int lp_labchoice (lua_State *L) { 734static int lp_labchoice (lua_State *L) {
735 int n = lua_gettop(L); 735 int n = lua_gettop(L);
736 TTree *tree = newlabchoice(L); 736 TTree *tree = newrootlab2sib(L, TLabChoice);
737 int i; 737 int i;
738 for (i = 3; i <= n; i++) { 738 for (i = 3; i <= n; i++) {
739 int d = luaL_checkinteger(L, i); 739 int d = luaL_checkinteger(L, i);
@@ -742,6 +742,24 @@ static int lp_labchoice (lua_State *L) {
742 } 742 }
743 return 1; 743 return 1;
744} 744}
745
746
747static int lp_recovery (lua_State *L) {
748 int n = lua_gettop(L);
749 TTree *tree = newrootlab2sib(L, TRecov);
750 if (n == 2) { /* catches fail as default */
751 setlabel(treelabelset(tree), LFAIL);
752 } else {
753 int i;
754 for (i = 3; i <= n; i++) {
755 int d = luaL_checkinteger(L, i);
756 luaL_argcheck(L, d >= 0 && d < MAXLABELS, i, "the number of a label must be between 0 and 255");
757 setlabel(treelabelset(tree), (byte)d);
758 }
759 }
760 return 1;
761}
762
745/* labeled failure end */ 763/* labeled failure end */
746 764
747 765
@@ -1325,6 +1343,7 @@ static struct luaL_Reg pattreg[] = {
1325 {"type", lp_type}, 1343 {"type", lp_type},
1326 {"T", lp_throw}, /* labeled failure throw */ 1344 {"T", lp_throw}, /* labeled failure throw */
1327 {"Lc", lp_labchoice}, /* labeled failure choice */ 1345 {"Lc", lp_labchoice}, /* labeled failure choice */
1346 {"Rec", lp_recovery}, /* labeled failure choice */
1328 {NULL, NULL} 1347 {NULL, NULL}
1329}; 1348};
1330 1349
diff --git a/lptree.h b/lptree.h
index 5ed67eb..cca346e 100644
--- a/lptree.h
+++ b/lptree.h
@@ -25,7 +25,7 @@ typedef enum TTag {
25 TBehind, /* match behind */ 25 TBehind, /* match behind */
26 TCapture, /* regular capture */ 26 TCapture, /* regular capture */
27 TRunTime, /* run-time capture */ 27 TRunTime, /* run-time capture */
28 TThrow, TLabChoice /* labeled failure */ 28 TThrow, TLabChoice, TRecov /* labeled failure */
29} TTag; 29} TTag;
30 30
31/* number of siblings for each tree */ 31/* number of siblings for each tree */
diff --git a/lpvm.c b/lpvm.c
index 4d9797c..277acf7 100644
--- a/lpvm.c
+++ b/lpvm.c
@@ -164,7 +164,7 @@ const char *match (lua_State *L, const char *o, const char *s, const char *e,
164 const Instruction *p = op; /* current instruction */ 164 const Instruction *p = op; /* current instruction */
165 Labelset lsfail; 165 Labelset lsfail;
166 setlabelfail(&lsfail); 166 setlabelfail(&lsfail);
167 stack->p = &giveup; stack->s = s; stack->caplevel = 0; stack++; 167 stack->p = &giveup; stack->s = s; stack->ls = &lsfail; stack->caplevel = 0; stack++; /* labeled failure */
168 lua_pushlightuserdata(L, stackbase); 168 lua_pushlightuserdata(L, stackbase);
169 for (;;) { 169 for (;;) {
170#if defined(DEBUG) 170#if defined(DEBUG)
@@ -280,17 +280,31 @@ const char *match (lua_State *L, const char *o, const char *s, const char *e,
280 p += (CHARSETINSTSIZE - 1) + 2; 280 p += (CHARSETINSTSIZE - 1) + 2;
281 continue; 281 continue;
282 } 282 }
283 case IRecov: { /* labeled failure */
284 if (stack == stacklimit)
285 stack = doublestack(L, &stacklimit, ptop);
286 stack->p = p + getoffset(p);
287 stack->s = NULL;
288 stack->ls = (const Labelset *) ((p + 2)->buff);
289 stack->caplevel = captop;
290 stack++;
291 p += (CHARSETINSTSIZE - 1) + 2;
292 continue;
293 }
294
283 case ICall: { 295 case ICall: {
284 if (stack == stacklimit) 296 if (stack == stacklimit)
285 stack = doublestack(L, &stacklimit, ptop); 297 stack = doublestack(L, &stacklimit, ptop);
286 stack->s = NULL; 298 stack->s = NULL;
287 stack->p = p + 2; /* save return address */ 299 stack->p = p + 2; /* save return address */
300 stack->ls = NULL;
288 stack++; 301 stack++;
289 p += getoffset(p); 302 p += getoffset(p);
290 continue; 303 continue;
291 } 304 }
292 case ICommit: { 305 case ICommit: {
293 assert(stack > getstackbase(L, ptop) && (stack - 1)->s != NULL); 306 assert(stack > getstackbase(L, ptop) && (stack - 1)->ls != NULL); /* labeled failure */
307 /* assert((stack - 1)->s != NULL); labeled failure: IRecov does not push s onto the stack */
294 stack--; 308 stack--;
295 p += getoffset(p); 309 p += getoffset(p);
296 continue; 310 continue;
@@ -322,10 +336,14 @@ const char *match (lua_State *L, const char *o, const char *s, const char *e,
322 *labelf = LFAIL; /* labeled failure */ 336 *labelf = LFAIL; /* labeled failure */
323 *sfail = s; 337 *sfail = s;
324 fail: { /* pattern failed: try to backtrack */ 338 fail: { /* pattern failed: try to backtrack */
339 const Labelset *auxlab = NULL;
325 do { /* remove pending calls */ 340 do { /* remove pending calls */
326 assert(stack > getstackbase(L, ptop)); 341 assert(stack > getstackbase(L, ptop));
327 s = (--stack)->s; 342 auxlab = (--stack)->ls;
328 } while (s == NULL || (stack->p != &giveup && !testlabel(stack->ls->cs, *labelf))); 343 } while (auxlab == NULL || (stack->p != &giveup && !testlabel(stack->ls->cs, *labelf)));
344 if (stack->p == &giveup || stack->s != NULL) { /* labeled failure */
345 s = stack->s;
346 }
329 if (ndyncap > 0) /* is there matchtime captures? */ 347 if (ndyncap > 0) /* is there matchtime captures? */
330 ndyncap -= removedyncap(L, capture, stack->caplevel, captop); 348 ndyncap -= removedyncap(L, capture, stack->caplevel, captop);
331 captop = stack->caplevel; 349 captop = stack->caplevel;
diff --git a/lpvm.h b/lpvm.h
index 4b4dda5..3c27027 100644
--- a/lpvm.h
+++ b/lpvm.h
@@ -35,7 +35,8 @@ typedef enum Opcode {
35 ICloseCapture, 35 ICloseCapture,
36 ICloseRunTime, 36 ICloseRunTime,
37 IThrow, /* "fails" with a specific label labeled failure */ 37 IThrow, /* "fails" with a specific label labeled failure */
38 ILabChoice /* labeled choice */ 38 ILabChoice, /* labeled choice */
39 IRecov /* stack a recovery; next fail with label 'f' will jump to 'offset' */
39} Opcode; 40} Opcode;
40 41
41 42
diff --git a/testlabel.lua b/testlabel.lua
index 4f0768d..6ae184f 100644
--- a/testlabel.lua
+++ b/testlabel.lua
@@ -2,6 +2,15 @@ local m = require 'lpeglabel'
2 2
3local p, r, l, s, serror 3local p, r, l, s, serror
4 4
5local function checkeqlab (x, ...)
6 y = { ... }
7 assert(type(x) == "table")
8 assert(#x == #y)
9 for i = 1, 3 do
10 assert(x[i] == y[i])
11 end
12end
13
5-- throws a label 14-- throws a label
6p = m.T(1) 15p = m.T(1)
7s = "abc" 16s = "abc"
@@ -538,4 +547,31 @@ A := a;]]
538assert(g:match(s) == terror['undefined']) 547assert(g:match(s) == terror['undefined'])
539 548
540 549
550print("+")
551
552
553-- test recovery operator
554p = m.Rec("a", "b")
555assert(p:match("a") == 2)
556assert(p:match("b") == 2)
557checkeqlab({nil, 0, "c"}, p:match("c"))
558
559p = m.Rec("a", "b", 3)
560assert(p:match("a") == 2)
561checkeqlab({nil, 0, "b"}, p:match("b"))
562checkeqlab({nil, 0, "c"}, p:match("c"))
563
564p = m.Rec(m.T(3), "b")
565checkeqlab({nil, 3, "a"}, p:match("a"))
566checkeqlab({nil, 3, "b"}, p:match("b"))
567
568p = m.Rec(m.T(3), "b", 3)
569p:pcode()
570checkeqlab({nil, 0, "a"}, p:match("a"))
571assert(p:match("b") == 2)
572
573
541print("OK") 574print("OK")
575
576
577