1*16b8cff5SYuri PankovNOTE implicit vs. explicit repetitions : 2009-02-02 2*16b8cff5SYuri Pankov 3*16b8cff5SYuri Pankov# Glenn Fowler <glenn.s.fowler@gmail.com> 4*16b8cff5SYuri Pankov# conforming matches (column 4) must match one of the following BREs 5*16b8cff5SYuri Pankov# NOMATCH 6*16b8cff5SYuri Pankov# (0,.)\((\(.\),\(.\))(?,?)(\2,\3)\)* 7*16b8cff5SYuri Pankov# (0,.)\((\(.\),\(.\))(\2,\3)(?,?)\)* 8*16b8cff5SYuri Pankov# i.e., each 3-tuple has two identical elements and one (?,?) 9*16b8cff5SYuri Pankov 10*16b8cff5SYuri PankovE ((..)|(.)) NULL NOMATCH 11*16b8cff5SYuri PankovE ((..)|(.))((..)|(.)) NULL NOMATCH 12*16b8cff5SYuri PankovE ((..)|(.))((..)|(.))((..)|(.)) NULL NOMATCH 13*16b8cff5SYuri Pankov 14*16b8cff5SYuri PankovE ((..)|(.)){1} NULL NOMATCH 15*16b8cff5SYuri PankovE ((..)|(.)){2} NULL NOMATCH 16*16b8cff5SYuri PankovE ((..)|(.)){3} NULL NOMATCH 17*16b8cff5SYuri Pankov 18*16b8cff5SYuri PankovE ((..)|(.))* NULL (0,0) 19*16b8cff5SYuri Pankov 20*16b8cff5SYuri PankovE ((..)|(.)) a (0,1)(0,1)(?,?)(0,1) 21*16b8cff5SYuri PankovE ((..)|(.))((..)|(.)) a NOMATCH 22*16b8cff5SYuri PankovE ((..)|(.))((..)|(.))((..)|(.)) a NOMATCH 23*16b8cff5SYuri Pankov 24*16b8cff5SYuri PankovE ((..)|(.)){1} a (0,1)(0,1)(?,?)(0,1) 25*16b8cff5SYuri PankovE ((..)|(.)){2} a NOMATCH 26*16b8cff5SYuri PankovE ((..)|(.)){3} a NOMATCH 27*16b8cff5SYuri Pankov 28*16b8cff5SYuri PankovE ((..)|(.))* a (0,1)(0,1)(?,?)(0,1) 29*16b8cff5SYuri Pankov 30*16b8cff5SYuri PankovE ((..)|(.)) aa (0,2)(0,2)(0,2)(?,?) 31*16b8cff5SYuri PankovE ((..)|(.))((..)|(.)) aa (0,2)(0,1)(?,?)(0,1)(1,2)(?,?)(1,2) 32*16b8cff5SYuri PankovE ((..)|(.))((..)|(.))((..)|(.)) aa NOMATCH 33*16b8cff5SYuri Pankov 34*16b8cff5SYuri PankovE ((..)|(.)){1} aa (0,2)(0,2)(0,2)(?,?) 35*16b8cff5SYuri PankovE ((..)|(.)){2} aa (0,2)(1,2)(?,?)(1,2) 36*16b8cff5SYuri PankovE ((..)|(.)){3} aa NOMATCH 37*16b8cff5SYuri Pankov 38*16b8cff5SYuri PankovE ((..)|(.))* aa (0,2)(0,2)(0,2)(?,?) 39*16b8cff5SYuri Pankov 40*16b8cff5SYuri PankovE ((..)|(.)) aaa (0,2)(0,2)(0,2)(?,?) 41*16b8cff5SYuri PankovE ((..)|(.))((..)|(.)) aaa (0,3)(0,2)(0,2)(?,?)(2,3)(?,?)(2,3) 42*16b8cff5SYuri PankovE ((..)|(.))((..)|(.))((..)|(.)) aaa (0,3)(0,1)(?,?)(0,1)(1,2)(?,?)(1,2)(2,3)(?,?)(2,3) 43*16b8cff5SYuri Pankov 44*16b8cff5SYuri PankovE ((..)|(.)){1} aaa (0,2)(0,2)(0,2)(?,?) 45*16b8cff5SYuri PankovE ((..)|(.)){2} aaa (0,3)(2,3)(?,?)(2,3) 46*16b8cff5SYuri PankovE ((..)|(.)){3} aaa (0,3)(2,3)(?,?)(2,3) 47*16b8cff5SYuri Pankov 48*16b8cff5SYuri PankovE ((..)|(.))* aaa (0,3)(2,3)(?,?)(2,3) 49*16b8cff5SYuri Pankov 50*16b8cff5SYuri PankovE ((..)|(.)) aaaa (0,2)(0,2)(0,2)(?,?) 51*16b8cff5SYuri PankovE ((..)|(.))((..)|(.)) aaaa (0,4)(0,2)(0,2)(?,?)(2,4)(2,4)(?,?) 52*16b8cff5SYuri PankovE ((..)|(.))((..)|(.))((..)|(.)) aaaa (0,4)(0,2)(0,2)(?,?)(2,3)(?,?)(2,3)(3,4)(?,?)(3,4) 53*16b8cff5SYuri Pankov 54*16b8cff5SYuri PankovE ((..)|(.)){1} aaaa (0,2)(0,2)(0,2)(?,?) 55*16b8cff5SYuri PankovE ((..)|(.)){2} aaaa (0,4)(2,4)(2,4)(?,?) 56*16b8cff5SYuri PankovE ((..)|(.)){3} aaaa (0,4)(3,4)(?,?)(3,4) 57*16b8cff5SYuri Pankov 58*16b8cff5SYuri PankovE ((..)|(.))* aaaa (0,4)(2,4)(2,4)(?,?) 59*16b8cff5SYuri Pankov 60*16b8cff5SYuri PankovE ((..)|(.)) aaaaa (0,2)(0,2)(0,2)(?,?) 61*16b8cff5SYuri PankovE ((..)|(.))((..)|(.)) aaaaa (0,4)(0,2)(0,2)(?,?)(2,4)(2,4)(?,?) 62*16b8cff5SYuri PankovE ((..)|(.))((..)|(.))((..)|(.)) aaaaa (0,5)(0,2)(0,2)(?,?)(2,4)(2,4)(?,?)(4,5)(?,?)(4,5) 63*16b8cff5SYuri Pankov 64*16b8cff5SYuri PankovE ((..)|(.)){1} aaaaa (0,2)(0,2)(0,2)(?,?) 65*16b8cff5SYuri PankovE ((..)|(.)){2} aaaaa (0,4)(2,4)(2,4)(?,?) 66*16b8cff5SYuri PankovE ((..)|(.)){3} aaaaa (0,5)(4,5)(?,?)(4,5) 67*16b8cff5SYuri Pankov 68*16b8cff5SYuri PankovE ((..)|(.))* aaaaa (0,5)(4,5)(?,?)(4,5) 69*16b8cff5SYuri Pankov 70*16b8cff5SYuri PankovE ((..)|(.)) aaaaaa (0,2)(0,2)(0,2)(?,?) 71*16b8cff5SYuri PankovE ((..)|(.))((..)|(.)) aaaaaa (0,4)(0,2)(0,2)(?,?)(2,4)(2,4)(?,?) 72*16b8cff5SYuri PankovE ((..)|(.))((..)|(.))((..)|(.)) aaaaaa (0,6)(0,2)(0,2)(?,?)(2,4)(2,4)(?,?)(4,6)(4,6)(?,?) 73*16b8cff5SYuri Pankov 74*16b8cff5SYuri PankovE ((..)|(.)){1} aaaaaa (0,2)(0,2)(0,2)(?,?) 75*16b8cff5SYuri PankovE ((..)|(.)){2} aaaaaa (0,4)(2,4)(2,4)(?,?) 76*16b8cff5SYuri PankovE ((..)|(.)){3} aaaaaa (0,6)(4,6)(4,6)(?,?) 77*16b8cff5SYuri Pankov 78*16b8cff5SYuri PankovE ((..)|(.))* aaaaaa (0,6)(4,6)(4,6)(?,?) 79*16b8cff5SYuri Pankov 80*16b8cff5SYuri PankovNOTE additional repetition tests graciously provided by Chris Kuklewicz www.haskell.org 2009-02-02 81*16b8cff5SYuri Pankov 82*16b8cff5SYuri Pankov# These test a bug in OS X / FreeBSD / NetBSD, and libtree. 83*16b8cff5SYuri Pankov# Linux/GLIBC gets the {8,} and {8,8} wrong. 84*16b8cff5SYuri Pankov 85*16b8cff5SYuri Pankov:HA#100:E X(.?){0,}Y X1234567Y (0,9)(7,8) 86*16b8cff5SYuri Pankov:HA#101:E X(.?){1,}Y X1234567Y (0,9)(7,8) 87*16b8cff5SYuri Pankov:HA#102:E X(.?){2,}Y X1234567Y (0,9)(7,8) 88*16b8cff5SYuri Pankov:HA#103:E X(.?){3,}Y X1234567Y (0,9)(7,8) 89*16b8cff5SYuri Pankov:HA#104:E X(.?){4,}Y X1234567Y (0,9)(7,8) 90*16b8cff5SYuri Pankov:HA#105:E X(.?){5,}Y X1234567Y (0,9)(7,8) 91*16b8cff5SYuri Pankov:HA#106:E X(.?){6,}Y X1234567Y (0,9)(7,8) 92*16b8cff5SYuri Pankov:HA#107:E X(.?){7,}Y X1234567Y (0,9)(7,8) 93*16b8cff5SYuri Pankov:HA#108:E X(.?){8,}Y X1234567Y (0,9)(8,8) 94*16b8cff5SYuri Pankov:HA#110:E X(.?){0,8}Y X1234567Y (0,9)(7,8) 95*16b8cff5SYuri Pankov:HA#111:E X(.?){1,8}Y X1234567Y (0,9)(7,8) 96*16b8cff5SYuri Pankov:HA#112:E X(.?){2,8}Y X1234567Y (0,9)(7,8) 97*16b8cff5SYuri Pankov:HA#113:E X(.?){3,8}Y X1234567Y (0,9)(7,8) 98*16b8cff5SYuri Pankov:HA#114:E X(.?){4,8}Y X1234567Y (0,9)(7,8) 99*16b8cff5SYuri Pankov:HA#115:E X(.?){5,8}Y X1234567Y (0,9)(7,8) 100*16b8cff5SYuri Pankov:HA#116:E X(.?){6,8}Y X1234567Y (0,9)(7,8) 101*16b8cff5SYuri Pankov:HA#117:E X(.?){7,8}Y X1234567Y (0,9)(7,8) 102*16b8cff5SYuri Pankov:HA#118:E X(.?){8,8}Y X1234567Y (0,9)(8,8) 103*16b8cff5SYuri Pankov 104*16b8cff5SYuri Pankov# These test a fixed bug in my regex-tdfa that did not keep the expanded 105*16b8cff5SYuri Pankov# form properly grouped, so right association did the wrong thing with 106*16b8cff5SYuri Pankov# these ambiguous patterns (crafted just to test my code when I became 107*16b8cff5SYuri Pankov# suspicious of my implementation). The first subexpression should use 108*16b8cff5SYuri Pankov# "ab" then "a" then "bcd". 109*16b8cff5SYuri Pankov 110*16b8cff5SYuri Pankov# OS X / FreeBSD / NetBSD badly fail many of these, with impossible 111*16b8cff5SYuri Pankov# results like (0,6)(4,5)(6,6). 112*16b8cff5SYuri Pankov 113*16b8cff5SYuri Pankov:HA#260:E (a|ab|c|bcd){0,}(d*) ababcd (0,6)(3,6)(6,6) 114*16b8cff5SYuri Pankov:HA#261:E (a|ab|c|bcd){1,}(d*) ababcd (0,6)(3,6)(6,6) 115*16b8cff5SYuri Pankov:HA#262:E (a|ab|c|bcd){2,}(d*) ababcd (0,6)(3,6)(6,6) 116*16b8cff5SYuri Pankov:HA#263:E (a|ab|c|bcd){3,}(d*) ababcd (0,6)(3,6)(6,6) 117*16b8cff5SYuri Pankov:HA#264:E (a|ab|c|bcd){4,}(d*) ababcd NOMATCH 118*16b8cff5SYuri Pankov:HA#265:E (a|ab|c|bcd){0,10}(d*) ababcd (0,6)(3,6)(6,6) 119*16b8cff5SYuri Pankov:HA#266:E (a|ab|c|bcd){1,10}(d*) ababcd (0,6)(3,6)(6,6) 120*16b8cff5SYuri Pankov:HA#267:E (a|ab|c|bcd){2,10}(d*) ababcd (0,6)(3,6)(6,6) 121*16b8cff5SYuri Pankov:HA#268:E (a|ab|c|bcd){3,10}(d*) ababcd (0,6)(3,6)(6,6) 122*16b8cff5SYuri Pankov:HA#269:E (a|ab|c|bcd){4,10}(d*) ababcd NOMATCH 123*16b8cff5SYuri Pankov:HA#270:E (a|ab|c|bcd)*(d*) ababcd (0,6)(3,6)(6,6) 124*16b8cff5SYuri Pankov:HA#271:E (a|ab|c|bcd)+(d*) ababcd (0,6)(3,6)(6,6) 125*16b8cff5SYuri Pankov 126*16b8cff5SYuri Pankov# The above worked on Linux/GLIBC but the following often fail. 127*16b8cff5SYuri Pankov# They also trip up OS X / FreeBSD / NetBSD: 128*16b8cff5SYuri Pankov 129*16b8cff5SYuri Pankov:HA#280:E (ab|a|c|bcd){0,}(d*) ababcd (0,6)(3,6)(6,6) 130*16b8cff5SYuri Pankov:HA#281:E (ab|a|c|bcd){1,}(d*) ababcd (0,6)(3,6)(6,6) 131*16b8cff5SYuri Pankov:HA#282:E (ab|a|c|bcd){2,}(d*) ababcd (0,6)(3,6)(6,6) 132*16b8cff5SYuri Pankov:HA#283:E (ab|a|c|bcd){3,}(d*) ababcd (0,6)(3,6)(6,6) 133*16b8cff5SYuri Pankov:HA#284:E (ab|a|c|bcd){4,}(d*) ababcd NOMATCH 134*16b8cff5SYuri Pankov:HA#285:E (ab|a|c|bcd){0,10}(d*) ababcd (0,6)(3,6)(6,6) 135*16b8cff5SYuri Pankov:HA#286:E (ab|a|c|bcd){1,10}(d*) ababcd (0,6)(3,6)(6,6) 136*16b8cff5SYuri Pankov:HA#287:E (ab|a|c|bcd){2,10}(d*) ababcd (0,6)(3,6)(6,6) 137*16b8cff5SYuri Pankov:HA#288:E (ab|a|c|bcd){3,10}(d*) ababcd (0,6)(3,6)(6,6) 138*16b8cff5SYuri Pankov:HA#289:E (ab|a|c|bcd){4,10}(d*) ababcd NOMATCH 139*16b8cff5SYuri Pankov:HA#290:E (ab|a|c|bcd)*(d*) ababcd (0,6)(3,6)(6,6) 140*16b8cff5SYuri Pankov:HA#291:E (ab|a|c|bcd)+(d*) ababcd (0,6)(3,6)(6,6) 141