1 1.1 christos NOTE implicit vs. explicit repetitions : 2009-02-02 2 1.1 christos 3 1.1 christos # Glenn Fowler <gsf (a] research.att.com> 4 1.1 christos # conforming matches (column 4) must match one of the following BREs 5 1.1 christos # NOMATCH 6 1.1 christos # (0,.)\((\(.\),\(.\))(?,?)(\2,\3)\)* 7 1.1 christos # (0,.)\((\(.\),\(.\))(\2,\3)(?,?)\)* 8 1.1 christos # i.e., each 3-tuple has two identical elements and one (?,?) 9 1.1 christos 10 1.1 christos E ((..)|(.)) NULL NOMATCH 11 1.1 christos E ((..)|(.))((..)|(.)) NULL NOMATCH 12 1.1 christos E ((..)|(.))((..)|(.))((..)|(.)) NULL NOMATCH 13 1.1 christos 14 1.1 christos E ((..)|(.)){1} NULL NOMATCH 15 1.1 christos E ((..)|(.)){2} NULL NOMATCH 16 1.1 christos E ((..)|(.)){3} NULL NOMATCH 17 1.1 christos 18 1.1 christos E ((..)|(.))* NULL (0,0) 19 1.1 christos 20 1.1 christos E ((..)|(.)) a (0,1)(0,1)(?,?)(0,1) 21 1.1 christos E ((..)|(.))((..)|(.)) a NOMATCH 22 1.1 christos E ((..)|(.))((..)|(.))((..)|(.)) a NOMATCH 23 1.1 christos 24 1.1 christos E ((..)|(.)){1} a (0,1)(0,1)(?,?)(0,1) 25 1.1 christos E ((..)|(.)){2} a NOMATCH 26 1.1 christos E ((..)|(.)){3} a NOMATCH 27 1.1 christos 28 1.1 christos E ((..)|(.))* a (0,1)(0,1)(?,?)(0,1) 29 1.1 christos 30 1.1 christos E ((..)|(.)) aa (0,2)(0,2)(0,2)(?,?) 31 1.1 christos E ((..)|(.))((..)|(.)) aa (0,2)(0,1)(?,?)(0,1)(1,2)(?,?)(1,2) 32 1.1 christos E ((..)|(.))((..)|(.))((..)|(.)) aa NOMATCH 33 1.1 christos 34 1.1 christos E ((..)|(.)){1} aa (0,2)(0,2)(0,2)(?,?) 35 1.1 christos E ((..)|(.)){2} aa (0,2)(1,2)(?,?)(1,2) 36 1.1 christos E ((..)|(.)){3} aa NOMATCH 37 1.1 christos 38 1.1 christos E ((..)|(.))* aa (0,2)(0,2)(0,2)(?,?) 39 1.1 christos 40 1.1 christos E ((..)|(.)) aaa (0,2)(0,2)(0,2)(?,?) 41 1.1 christos E ((..)|(.))((..)|(.)) aaa (0,3)(0,2)(0,2)(?,?)(2,3)(?,?)(2,3) 42 1.1 christos E ((..)|(.))((..)|(.))((..)|(.)) aaa (0,3)(0,1)(?,?)(0,1)(1,2)(?,?)(1,2)(2,3)(?,?)(2,3) 43 1.1 christos 44 1.1 christos E ((..)|(.)){1} aaa (0,2)(0,2)(0,2)(?,?) 45 1.1 christos E ((..)|(.)){2} aaa (0,3)(2,3)(?,?)(2,3) 46 1.1 christos E ((..)|(.)){3} aaa (0,3)(2,3)(?,?)(2,3) 47 1.1 christos 48 1.1 christos E ((..)|(.))* aaa (0,3)(2,3)(?,?)(2,3) 49 1.1 christos 50 1.1 christos E ((..)|(.)) aaaa (0,2)(0,2)(0,2)(?,?) 51 1.1 christos E ((..)|(.))((..)|(.)) aaaa (0,4)(0,2)(0,2)(?,?)(2,4)(2,4)(?,?) 52 1.1 christos E ((..)|(.))((..)|(.))((..)|(.)) aaaa (0,4)(0,2)(0,2)(?,?)(2,3)(?,?)(2,3)(3,4)(?,?)(3,4) 53 1.1 christos 54 1.1 christos E ((..)|(.)){1} aaaa (0,2)(0,2)(0,2)(?,?) 55 1.1 christos E ((..)|(.)){2} aaaa (0,4)(2,4)(2,4)(?,?) 56 1.1 christos E ((..)|(.)){3} aaaa (0,4)(3,4)(?,?)(3,4) 57 1.1 christos 58 1.1 christos E ((..)|(.))* aaaa (0,4)(2,4)(2,4)(?,?) 59 1.1 christos 60 1.1 christos E ((..)|(.)) aaaaa (0,2)(0,2)(0,2)(?,?) 61 1.1 christos E ((..)|(.))((..)|(.)) aaaaa (0,4)(0,2)(0,2)(?,?)(2,4)(2,4)(?,?) 62 1.1 christos E ((..)|(.))((..)|(.))((..)|(.)) aaaaa (0,5)(0,2)(0,2)(?,?)(2,4)(2,4)(?,?)(4,5)(?,?)(4,5) 63 1.1 christos 64 1.1 christos E ((..)|(.)){1} aaaaa (0,2)(0,2)(0,2)(?,?) 65 1.1 christos E ((..)|(.)){2} aaaaa (0,4)(2,4)(2,4)(?,?) 66 1.1 christos E ((..)|(.)){3} aaaaa (0,5)(4,5)(?,?)(4,5) 67 1.1 christos 68 1.1 christos E ((..)|(.))* aaaaa (0,5)(4,5)(?,?)(4,5) 69 1.1 christos 70 1.1 christos E ((..)|(.)) aaaaaa (0,2)(0,2)(0,2)(?,?) 71 1.1 christos E ((..)|(.))((..)|(.)) aaaaaa (0,4)(0,2)(0,2)(?,?)(2,4)(2,4)(?,?) 72 1.1 christos E ((..)|(.))((..)|(.))((..)|(.)) aaaaaa (0,6)(0,2)(0,2)(?,?)(2,4)(2,4)(?,?)(4,6)(4,6)(?,?) 73 1.1 christos 74 1.1 christos E ((..)|(.)){1} aaaaaa (0,2)(0,2)(0,2)(?,?) 75 1.1 christos E ((..)|(.)){2} aaaaaa (0,4)(2,4)(2,4)(?,?) 76 1.1 christos E ((..)|(.)){3} aaaaaa (0,6)(4,6)(4,6)(?,?) 77 1.1 christos 78 1.1 christos E ((..)|(.))* aaaaaa (0,6)(4,6)(4,6)(?,?) 79 1.1 christos 80 1.1 christos NOTE additional repetition tests graciously provided by Chris Kuklewicz www.haskell.org 2009-02-02 81 1.1 christos 82 1.1 christos # These test a bug in OS X / FreeBSD / NetBSD, and libtree. 83 1.1 christos # Linux/GLIBC gets the {8,} and {8,8} wrong. 84 1.1 christos 85 1.1 christos :HA#100:E X(.?){0,}Y X1234567Y (0,9)(7,8) 86 1.1 christos :HA#101:E X(.?){1,}Y X1234567Y (0,9)(7,8) 87 1.1 christos :HA#102:E X(.?){2,}Y X1234567Y (0,9)(7,8) 88 1.1 christos :HA#103:E X(.?){3,}Y X1234567Y (0,9)(7,8) 89 1.1 christos :HA#104:E X(.?){4,}Y X1234567Y (0,9)(7,8) 90 1.1 christos :HA#105:E X(.?){5,}Y X1234567Y (0,9)(7,8) 91 1.1 christos :HA#106:E X(.?){6,}Y X1234567Y (0,9)(7,8) 92 1.1 christos :HA#107:E X(.?){7,}Y X1234567Y (0,9)(7,8) 93 1.1 christos :HA#108:E X(.?){8,}Y X1234567Y (0,9)(8,8) 94 1.1 christos :HA#110:E X(.?){0,8}Y X1234567Y (0,9)(7,8) 95 1.1 christos :HA#111:E X(.?){1,8}Y X1234567Y (0,9)(7,8) 96 1.1 christos :HA#112:E X(.?){2,8}Y X1234567Y (0,9)(7,8) 97 1.1 christos :HA#113:E X(.?){3,8}Y X1234567Y (0,9)(7,8) 98 1.1 christos :HA#114:E X(.?){4,8}Y X1234567Y (0,9)(7,8) 99 1.1 christos :HA#115:E X(.?){5,8}Y X1234567Y (0,9)(7,8) 100 1.1 christos :HA#116:E X(.?){6,8}Y X1234567Y (0,9)(7,8) 101 1.1 christos :HA#117:E X(.?){7,8}Y X1234567Y (0,9)(7,8) 102 1.1 christos :HA#118:E X(.?){8,8}Y X1234567Y (0,9)(8,8) 103 1.1 christos 104 1.1 christos # These test a fixed bug in my regex-tdfa that did not keep the expanded 105 1.1 christos # form properly grouped, so right association did the wrong thing with 106 1.1 christos # these ambiguous patterns (crafted just to test my code when I became 107 1.1 christos # suspicious of my implementation). The first subexpression should use 108 1.1 christos # "ab" then "a" then "bcd". 109 1.1 christos 110 1.1 christos # OS X / FreeBSD / NetBSD badly fail many of these, with impossible 111 1.1 christos # results like (0,6)(4,5)(6,6). 112 1.1 christos 113 1.1 christos :HA#260:E (a|ab|c|bcd){0,}(d*) ababcd (0,6)(3,6)(6,6) 114 1.1 christos :HA#261:E (a|ab|c|bcd){1,}(d*) ababcd (0,6)(3,6)(6,6) 115 1.1 christos :HA#262:E (a|ab|c|bcd){2,}(d*) ababcd (0,6)(3,6)(6,6) 116 1.1 christos :HA#263:E (a|ab|c|bcd){3,}(d*) ababcd (0,6)(3,6)(6,6) 117 1.1 christos :HA#264:E (a|ab|c|bcd){4,}(d*) ababcd NOMATCH 118 1.1 christos :HA#265:E (a|ab|c|bcd){0,10}(d*) ababcd (0,6)(3,6)(6,6) 119 1.1 christos :HA#266:E (a|ab|c|bcd){1,10}(d*) ababcd (0,6)(3,6)(6,6) 120 1.1 christos :HA#267:E (a|ab|c|bcd){2,10}(d*) ababcd (0,6)(3,6)(6,6) 121 1.1 christos :HA#268:E (a|ab|c|bcd){3,10}(d*) ababcd (0,6)(3,6)(6,6) 122 1.1 christos :HA#269:E (a|ab|c|bcd){4,10}(d*) ababcd NOMATCH 123 1.1 christos :HA#270:E (a|ab|c|bcd)*(d*) ababcd (0,6)(3,6)(6,6) 124 1.1 christos :HA#271:E (a|ab|c|bcd)+(d*) ababcd (0,6)(3,6)(6,6) 125 1.1 christos 126 1.1 christos # The above worked on Linux/GLIBC but the following often fail. 127 1.1 christos # They also trip up OS X / FreeBSD / NetBSD: 128 1.1 christos 129 1.1 christos :HA#280:E (ab|a|c|bcd){0,}(d*) ababcd (0,6)(3,6)(6,6) 130 1.1 christos :HA#281:E (ab|a|c|bcd){1,}(d*) ababcd (0,6)(3,6)(6,6) 131 1.1 christos :HA#282:E (ab|a|c|bcd){2,}(d*) ababcd (0,6)(3,6)(6,6) 132 1.1 christos :HA#283:E (ab|a|c|bcd){3,}(d*) ababcd (0,6)(3,6)(6,6) 133 1.1 christos :HA#284:E (ab|a|c|bcd){4,}(d*) ababcd NOMATCH 134 1.1 christos :HA#285:E (ab|a|c|bcd){0,10}(d*) ababcd (0,6)(3,6)(6,6) 135 1.1 christos :HA#286:E (ab|a|c|bcd){1,10}(d*) ababcd (0,6)(3,6)(6,6) 136 1.1 christos :HA#287:E (ab|a|c|bcd){2,10}(d*) ababcd (0,6)(3,6)(6,6) 137 1.1 christos :HA#288:E (ab|a|c|bcd){3,10}(d*) ababcd (0,6)(3,6)(6,6) 138 1.1 christos :HA#289:E (ab|a|c|bcd){4,10}(d*) ababcd NOMATCH 139 1.1 christos :HA#290:E (ab|a|c|bcd)*(d*) ababcd (0,6)(3,6)(6,6) 140 1.1 christos :HA#291:E (ab|a|c|bcd)+(d*) ababcd (0,6)(3,6)(6,6) 141