1#!./perl -w 2 3BEGIN { 4 chdir 't' if -d 't'; 5 @INC = '../lib'; 6} 7 8my $debug = 1; 9 10## 11## If the markers used are changed (search for "MARKER1" in regcomp.c), 12## update only these two variables, and leave the {#} in the @death/@warning 13## arrays below. The {#} is a meta-marker -- it marks where the marker should 14## go. 15 16my $marker1 = "<-- HERE"; 17my $marker2 = " <-- HERE "; 18 19## 20## Key-value pairs of code/error of code that should have fatal errors. 21## 22 23eval 'use Config'; # assume defaults if fail 24our %Config; 25my $inf_m1 = ($Config{reg_infty} || 32767) - 1; 26my $inf_p1 = $inf_m1 + 2; 27my @death = 28( 29 '/[[=foo=]]/' => 'POSIX syntax [= =] is reserved for future extensions in regex; marked by {#} in m/[[=foo=]{#}]/', 30 31 '/(?<= .*)/' => 'Variable length lookbehind not implemented in regex; marked by {#} in m/(?<= .*){#}/', 32 33 '/(?<= x{1000})/' => 'Lookbehind longer than 255 not implemented in regex; marked by {#} in m/(?<= x{1000}){#}/', 34 35 '/(?@)/' => 'Sequence (?@...) not implemented in regex; marked by {#} in m/(?@{#})/', 36 37 '/(?{ 1/' => 'Sequence (?{...}) not terminated or not {}-balanced in regex; marked by {#} in m/(?{{#} 1/', 38 39 '/(?(1x))/' => 'Switch condition not recognized in regex; marked by {#} in m/(?(1x{#}))/', 40 41 '/(?(1)x|y|z)/' => 'Switch (?(condition)... contains too many branches in regex; marked by {#} in m/(?(1)x|y|{#}z)/', 42 43 '/(?(x)y|x)/' => 'Unknown switch condition (?(x) in regex; marked by {#} in m/(?({#}x)y|x)/', 44 45 '/(?/' => 'Sequence (? incomplete in regex; marked by {#} in m/(?{#}/', 46 47 '/(?;x/' => 'Sequence (?;...) not recognized in regex; marked by {#} in m/(?;{#}x/', 48 '/(?<;x/' => 'Sequence (?<;...) not recognized in regex; marked by {#} in m/(?<;{#}x/', 49 50 '/((x)/' => 'Unmatched ( in regex; marked by {#} in m/({#}(x)/', 51 52 "/x{$inf_p1}/" => "Quantifier in {,} bigger than $inf_m1 in regex; marked by {#} in m/x{{#}$inf_p1}/", 53 54 '/x{3,1}/' => 'Can\'t do {n,m} with n > m in regex; marked by {#} in m/x{3,1}{#}/', 55 56 '/x**/' => 'Nested quantifiers in regex; marked by {#} in m/x**{#}/', 57 58 '/x[/' => 'Unmatched [ in regex; marked by {#} in m/x[{#}/', 59 60 '/*/', => 'Quantifier follows nothing in regex; marked by {#} in m/*{#}/', 61 62 '/\p{x/' => 'Missing right brace on \p{} in regex; marked by {#} in m/\p{{#}x/', 63 64 '/[\p{x]/' => 'Missing right brace on \p{} in regex; marked by {#} in m/[\p{{#}x]/', 65 66 '/(x)\2/' => 'Reference to nonexistent group in regex; marked by {#} in m/(x)\2{#}/', 67 68 'my $m = "\\\"; $m =~ $m', => 'Trailing \ in regex m/\/', 69 70 '/\x{1/' => 'Missing right brace on \x{} in regex; marked by {#} in m/\x{{#}1/', 71 72 '/[\x{X]/' => 'Missing right brace on \x{} in regex; marked by {#} in m/[\x{{#}X]/', 73 74 '/[[:barf:]]/' => 'POSIX class [:barf:] unknown in regex; marked by {#} in m/[[:barf:]{#}]/', 75 76 '/[[=barf=]]/' => 'POSIX syntax [= =] is reserved for future extensions in regex; marked by {#} in m/[[=barf=]{#}]/', 77 78 '/[[.barf.]]/' => 'POSIX syntax [. .] is reserved for future extensions in regex; marked by {#} in m/[[.barf.]{#}]/', 79 80 '/[z-a]/' => 'Invalid [] range "z-a" in regex; marked by {#} in m/[z-a{#}]/', 81 82 '/\p/' => 'Empty \p{} in regex; marked by {#} in m/\p{#}/', 83 84 '/\P{}/' => 'Empty \P{} in regex; marked by {#} in m/\P{{#}}/', 85); 86 87## 88## Key-value pairs of code/error of code that should have non-fatal warnings. 89## 90@warning = ( 91 "m/(?p{ 'a' })/" => "(?p{}) is deprecated - use (??{}) in regex; marked by {#} in m/(?p{#}{ 'a' })/", 92 93 'm/\b*/' => '\b* matches null string many times in regex; marked by {#} in m/\b*{#}/', 94 95 'm/[:blank:]/' => 'POSIX syntax [: :] belongs inside character classes in regex; marked by {#} in m/[:blank:]{#}/', 96 97 "m'[\\y]'" => 'Unrecognized escape \y in character class passed through in regex; marked by {#} in m/[\y{#}]/', 98 99 'm/[a-\d]/' => 'False [] range "a-\d" in regex; marked by {#} in m/[a-\d{#}]/', 100 'm/[\w-x]/' => 'False [] range "\w-" in regex; marked by {#} in m/[\w-{#}x]/', 101 "m'\\y'" => 'Unrecognized escape \y passed through in regex; marked by {#} in m/\y{#}/', 102); 103 104my $total = (@death + @warning)/2; 105 106# utf8 is a noop on EBCDIC platforms, it is not fatal 107my $Is_EBCDIC = (ord('A') == 193); 108if ($Is_EBCDIC) { 109 my @utf8_death = grep(/utf8/, @death); 110 $total = $total - @utf8_death; 111} 112 113print "1..$total\n"; 114 115my $count = 0; 116 117while (@death) 118{ 119 my $regex = shift @death; 120 my $result = shift @death; 121 # skip the utf8 test on EBCDIC since they do not die 122 next if ($Is_EBCDIC && $regex =~ /utf8/); 123 $count++; 124 125 $_ = "x"; 126 eval $regex; 127 if (not $@) { 128 print "# oops, $regex didn't die\nnot ok $count\n"; 129 next; 130 } 131 chomp $@; 132 $result =~ s/{\#}/$marker1/; 133 $result =~ s/{\#}/$marker2/; 134 $result .= " at "; 135 if ($@ !~ /^\Q$result/) { 136 print "# For $regex, expected:\n# $result\n# Got:\n# $@\n#\nnot "; 137 } 138 print "ok $count - $regex\n"; 139} 140 141 142our $warning; 143$SIG{__WARN__} = sub { $warning = shift }; 144 145while (@warning) 146{ 147 $count++; 148 my $regex = shift @warning; 149 my $result = shift @warning; 150 151 undef $warning; 152 $_ = "x"; 153 eval $regex; 154 155 if ($@) 156 { 157 print "# oops, $regex died with:\n#\t$@#\nnot ok $count\n"; 158 next; 159 } 160 161 if (not $warning) 162 { 163 print "# oops, $regex didn't generate a warning\nnot ok $count\n"; 164 next; 165 } 166 $result =~ s/{\#}/$marker1/; 167 $result =~ s/{\#}/$marker2/; 168 $result .= " at "; 169 if ($warning !~ /^\Q$result/) 170 { 171 print <<"EOM"; 172# For $regex, expected: 173# $result 174# Got: 175# $warning 176# 177not ok $count 178EOM 179 next; 180 } 181 print "ok $count - $regex\n"; 182} 183 184 185 186