#!/bin/sh

# SUSv3 compliant sed tests.
# Copyright 2005 by Rob Landley <rob@landley.net>
# Licensed under GPLv2, see file LICENSE in this source tree.

# Provides the `testing` helper used by every case below.
# NOTE(review): $ECHO, $FAILCOUNT and $SKIP_KNOWN_BUGS are presumably set up
# by testing.sh or the caller's environment -- confirm there.
. ./testing.sh

# testing "description" "commands" "result" "infile" "stdin"
#
# Cases whose command names the file `input` supply its content through the
# "infile" argument; a `-` operand (or no operand) reads the "stdin" argument.

# Corner cases
testing "sed no files (stdin)" 'sed ""' "hello\n" "" "hello\n"
testing "sed explicit stdin" 'sed "" -' "hello\n" "" "hello\n"
testing "sed handles empty lines" "sed -e 's/\$/@/'" "@\n" "" "\n"
testing "sed stdin twice" 'sed "" - -' "hello" "" "hello"

# Trailing EOF.
#   Match $, at end of each file or all files?

# -e corner cases
#   without -e
#   multiple -e
#     interact with a
#   -eee arg1 arg2 arg3
# -f corner cases
#   -e -f -e
# -n corner cases
#   no newline at EOF?
# -r corner cases
#   Just make sure it works.
# -i corner cases:
#   sed -i -
#   permissions
#   -i on a symlink
#   on a directory
#   With $ last-line test
# Continue with \
#   End of script with trailing \

# command list
testing "sed accepts blanks before command" "sed -e '1 d'" "" "" ""
testing "sed accepts newlines in -e" "sed -e 'i\
1
a\
3'" "1\n2\n3\n" "" "2\n"
testing "sed accepts multiple -e" "sed -e 'i\' -e '1' -e 'a\' -e '3'" \
  "1\n2\n3\n" "" "2\n"

# substitutions
testing "sed -n" "sed -n -e s/foo/bar/ -e s/bar/baz/" "" "" "foo\n"
testing "sed with empty match" "sed 's/z*//g'" "string\n" "" "string\n"
testing "sed s//p" "sed -e s/foo/bar/p -e s/bar/baz/p" "bar\nbaz\nbaz\n" \
  "" "foo\n"
testing "sed -n s//p" "sed -ne s/abc/def/p" "def\n" "" "abc\n"
testing "sed s//g (exhaustive)" "sed -e 's/[[:space:]]*/,/g'" ",1,2,3,4,5,\n" \
  "" "12345\n"
testing "sed s arbitrary delimiter" "sed -e 's woo boing '" "boing\n" "" "woo\n"
testing "sed s chains" "sed -e s/foo/bar/ -e s/bar/baz/" "baz\n" "" "foo\n"
testing "sed s chains2" "sed -e s/foo/bar/ -e s/baz/nee/" "bar\n" "" "foo\n"
testing "sed s [delimiter]" "sed -e 's@[@]@@'" "onetwo" "" "one@two"
testing "sed s with \\t (GNU ext)" "sed 's/\t/ /'" "one two" "" "one\ttwo"

# branch
testing "sed b (branch)" "sed -e 'b one;p;: one'" "foo\n" "" "foo\n"
testing "sed b (branch with no label jumps to end)" "sed -e 'b;p'" \
  "foo\n" "" "foo\n"

# test and branch
testing "sed t (test/branch)" "sed -e 's/a/1/;t one;p;: one;p'" \
  "1\n1\nb\nb\nb\nc\nc\nc\n" "" "a\nb\nc\n"
testing "sed t (test/branch clears test bit)" "sed -e 's/a/b/;:loop;t loop'" \
  "b\nb\nc\n" "" "a\nb\nc\n"
testing "sed T (!test/branch)" "sed -e 's/a/1/;T notone;p;: notone;p'" \
  "1\n1\n1\nb\nb\nc\nc\n" "" "a\nb\nc\n"

testing "sed n (flushes pattern space, terminates early)" "sed -e 'n;p'" \
  "a\nb\nb\nc\n" "" "a\nb\nc\n"

# non-GNU sed: N does _not_ flush pattern space, therefore c is eaten @ script end
# GNU sed: N flushes pattern space, therefore c is printed too @ script end
testing "sed N (flushes pattern space (GNU behavior))" "sed -e 'N;p'" \
  "a\nb\na\nb\nc\n" "" "a\nb\nc\n"

testing "sed N test2" "sed ':a;N;s/\n/ /;ta'" \
  "a b c\n" "" "a\nb\nc\n"

testing "sed N test3" "sed 'N;s/\n/ /'" \
  "a b\nc\n" "" "a\nb\nc\n"

testing "sed address match newline" 'sed "/b/N;/b\\nc/i woo"' \
  "a\nwoo\nb\nc\nd\n" "" "a\nb\nc\nd\n"

# Multiple lines in pattern space
testing "sed N (stops at end of input) and P (prints to first newline only)" \
  "sed -n 'N;P;p'" "a\na\nb\n" "" "a\nb\nc\n"

# Hold space
testing "sed G (append hold space to pattern space)" 'sed G' "a\n\nb\n\nc\n\n" \
  "" "a\nb\nc\n"
#testing "sed g/G (swap/append hold and pattern space)"
#testing "sed g (swap hold/pattern space)"

testing "sed d ends script iteration" \
  "sed -e '/ook/d;s/ook/ping/p;i woot'" "" "" "ook\n"
testing "sed d ends script iteration (2)" \
  "sed -e '/ook/d;a\' -e 'bang'" "woot\nbang\n" "" "ook\nwoot\n"

# Multiple files, with varying newlines and NUL bytes
# Guarded cases run only when SKIP_KNOWN_BUGS is unset or empty.
test x"$SKIP_KNOWN_BUGS" = x"" && {
  testing "sed embedded NUL" "sed -e 's/woo/bang/'" "\0bang\0woo\0" "" \
    "\0woo\0woo\0"
}
testing "sed embedded NUL g" "sed -e 's/woo/bang/g'" "bang\0bang\0" "" \
  "woo\0woo\0"
test x"$SKIP_KNOWN_BUGS" = x"" && {
  # The script file is created here because the command contains a NUL byte.
  $ECHO -e "/woo/a he\0llo" > sed.commands
  testing "sed NUL in command" "sed -f sed.commands" "woo\nhe\0llo\n" "" "woo"
  rm sed.commands
}

# sed has funky behavior with newlines at the end of file. Test lots of
# corner cases with the optional newline appending behavior.

testing "sed normal newlines" "sed -e 's/woo/bang/' input -" "bang\nbang\n" \
  "woo\n" "woo\n"
testing "sed leave off trailing newline" "sed -e 's/woo/bang/' input -" \
  "bang\nbang" "woo\n" "woo"
testing "sed autoinsert newline" "sed -e 's/woo/bang/' input -" "bang\nbang" \
  "woo" "woo"
testing "sed empty file plus cat" "sed -e 's/nohit//' input -" "one\ntwo" \
  "" "one\ntwo"
testing "sed cat plus empty file" "sed -e 's/nohit//' input -" "one\ntwo" \
  "one\ntwo" ""
testing "sed append autoinserts newline" "sed -e '/woot/a woo' -" \
  "woot\nwoo\n" "" "woot"
testing "sed append autoinserts newline 2" "sed -e '/oot/a woo' - input" \
  "woot\nwoo\nboot\nwoo\n" "boot" "woot"
testing "sed append autoinserts newline 3" "sed -e '/oot/a woo' -i input && cat input" \
  "boot\nwoo\n" "boot" ""
testing "sed insert doesn't autoinsert newline" "sed -e '/woot/i woo' -" \
  "woo\nwoot" "" "woot"
testing "sed print autoinsert newlines" "sed -e 'p' -" "one\none" "" "one"
testing "sed print autoinsert newlines two files" "sed -e 'p' input -" \
  "one\none\ntwo\ntwo" "one" "two"
testing "sed noprint, no match, no newline" "sed -ne 's/woo/bang/' input" \
  "" "no\n" ""
testing "sed selective matches with one nl" "sed -ne 's/woo/bang/p' input -" \
  "a bang\nc bang\n" "a woo\nb no" "c woo\nd no"
testing "sed selective matches insert newline" \
  "sed -ne 's/woo/bang/p' input -" "a bang\nb bang\nd bang" \
  "a woo\nb woo" "c no\nd woo"
testing "sed selective matches noinsert newline" \
  "sed -ne 's/woo/bang/p' input -" "a bang\nb bang" "a woo\nb woo" \
  "c no\nd no"
testing "sed clusternewline" \
  "sed -e '/one/a 111' -e '/two/i 222' -e p input -" \
  "one\none\n111\n222\ntwo\ntwo" "one" "two"
testing "sed subst+write" \
  "sed -e 's/i/z/' -e 'woutputw' input -; $ECHO -n X; cat outputw" \
  "thzngy\nagaznXthzngy\nagazn" "thingy" "again"
rm outputw
testing "sed trailing NUL" \
  "sed 's/i/z/' input -" \
  "a\0b\0\nc" "a\0b\0" "c"
testing "sed escaped newline in command" \
  "sed 's/a/z\\
z/' input" \
  "z\nz" "a" ""

# Test end-of-file matching behavior

testing "sed match EOF" "sed -e '"'$p'"'" "hello\nthere\nthere" "" \
  "hello\nthere"
testing "sed match EOF two files" "sed -e '"'$p'"' input -" \
  "one\ntwo\nthree\nfour\nfour" "one\ntwo" "three\nfour"
# sed match EOF inline: gnu sed 4.1.5 outputs this:
#00000000 6f 6e 65 0a 6f 6f 6b 0a 6f 6f 6b 0a 74 77 6f 0a |one.ook.ook.two.|
#00000010 0a 74 68 72 65 65 0a 6f 6f 6b 0a 6f 6f 6b 0a 66 |.three.ook.ook.f|
#00000020 6f 75 72 |our|
# which looks buggy to me.
$ECHO -ne "three\nfour" > input2
testing "sed match EOF inline" \
  "sed -e '"'$i ook'"' -i input input2 && cat input input2" \
  "one\nook\ntwothree\nook\nfour" "one\ntwo" ""
rm input2

# Test lie-to-autoconf

testing "sed lie-to-autoconf" "sed --version | grep -o 'GNU sed version '" \
  "GNU sed version \n" "" ""

# Jump to nonexistent label
test x"$SKIP_KNOWN_BUGS" = x"" && {
  # Incompatibility: illegal jump is not detected if input is ""
  # (that is, no lines at all). GNU sed 4.1.5 complains even in this case
  testing "sed nonexistent label" "sed -e 'b walrus' 2>/dev/null || echo yes" \
    "yes\n" "" ""
}

testing "sed backref from empty s uses range regex" \
  "sed -e '/woot/s//eep \0 eep/'" "eep woot eep" "" "woot"

testing "sed backref from empty s uses range regex with newline" \
  "sed -e '/woot/s//eep \0 eep/'" "eep woot eep\n" "" "woot\n"

# -i with no filename

touch ./- # Detect gnu failure mode here.
testing "sed -i with no arg [GNUFAIL]" "sed -e '' -i 2> /dev/null || echo yes" \
  "yes\n" "" ""
rm ./- # Clean up

testing "sed s/xxx/[/" "sed -e 's/xxx/[/'" "[\n" "" "xxx\n"

# Ponder this a bit more, why "woo not found" from gnu version?
#testing "sed doesn't substitute in deleted line" \
#  "sed -e '/ook/d;s/ook//;t woo;a bang;'" "bang" "" "ook\n"

# This makes both seds very unhappy. Why?
#testing "sed -g (exhaustive)" "sed -e 's/[[:space:]]*/,/g'" ",1,2,3,4,5," \
#  "" "12345"

# testing "description" "commands" "result" "infile" "stdin"

testing "sed n command must reset 'substituted' bit" \
  "sed 's/1/x/;T;n;: next;s/3/y/;t quit;n;b next;: quit;q'" \
  "0\nx\n2\ny\n" "" "0\n1\n2\n3\n"

testing "sed d does not break n,m matching" \
  "sed -n '1d;1,3p'" \
  "second\nthird\n" "" "first\nsecond\nthird\nfourth\n"

testing "sed d does not break n,regex matching" \
  "sed -n '1d;1,/hir/p'" \
  "second\nthird\n" "" "first\nsecond\nthird\nfourth\n"

testing "sed d does not break n,regex matching #2" \
  "sed -n '1,5d;1,/hir/p'" \
  "second2\nthird2\n" "" \
  "first\nsecond\nthird\nfourth\n""first2\nsecond2\nthird2\nfourth2\n"

testing "sed 2d;2,1p (gnu compat)" \
  "sed -n '2d;2,1p'" \
  "third\n" "" \
  "first\nsecond\nthird\nfourth\n"

# Regex means: "match / at BOL or nothing, then one or more not-slashes".
# The bug was that second slash in /usr/lib was treated as "at BOL" too.
testing "sed beginning (^) matches only once" \
  "sed 's,\(^/\|\)[^/][^/]*,>\0<,g'" \
  ">/usr</>lib<\n" "" \
  "/usr/lib\n"

testing "sed c" \
  "sed 'crepl'" \
  "repl\nrepl\n" "" \
  "first\nsecond\n"

testing "sed nested {}s" \
  "sed '/asd/ { p; /s/ { s/s/c/ }; p; q }'" \
  "qwe\nasd\nacd\nacd\n" "" \
  "qwe\nasd\nzxc\n"

# The leading whitespace inside the next fixtures is part of the data: the
# sed script, the expected output and the input must stay in agreement.
testing "sed a cmd ended by double backslash" \
  "sed -e '/| one /a \\
 | three \\\\' -e '/| one-/a \\
 | three-* \\\\'" \
' | one \\
 | three \\
 | two \\
' '' \
' | one \\
 | two \\
'

testing "sed a cmd understands \\n,\\t,\\r" \
  "sed '/1/a\\\\t\\rzero\\none\\\\ntwo\\\\\\nthree'" \
"\
line1
\t\rzero
one\\\\ntwo\\
three
" "" "line1\n"

testing "sed i cmd understands \\n,\\t,\\r" \
  "sed '/1/i\\\\t\\rzero\\none\\\\ntwo\\\\\\nthree'" \
"\
\t\rzero
one\\\\ntwo\\
three
line1
" "" "line1\n"

# first three lines are deleted; 4th line is matched and printed by "2,3" and by "4" ranges
testing "sed with N skipping lines past ranges on next cmds" \
  "sed -n '1{N;N;d};1p;2,3p;3p;4p'" \
  "4\n4\n" "" "1\n2\n3\n4\n"

testing "sed -i with address modifies all files, not only first" \
  "cp input input2; sed -i -e '1s/foo/bar/' input input2 && cat input input2; rm input2" \
  "bar\nbar\n" "foo\n" ""

testing "sed understands \r" \
  "sed 's/r/\r/'" \
  "\rrr\n" "" "rrr\n"

testing "sed -i finishes ranges correctly" \
  "sed '1,2d' -i input; echo \$?; cat input" \
  "0\n3\n4\n" "1\n2\n3\n4\n" ""

testing "sed zero chars match/replace advances correctly 1" \
  "sed 's/l*/@/g'" \
  "@h@e@o@\n" "" "helllo\n"

testing "sed zero chars match/replace advances correctly 2" \
  "sed 's [^ .]* x g'" \
  "x x.x\n" "" " a.b\n"

testing "sed zero chars match/replace logic must not falsely trigger here 1" \
  "sed 's/a/A/g'" \
  "_AAA1AA\n" "" "_aaa1aa\n"

testing "sed zero chars match/replace logic must not falsely trigger here 2" \
  "sed 's/ *$/_/g'" \
  "qwerty_\n" "" "qwerty\n"

testing "sed /\$_in_regex/ should not match newlines, only end-of-line" \
  "sed ': testcont; /\\\\$/{ =; N; b testcont }'" \
  "\
this is a regular line
2
line with \\
continuation
more regular lines
5
line with \\
continuation
" \
  "" "\
this is a regular line
line with \\
continuation
more regular lines
line with \\
continuation
"

testing "sed s///NUM test" \
  "sed -e 's/a/b/2; s/a/c/g'" \
  "cb\n" "" "aa\n"

testing "sed /regex/,N{...} addresses work" \
  "sed /^2/,2{d}" \
  "1\n3\n4\n5\n" \
  "" \
  "1\n2\n3\n4\n5\n"

testing "sed /regex/,+N{...} addresses work" \
  "sed /^2/,+2{d}" \
  "1\n5\n" \
  "" \
  "1\n2\n3\n4\n5\n"

testing "sed /regex/,+N{...} addresses work 2" \
  "sed -n '/a/,+1 p'" \
  "a\n1\na\n2\na\n3\n" \
  "" \
  "a\n1\nc\nc\na\n2\na\n3\n"

# The three -i cases below copy stdin into input2 so that two files are
# edited in place; the last argument ends the command (no continuation).
testing "sed /regex/,+N{...} -i works" \
  "cat - >input2; sed /^4/,+2{d} -i input input2; echo \$?; cat input input2; rm input2" \
  "0\n""1\n2\n3\n7\n8\n""1\n2\n7\n8\n" \
  "1\n2\n3\n4\n5\n6\n7\n8\n" \
  "1\n2\n4\n5\n6\n7\n8\n"

# GNU sed 4.2.1 would also accept "/^4/,+{d}" with the same meaning, we don't
testing "sed /regex/,+0{...} -i works" \
  "cat - >input2; sed /^4/,+0{d} -i input input2; echo \$?; cat input input2; rm input2" \
  "0\n""1\n2\n3\n5\n6\n7\n8\n""1\n2\n5\n6\n7\n8\n" \
  "1\n2\n3\n4\n5\n6\n7\n8\n" \
  "1\n2\n4\n5\n6\n7\n8\n"

# GNU sed 4.2.1 would also accept "/^4/,+d" with the same meaning, we don't
testing "sed /regex/,+0<cmd> -i works" \
  "cat - >input2; sed /^4/,+0d -i input input2; echo \$?; cat input input2; rm input2" \
  "0\n""1\n2\n3\n5\n6\n7\n8\n""1\n2\n5\n6\n7\n8\n" \
  "1\n2\n3\n4\n5\n6\n7\n8\n" \
  "1\n2\n4\n5\n6\n7\n8\n"

testing "sed 's///w FILE'" \
  "sed 's/qwe/ZZZ/wz'; cat z; rm z" \
  "123\nZZZ\nasd\n""ZZZ\n" \
  "" \
  "123\nqwe\nasd\n"

testing "sed uses previous regexp" \
  "sed '/w/p;//q'" \
  "q\nw\nw\n" \
  "" \
  "q\nw\ne\nr\n"

# testing "description" "commands" "result" "infile" "stdin"

# The exit status is the value of FAILCOUNT at this point.
exit $FAILCOUNT