#!/bin/sh
# File: busybox/testsuite/sed.tests

# SUSv3 compliant sed tests.
# Copyright 2005 by Rob Landley <rob@landley.net>
# Licensed under GPLv2, see file LICENSE in this source tree.

# How this script is organised:
#   * ./testing.sh is sourced relative to the current directory, so run the
#     script from the directory that contains testing.sh.
#   * The names `testing`, $ECHO and $FAILCOUNT are not defined in this file;
#     presumably they are provided by testing.sh (TODO confirm).
#   * Tests wrapped in `test x"$SKIP_KNOWN_BUGS" = x"" && { ... }` run only
#     when SKIP_KNOWN_BUGS is unset or empty.
#   * Several tests embed literal newlines and leading whitespace inside
#     quoted arguments.  That whitespace is test data: do not re-indent it.

. ./testing.sh

# testing "description" "commands" "result" "infile" "stdin"

# Corner cases
testing "sed no files (stdin)" 'sed ""' "hello\n" "" "hello\n"
testing "sed explicit stdin" 'sed "" -' "hello\n" "" "hello\n"
testing "sed handles empty lines" "sed -e 's/\$/@/'" "@\n" "" "\n"
testing "sed stdin twice" 'sed "" - -' "hello" "" "hello"

# Trailing EOF.
#       Match $, at end of each file or all files?

# -e corner cases
#       without -e
#       multiple -e
#               interact with a
#       -eee arg1 arg2 arg3
# -f corner cases
#       -e -f -e
# -n corner cases
#       no newline at EOF?
# -r corner cases
#       Just make sure it works.
# -i corner cases:
#       sed -i -
#       permissions
#       -i on a symlink
#       on a directory
#       With $ last-line test
# Continue with \
#       End of script with trailing \

# command list
testing "sed accepts blanks before command" "sed -e '1 d'" "" "" ""
testing "sed accepts newlines in -e" "sed -e 'i\
1
a\
3'" "1\n2\n3\n" "" "2\n"
testing "sed accepts multiple -e" "sed -e 'i\' -e '1' -e 'a\' -e '3'" \
        "1\n2\n3\n" "" "2\n"

# substitutions
testing "sed -n" "sed -n -e s/foo/bar/ -e s/bar/baz/" "" "" "foo\n"
testing "sed with empty match" "sed 's/z*//g'" "string\n" "" "string\n"
testing "sed s//p" "sed -e s/foo/bar/p -e s/bar/baz/p" "bar\nbaz\nbaz\n" \
        "" "foo\n"
testing "sed -n s//p" "sed -ne s/abc/def/p" "def\n" "" "abc\n"
testing "sed s//g (exhaustive)" "sed -e 's/[[:space:]]*/,/g'" ",1,2,3,4,5,\n" \
        "" "12345\n"
testing "sed s arbitrary delimiter" "sed -e 's woo boing '" "boing\n" "" "woo\n"
testing "sed s chains" "sed -e s/foo/bar/ -e s/bar/baz/" "baz\n" "" "foo\n"
testing "sed s chains2" "sed -e s/foo/bar/ -e s/baz/nee/" "bar\n" "" "foo\n"
testing "sed s [delimiter]" "sed -e 's@[@]@@'" "onetwo" "" "one@two"
testing "sed s with \\t (GNU ext)" "sed 's/\t/ /'" "one two" "" "one\ttwo"

# branch
testing "sed b (branch)" "sed -e 'b one;p;: one'" "foo\n" "" "foo\n"
testing "sed b (branch with no label jumps to end)" "sed -e 'b;p'" \
        "foo\n" "" "foo\n"

# test and branch
testing "sed t (test/branch)" "sed -e 's/a/1/;t one;p;: one;p'" \
        "1\n1\nb\nb\nb\nc\nc\nc\n" "" "a\nb\nc\n"
testing "sed t (test/branch clears test bit)" "sed -e 's/a/b/;:loop;t loop'" \
        "b\nb\nc\n" "" "a\nb\nc\n"
testing "sed T (!test/branch)" "sed -e 's/a/1/;T notone;p;: notone;p'" \
        "1\n1\n1\nb\nb\nc\nc\n" "" "a\nb\nc\n"

testing "sed n (flushes pattern space, terminates early)" "sed -e 'n;p'" \
        "a\nb\nb\nc\n" "" "a\nb\nc\n"

# non-GNU sed: N does _not_ flush pattern space, therefore c is eaten @ script end
# GNU sed: N flushes pattern space, therefore c is printed too @ script end
testing "sed N (flushes pattern space (GNU behavior))" "sed -e 'N;p'" \
        "a\nb\na\nb\nc\n" "" "a\nb\nc\n"

testing "sed N test2" "sed ':a;N;s/\n/ /;ta'" \
        "a b c\n" "" "a\nb\nc\n"

testing "sed N test3" "sed 'N;s/\n/ /'" \
        "a b\nc\n" "" "a\nb\nc\n"

testing "sed address match newline" 'sed "/b/N;/b\\nc/i woo"' \
        "a\nwoo\nb\nc\nd\n" "" "a\nb\nc\nd\n"

# Multiple lines in pattern space
testing "sed N (stops at end of input) and P (prints to first newline only)" \
        "sed -n 'N;P;p'" "a\na\nb\n" "" "a\nb\nc\n"

# Hold space
testing "sed G (append hold space to pattern space)" 'sed G' "a\n\nb\n\nc\n\n" \
        "" "a\nb\nc\n"
#testing "sed g/G (swap/append hold and pattern space)"
#testing "sed g (swap hold/pattern space)"

testing "sed d ends script iteration" \
        "sed -e '/ook/d;s/ook/ping/p;i woot'" "" "" "ook\n"
testing "sed d ends script iteration (2)" \
        "sed -e '/ook/d;a\' -e 'bang'" "woot\nbang\n" "" "ook\nwoot\n"

# Multiple files, with varying newlines and NUL bytes
# (guarded tests run only when SKIP_KNOWN_BUGS is unset or empty)
test x"$SKIP_KNOWN_BUGS" = x"" && {
testing "sed embedded NUL" "sed -e 's/woo/bang/'" "\0bang\0woo\0" "" \
        "\0woo\0woo\0"
}
testing "sed embedded NUL g" "sed -e 's/woo/bang/g'" "bang\0bang\0" "" \
        "woo\0woo\0"
test x"$SKIP_KNOWN_BUGS" = x"" && {
# The sed script file is created for this one test and removed right after it.
$ECHO -e "/woo/a he\0llo" > sed.commands
testing "sed NUL in command" "sed -f sed.commands" "woo\nhe\0llo\n" "" "woo"
rm sed.commands
}

# sed has funky behavior with newlines at the end of file.  Test lots of
# corner cases with the optional newline appending behavior.

testing "sed normal newlines" "sed -e 's/woo/bang/' input -" "bang\nbang\n" \
        "woo\n" "woo\n"
testing "sed leave off trailing newline" "sed -e 's/woo/bang/' input -" \
        "bang\nbang" "woo\n" "woo"
testing "sed autoinsert newline" "sed -e 's/woo/bang/' input -" "bang\nbang" \
        "woo" "woo"
testing "sed empty file plus cat" "sed -e 's/nohit//' input -" "one\ntwo" \
        "" "one\ntwo"
testing "sed cat plus empty file" "sed -e 's/nohit//' input -" "one\ntwo" \
        "one\ntwo" ""
testing "sed append autoinserts newline" "sed -e '/woot/a woo' -" \
        "woot\nwoo\n" "" "woot"
testing "sed append autoinserts newline 2" "sed -e '/oot/a woo' - input" \
        "woot\nwoo\nboot\nwoo\n" "boot" "woot"
testing "sed append autoinserts newline 3" "sed -e '/oot/a woo' -i input && cat input" \
        "boot\nwoo\n" "boot" ""
testing "sed insert doesn't autoinsert newline" "sed -e '/woot/i woo' -" \
        "woo\nwoot" "" "woot"
testing "sed print autoinsert newlines" "sed -e 'p' -" "one\none" "" "one"
testing "sed print autoinsert newlines two files" "sed -e 'p' input -" \
        "one\none\ntwo\ntwo" "one" "two"
testing "sed noprint, no match, no newline" "sed -ne 's/woo/bang/' input" \
        "" "no\n" ""
testing "sed selective matches with one nl" "sed -ne 's/woo/bang/p' input -" \
        "a bang\nc bang\n" "a woo\nb no" "c woo\nd no"
testing "sed selective matches insert newline" \
        "sed -ne 's/woo/bang/p' input -" "a bang\nb bang\nd bang" \
        "a woo\nb woo" "c no\nd woo"
testing "sed selective matches noinsert newline" \
        "sed -ne 's/woo/bang/p' input -" "a bang\nb bang" "a woo\nb woo" \
        "c no\nd no"
testing "sed clusternewline" \
        "sed -e '/one/a 111' -e '/two/i 222' -e p input -" \
        "one\none\n111\n222\ntwo\ntwo" "one" "two"
testing "sed subst+write" \
        "sed -e 's/i/z/' -e 'woutputw' input -; $ECHO -n X; cat outputw" \
        "thzngy\nagaznXthzngy\nagazn" "thingy" "again"
# outputw is the file written by the 'w' command in the test above.
rm outputw
testing "sed trailing NUL" \
        "sed 's/i/z/' input -" \
        "a\0b\0\nc" "a\0b\0" "c"
testing "sed escaped newline in command" \
        "sed 's/a/z\\
z/' input" \
        "z\nz" "a" ""

# Test end-of-file matching behavior

testing "sed match EOF" "sed -e '"'$p'"'" "hello\nthere\nthere" "" \
        "hello\nthere"
testing "sed match EOF two files" "sed -e '"'$p'"' input -" \
        "one\ntwo\nthree\nfour\nfour" "one\ntwo" "three\nfour"
# sed match EOF inline: gnu sed 4.1.5 outputs this:
#00000000  6f 6e 65 0a 6f 6f 6b 0a  6f 6f 6b 0a 74 77 6f 0a  |one.ook.ook.two.|
#00000010  0a 74 68 72 65 65 0a 6f  6f 6b 0a 6f 6f 6b 0a 66  |.three.ook.ook.f|
#00000020  6f 75 72                                          |our|
# which looks buggy to me.
$ECHO -ne "three\nfour" > input2
testing "sed match EOF inline" \
        "sed -e '"'$i ook'"' -i input input2 && cat input input2" \
        "one\nook\ntwothree\nook\nfour" "one\ntwo" ""
rm input2

# Test lie-to-autoconf

testing "sed lie-to-autoconf" "sed --version | grep -o 'GNU sed version '" \
        "GNU sed version \n" "" ""

# Jump to nonexistent label
test x"$SKIP_KNOWN_BUGS" = x"" && {
# Incompatibility: illegal jump is not detected if input is ""
# (that is, no lines at all). GNU sed 4.1.5 complains even in this case
testing "sed nonexistent label" "sed -e 'b walrus' 2>/dev/null || echo yes" \
        "yes\n" "" ""
}

testing "sed backref from empty s uses range regex" \
        "sed -e '/woot/s//eep \0 eep/'" "eep woot eep" "" "woot"

testing "sed backref from empty s uses range regex with newline" \
        "sed -e '/woot/s//eep \0 eep/'" "eep woot eep\n" "" "woot\n"

# -i with no filename

touch ./-  # Detect gnu failure mode here.
testing "sed -i with no arg [GNUFAIL]" "sed -e '' -i 2> /dev/null || echo yes" \
        "yes\n" "" ""
rm ./-     # Clean up

testing "sed s/xxx/[/" "sed -e 's/xxx/[/'" "[\n" "" "xxx\n"

# Ponder this a bit more, why "woo not found" from gnu version?
#testing "sed doesn't substitute in deleted line" \
#       "sed -e '/ook/d;s/ook//;t woo;a bang;'" "bang" "" "ook\n"

# This makes both seds very unhappy.  Why?
#testing "sed -g (exhaustive)" "sed -e 's/[[:space:]]*/,/g'" ",1,2,3,4,5," \
#       "" "12345"

# testing "description" "commands" "result" "infile" "stdin"

testing "sed n command must reset 'substituted' bit" \
        "sed 's/1/x/;T;n;: next;s/3/y/;t quit;n;b next;: quit;q'" \
        "0\nx\n2\ny\n" "" "0\n1\n2\n3\n"

testing "sed d does not break n,m matching" \
        "sed -n '1d;1,3p'" \
        "second\nthird\n" "" "first\nsecond\nthird\nfourth\n"

testing "sed d does not break n,regex matching" \
        "sed -n '1d;1,/hir/p'" \
        "second\nthird\n" "" "first\nsecond\nthird\nfourth\n"

testing "sed d does not break n,regex matching #2" \
        "sed -n '1,5d;1,/hir/p'" \
        "second2\nthird2\n" "" \
        "first\nsecond\nthird\nfourth\n""first2\nsecond2\nthird2\nfourth2\n"

testing "sed 2d;2,1p (gnu compat)" \
        "sed -n '2d;2,1p'" \
        "third\n" "" \
        "first\nsecond\nthird\nfourth\n"

# Regex means: "match / at BOL or nothing, then one or more not-slashes".
# The bug was that second slash in /usr/lib was treated as "at BOL" too.
testing "sed beginning (^) matches only once" \
        "sed 's,\(^/\|\)[^/][^/]*,>\0<,g'" \
        ">/usr</>lib<\n" "" \
        "/usr/lib\n"

testing "sed c" \
        "sed 'crepl'" \
        "repl\nrepl\n" "" \
        "first\nsecond\n"

testing "sed nested {}s" \
        "sed '/asd/ { p; /s/ { s/s/c/ }; p; q }'" \
        "qwe\nasd\nacd\nacd\n" "" \
        "qwe\nasd\nzxc\n"

# NOTE: the leading whitespace inside the quoted arguments of the next test
# is part of the sed script and of the expected/input data; keep it verbatim.
testing "sed a cmd ended by double backslash" \
        "sed -e '/| one /a \\
        | three \\\\' -e '/| one-/a \\
        | three-* \\\\'" \
'       | one \\
        | three \\
        | two \\
' '' \
'       | one \\
        | two \\
'

testing "sed a cmd understands \\n,\\t,\\r" \
        "sed '/1/a\\\\t\\rzero\\none\\\\ntwo\\\\\\nthree'" \
"\
line1
\t\rzero
one\\\\ntwo\\
three
" "" "line1\n"

testing "sed i cmd understands \\n,\\t,\\r" \
        "sed '/1/i\\\\t\\rzero\\none\\\\ntwo\\\\\\nthree'" \
"\
\t\rzero
one\\\\ntwo\\
three
line1
" "" "line1\n"

# first three lines are deleted; 4th line is matched and printed by "2,3" and by "4" ranges
testing "sed with N skipping lines past ranges on next cmds" \
        "sed -n '1{N;N;d};1p;2,3p;3p;4p'" \
        "4\n4\n" "" "1\n2\n3\n4\n"

testing "sed -i with address modifies all files, not only first" \
        "cp input input2; sed -i -e '1s/foo/bar/' input input2 && cat input input2; rm input2" \
        "bar\nbar\n" "foo\n" ""

testing "sed understands \r" \
        "sed 's/r/\r/'" \
        "\rrr\n" "" "rrr\n"

testing "sed -i finishes ranges correctly" \
        "sed '1,2d' -i input; echo \$?; cat input" \
        "0\n3\n4\n" "1\n2\n3\n4\n" ""

testing "sed zero chars match/replace advances correctly 1" \
        "sed 's/l*/@/g'" \
        "@h@e@o@\n" "" "helllo\n"

testing "sed zero chars match/replace advances correctly 2" \
        "sed 's [^ .]* x g'" \
        "x x.x\n" "" " a.b\n"

testing "sed zero chars match/replace logic must not falsely trigger here 1" \
        "sed 's/a/A/g'" \
        "_AAA1AA\n" "" "_aaa1aa\n"

testing "sed zero chars match/replace logic must not falsely trigger here 2" \
        "sed 's/ *$/_/g'" \
        "qwerty_\n" "" "qwerty\n"

# The bare "2" and "5" lines in the expected output are the line numbers
# printed by the '=' command for the two lines that end in a backslash.
testing "sed /\$_in_regex/ should not match newlines, only end-of-line" \
        "sed ': testcont; /\\\\$/{ =; N; b testcont }'" \
        "\
this is a regular line
2
line with \\
continuation
more regular lines
5
line with \\
continuation
" \
        "" "\
this is a regular line
line with \\
continuation
more regular lines
line with \\
continuation
"

testing "sed s///NUM test" \
        "sed -e 's/a/b/2; s/a/c/g'" \
        "cb\n" "" "aa\n"

testing "sed /regex/,N{...} addresses work" \
        "sed /^2/,2{d}" \
        "1\n3\n4\n5\n" \
        "" \
        "1\n2\n3\n4\n5\n"

testing "sed /regex/,+N{...} addresses work" \
        "sed /^2/,+2{d}" \
        "1\n5\n" \
        "" \
        "1\n2\n3\n4\n5\n"

testing "sed /regex/,+N{...} addresses work 2" \
        "sed -n '/a/,+1 p'" \
        "a\n1\na\n2\na\n3\n" \
        "" \
        "a\n1\nc\nc\na\n2\na\n3\n"

testing "sed /regex/,+N{...} -i works" \
        "cat - >input2; sed /^4/,+2{d} -i input input2; echo \$?; cat input input2; rm input2" \
        "0\n""1\n2\n3\n7\n8\n""1\n2\n7\n8\n" \
        "1\n2\n3\n4\n5\n6\n7\n8\n" \
        "1\n2\n4\n5\n6\n7\n8\n"

# GNU sed 4.2.1 would also accept "/^4/,+{d}" with the same meaning, we don't
testing "sed /regex/,+0{...} -i works" \
        "cat - >input2; sed /^4/,+0{d} -i input input2; echo \$?; cat input input2; rm input2" \
        "0\n""1\n2\n3\n5\n6\n7\n8\n""1\n2\n5\n6\n7\n8\n" \
        "1\n2\n3\n4\n5\n6\n7\n8\n" \
        "1\n2\n4\n5\n6\n7\n8\n"

# GNU sed 4.2.1 would also accept "/^4/,+d" with the same meaning, we don't
testing "sed /regex/,+0<cmd> -i works" \
        "cat - >input2; sed /^4/,+0d -i input input2; echo \$?; cat input input2; rm input2" \
        "0\n""1\n2\n3\n5\n6\n7\n8\n""1\n2\n5\n6\n7\n8\n" \
        "1\n2\n3\n4\n5\n6\n7\n8\n" \
        "1\n2\n4\n5\n6\n7\n8\n"

testing "sed 's///w FILE'" \
        "sed 's/qwe/ZZZ/wz'; cat z; rm z" \
        "123\nZZZ\nasd\n""ZZZ\n" \
        "" \
        "123\nqwe\nasd\n"

testing "sed uses previous regexp" \
        "sed '/w/p;//q'" \
        "q\nw\nw\n" \
        "" \
        "q\nw\ne\nr\n"

# testing "description" "commands" "result" "infile" "stdin"

# The exit status is the value of FAILCOUNT, which this file never sets itself.
exit $FAILCOUNT