#!/bin/sh

# SUSv3 compliant sed tests.
# Copyright 2005 by Rob Landley <rob@landley.net>
# Licensed under GPL v2, see file LICENSE for details.

# Load the shared test harness. The "testing" command used throughout is not
# defined in this file, so it presumably comes from here.
. testing.sh

# Usage: testing "description" "arguments" "result" "infile" "stdin"

# Corner cases: implicit stdin, explicit "-", an empty line, and "-" twice.
testing "sed no files (stdin)" \
  'sed ""' "hello\n" "" "hello\n"
testing "sed explicit stdin" \
  'sed "" -' "hello\n" "" "hello\n"
testing "sed handles empty lines" \
  "sed -e 's/\$/@/'" "@\n" "" "\n"
testing "sed stdin twice" \
  'sed "" - -' "hello" "" "hello"

# Trailing EOF.
#   Match $, at end of each file or all files?

# -e corner cases
#   without -e
#   multiple -e
#     interact with a
#   -eee arg1 arg2 arg3
# -f corner cases
#   -e -f -e
# -n corner cases
#   no newline at EOF?
# -r corner cases
#   Just make sure it works.
# -i corner cases:
#   sed -i -
#   permissions
#   -i on a symlink
#   on a directory
# With $ last-line test
# Continue with \
#   End of script with trailing \

# command list
# Scripts may carry a blank between address and command, embedded newlines
# inside a single -e, or be split across several -e options.
testing "sed accepts blanks before command" \
  "sed -e '1 d'" "" "" ""
testing "sed accepts newlines in -e" \
  "sed -e 'i\
1
a\
3'" \
  "1\n2\n3\n" "" "2\n"
testing "sed accepts multiple -e" \
  "sed -e 'i\' -e '1' -e 'a\' -e '3'" \
  "1\n2\n3\n" "" "2\n"

# substitutions
# Covers -n, the p and g flags, unusual delimiters, chained s commands,
# a delimiter inside a bracket expression, and the \t escape.
testing "sed -n" \
  "sed -n -e s/foo/bar/ -e s/bar/baz/" "" "" "foo\n"
testing "sed s//p" \
  "sed -e s/foo/bar/p -e s/bar/baz/p" \
  "bar\nbaz\nbaz\n" "" "foo\n"
testing "sed -n s//p" \
  "sed -ne s/abc/def/p" "def\n" "" "abc\n"
testing "sed s//g (exhaustive)" \
  "sed -e 's/[[:space:]]*/,/g'" \
  ",1,2,3,4,5,\n" "" "12345\n"
testing "sed s arbitrary delimiter" \
  "sed -e 's woo boing '" "boing\n" "" "woo\n"
testing "sed s chains" \
  "sed -e s/foo/bar/ -e s/bar/baz/" "baz\n" "" "foo\n"
testing "sed s chains2" \
  "sed -e s/foo/bar/ -e s/baz/nee/" "bar\n" "" "foo\n"
testing "sed s [delimiter]" \
  "sed -e 's@[@]@@'" "onetwo" "" "one@two"
testing "sed s with \\t (GNU ext)" \
  "sed 's/\t/ /'" "one two" "" "one\ttwo"

# branch
# "b label" skips the p in between; a bare "b" jumps to the end of the script.
testing "sed b (branch)" \
  "sed -e 'b one;p;: one'" "foo\n" "" "foo\n"
testing "sed b (branch with no label jumps to end)" \
  "sed -e 'b;p'" "foo\n" "" "foo\n"

# test and branch
# t branches after a successful substitution, T after an unsuccessful one.
testing "sed t (test/branch)" \
  "sed -e 's/a/1/;t one;p;: one;p'" \
  "1\n1\nb\nb\nb\nc\nc\nc\n" "" "a\nb\nc\n"
testing "sed t (test/branch clears test bit)" \
  "sed -e 's/a/b/;:loop;t loop'" \
  "b\nb\nc\n" "" "a\nb\nc\n"
testing "sed T (!test/branch)" \
  "sed -e 's/a/1/;T notone;p;: notone;p'" \
  "1\n1\n1\nb\nb\nc\nc\n" "" "a\nb\nc\n"

# Normal sed end-of-script doesn't print "c" because n flushed the pattern
# space. If n hits EOF, pattern space is empty when script ends.
# Query: how does this interact with no newline at EOF?
testing "sed n (flushes pattern space, terminates early)" \
  "sed -e 'n;p'" \
  "a\nb\nb\nc\n" "" "a\nb\nc\n"
# N does _not_ flush pattern space, therefore c is still in there @ script end.
testing "sed N (doesn't flush pattern space when terminating)" \
  "sed -e 'N;p'" \
  "a\nb\na\nb\nc\n" "" "a\nb\nc\n"
# After N joins two lines, an address regex can match the embedded newline.
testing "sed address match newline" \
  'sed "/b/N;/b\\nc/i woo"' \
  "a\nwoo\nb\nc\nd\n" "" "a\nb\nc\nd\n"

# Multiple lines in pattern space
testing "sed N (stops at end of input) and P (prints to first newline only)" \
  "sed -n 'N;P;p'" \
  "a\na\nb\n" "" "a\nb\nc\n"

# Hold space
testing "sed G (append hold space to pattern space)" \
  'sed G' \
  "a\n\nb\n\nc\n\n" "" "a\nb\nc\n"
# Not written yet (POSIX: g copies hold space over pattern space, G appends
# it, x exchanges the two):
#testing "sed g/G (copy/append hold space to pattern space)"
#testing "sed x (swap hold/pattern space)"

# d starts the next cycle at once, so commands after it never see the line.
testing "sed d ends script iteration" \
  "sed -e '/ook/d;s/ook/ping/p;i woot'" "" "" "ook\n"
testing "sed d ends script iteration (2)" \
  "sed -e '/ook/d;a\' -e 'bang'" \
  "woot\nbang\n" "" "ook\nwoot\n"

# Multiple files, with varying newlines and NUL bytes
# Without g only the first "woo" is replaced; NUL bytes pass through intact.
testing "sed embedded NUL" \
  "sed -e 's/woo/bang/'" \
  "\0bang\0woo\0" "" "\0woo\0woo\0"
testing "sed embedded NUL g" \
  "sed -e 's/woo/bang/g'" \
  "bang\0bang\0" "" "woo\0woo\0"
# Create the sed script file used by the "NUL in command" test.
# printf replaces "echo -e": this script runs under #!/bin/sh, where POSIX
# leaves echo's handling of -e and backslashes unspecified (some shells print
# "-e" literally). printf's \0 octal escape emits the NUL byte, and the
# explicit \n reproduces the newline echo appended.
printf '/woo/a he\0llo\n' > sed.commands
# Run the script file sed.commands (which holds an "a" command whose text
# contains a NUL byte), then remove that fixture.
testing "sed NUL in command" \
  "sed -f sed.commands" \
  "woo\nhe\0llo\n" "" "woo"
rm sed.commands

# sed has funky behavior with newlines at the end of file. Test lots of
# corner cases with the optional newline appending behavior.

# Each case reads "input" (4th argument) and/or stdin (5th argument).
testing "sed normal newlines" \
  "sed -e 's/woo/bang/' input -" \
  "bang\nbang\n" "woo\n" "woo\n"
testing "sed leave off trailing newline" \
  "sed -e 's/woo/bang/' input -" \
  "bang\nbang" "woo\n" "woo"
testing "sed autoinsert newline" \
  "sed -e 's/woo/bang/' input -" \
  "bang\nbang" "woo" "woo"
testing "sed empty file plus cat" \
  "sed -e 's/nohit//' input -" \
  "one\ntwo" "" "one\ntwo"
testing "sed cat plus empty file" \
  "sed -e 's/nohit//' input -" \
  "one\ntwo" "one\ntwo" ""
testing "sed append autoinserts newline" \
  "sed -e '/woot/a woo' -" \
  "woot\nwoo\n" "" "woot"
testing "sed insert doesn't autoinsert newline" \
  "sed -e '/woot/i woo' -" \
  "woo\nwoot" "" "woot"
testing "sed print autoinsert newlines" \
  "sed -e 'p' -" \
  "one\none" "" "one"
testing "sed print autoinsert newlines two files" \
  "sed -e 'p' input -" \
  "one\none\ntwo\ntwo" "one" "two"
testing "sed noprint, no match, no newline" \
  "sed -ne 's/woo/bang/' input" \
  "" "no\n" ""
testing "sed selective matches with one nl" \
  "sed -ne 's/woo/bang/p' input -" \
  "a bang\nc bang\n" "a woo\nb no" "c woo\nd no"
testing "sed selective matches insert newline" \
  "sed -ne 's/woo/bang/p' input -" \
  "a bang\nb bang\nd bang" "a woo\nb woo" "c no\nd woo"
testing "sed selective matches noinsert newline" \
  "sed -ne 's/woo/bang/p' input -" \
  "a bang\nb bang" "a woo\nb woo" "c no\nd no"
testing "sed clusternewline" \
  "sed -e '/one/a 111' -e '/two/i 222' -e p input -" \
  "one\none\n111\n222\ntwo\ntwo" "one" "two"
# The w command writes to "outputw"; the test prints an X marker and then
# the file's contents after sed's own output.
testing "sed subst+write" \
  "sed -e 's/i/z/' -e 'woutputw' input -; echo -n X; cat outputw" \
  "thzngy\nagaznXthzngy\nagazn" \
  "thingy" "again"
rm outputw
# The input file ends in a NUL byte rather than a newline.
testing "sed trailing NUL" \
  "sed 's/i/z/' input -" \
  "a\0b\0\nc" \
  "a\0b\0" "c"
# The s replacement contains a backslash-escaped literal newline.
testing "sed escaped newline in command" \
  "sed 's/a/z\\
z/' input" \
  "z\nz" \
  "a" ""

# Test end-of-file matching behavior

# The '"'$p'"' quoting keeps the shell from expanding $p, so the command
# string carries a literal $p. With two inputs, only the very last line
# ("four") is expected to be printed twice.
testing "sed match EOF" \
  "sed -e '"'$p'"'" \
  "hello\nthere\nthere" "" "hello\nthere"
testing "sed match EOF two files" \
  "sed -e '"'$p'"' input -" \
  "one\ntwo\nthree\nfour\nfour" "one\ntwo" "three\nfour"
# sed match EOF inline: gnu sed 4.1.5 outputs this:
#00000000 6f 6e 65 0a 6f 6f 6b 0a 6f 6f 6b 0a 74 77 6f 0a |one.ook.ook.two.|
#00000010 0a 74 68 72 65 65 0a 6f 6f 6b 0a 6f 6f 6b 0a 66 |.three.ook.ook.f|
#00000020 6f 75 72 |our|
# which looks buggy to me.
#
# Create the second input file, deliberately without a trailing newline.
# printf replaces "echo -ne": this script runs under #!/bin/sh, where POSIX
# leaves echo's option and backslash handling unspecified.
printf 'three\nfour' > input2
# In-place edit of two files ("input" and input2), then print both back.
testing "sed match EOF inline" \
  "sed -e '"'$i ook'"' -i input input2 && cat input input2" \
  "one\nook\ntwothree\nook\nfour" \
  "one\ntwo" ""
rm input2

# Test lie-to-autoconf

testing "sed lie-to-autoconf" \
  "sed --version | grep -o 'GNU sed version '" \
  "GNU sed version \n" "" ""

# Jump to nonexistent label
# sed is expected to fail, so the "|| echo yes" fallback supplies the output.
testing "sed nonexistent label" \
  "sed -e 'b walrus' 2> /dev/null || echo yes" \
  "yes\n" "" ""

testing "sed backref from empty s uses range regex" \
  "sed -e '/woot/s//eep \0 eep/'" \
  "eep woot eep" "" "woot"

testing "sed backref from empty s uses range regex with newline" \
  "sed -e '/woot/s//eep \0 eep/'" \
  "eep woot eep\n" "" "woot\n"

# -i with no filename

touch ./- # Detect gnu failure mode here.
testing "sed -i with no arg [GNUFAIL]" \
  "sed -e '' -i 2> /dev/null || echo yes" \
  "yes\n" "" ""
rm ./- # Clean up

testing "sed s/xxx/[/" \
  "sed -e 's/xxx/[/'" "[\n" "" "xxx\n"

# Disabled: ponder this a bit more, why "woo not found" from gnu version?
#testing "sed doesn't substitute in deleted line" \
#  "sed -e '/ook/d;s/ook//;t woo;a bang;'" "bang" "" "ook\n"

# Disabled: this makes both seds very unhappy. Why?
#testing "sed -g (exhaustive)" "sed -e 's/[[:space:]]*/,/g'" ",1,2,3,4,5," \
#  "" "12345"

# FAILCOUNT is not assigned anywhere in this file; presumably testing.sh
# maintains it as the number of failed tests.
exit $FAILCOUNT