#!/bin/sh

# SUSv3 compliant sed tests.
# Copyright 2005 by Rob Landley <rob@landley.net>
# Licensed under GPLv2, see file LICENSE in this source tree.

# Load the test harness; every "testing" call in this script relies on it.
. ./testing.sh

# testing "description" "commands" "result" "infile" "stdin"

# Corner cases: implicit stdin, explicit stdin ("-"), an empty input line,
# and stdin named twice on the command line.
testing "sed no files (stdin)" 'sed ""' "hello\n" "" "hello\n"
testing "sed explicit stdin" 'sed "" -' "hello\n" "" "hello\n"
testing "sed handles empty lines" "sed -e 's/\$/@/'" "@\n" "" "\n"
testing "sed stdin twice" 'sed "" - -' "hello" "" "hello"

# Trailing EOF.
# Match $, at end of each file or all files?

# -e corner cases
# without -e
# multiple -e
# interact with a
# -eee arg1 arg2 arg3
# -f corner cases
# -e -f -e
# -n corner cases
# no newline at EOF?
# -r corner cases
# Just make sure it works.
# -i corner cases:
# sed -i -
# permissions
# -i on a symlink
# on a directory
# With $ last-line test
# Continue with \
# End of script with trailing \

# command list
# Checks how commands may be separated: a blank between address and command,
# a script spread over several lines, and a script split across several -e.
testing "sed accepts blanks before command" "sed -e '1 d'" "" "" ""
testing "sed accepts newlines in -e" "sed -e 'i\
1
a\
3'" "1\n2\n3\n" "" "2\n"
testing "sed accepts multiple -e" "sed -e 'i\' -e '1' -e 'a\' -e '3'" \
  "1\n2\n3\n" "" "2\n"

# substitutions
# Covers -n, the p flag, chained s commands, unusual delimiters and \t.
testing "sed -n" "sed -n -e s/foo/bar/ -e s/bar/baz/" "" "" "foo\n"
testing "sed s//p" "sed -e s/foo/bar/p -e s/bar/baz/p" "bar\nbaz\nbaz\n" \
  "" "foo\n"
testing "sed -n s//p" "sed -ne s/abc/def/p" "def\n" "" "abc\n"
# This test runs only when SKIP_KNOWN_BUGS is unset or empty.
test x"$SKIP_KNOWN_BUGS" = x"" && {
testing "sed s//g (exhaustive)" "sed -e 's/[[:space:]]*/,/g'" ",1,2,3,4,5,\n" \
  "" "12345\n"
}
testing "sed s arbitrary delimiter" "sed -e 's woo boing '" "boing\n" "" "woo\n"
testing "sed s chains" "sed -e s/foo/bar/ -e s/bar/baz/" "baz\n" "" "foo\n"
testing "sed s chains2" "sed -e s/foo/bar/ -e s/baz/nee/" "bar\n" "" "foo\n"
testing "sed s [delimiter]" "sed -e 's@[@]@@'" "onetwo" "" "one@two"
testing "sed s with \\t (GNU ext)" "sed 's/\t/ /'" "one two" "" "one\ttwo"

# branch
# "b" with a label jumps over the p; "b" without a label skips the rest.
testing "sed b (branch)" "sed -e 'b one;p;: one'" "foo\n" "" "foo\n"
testing "sed b (branch with no label jumps to end)" "sed -e 'b;p'" \
  "foo\n" "" "foo\n"

# test and branch
# "t" branches after a successful substitution, "T" after an unsuccessful one.
testing "sed t (test/branch)" "sed -e 's/a/1/;t one;p;: one;p'" \
  "1\n1\nb\nb\nb\nc\nc\nc\n" "" "a\nb\nc\n"
testing "sed t (test/branch clears test bit)" "sed -e 's/a/b/;:loop;t loop'" \
  "b\nb\nc\n" "" "a\nb\nc\n"
testing "sed T (!test/branch)" "sed -e 's/a/1/;T notone;p;: notone;p'" \
  "1\n1\n1\nb\nb\nc\nc\n" "" "a\nb\nc\n"

# The "n" test below runs only when SKIP_KNOWN_BUGS is unset or empty.
test x"$SKIP_KNOWN_BUGS" = x"" && {
# Normal sed end-of-script doesn't print "c" because n flushed the pattern
# space. If n hits EOF, pattern space is empty when script ends.
# Query: how does this interact with no newline at EOF?
testing "sed n (flushes pattern space, terminates early)" "sed -e 'n;p'" \
  "a\nb\nb\nc\n" "" "a\nb\nc\n"
}
# non-GNU sed: N does _not_ flush pattern space, therefore c is eaten @ script end
# GNU sed: N flushes pattern space, therefore c is printed too @ script end
testing "sed N (flushes pattern space (GNU behavior))" "sed -e 'N;p'" \
  "a\nb\na\nb\nc\n" "" "a\nb\nc\n"

testing "sed N test2" "sed ':a;N;s/\n/ /;ta'" \
  "a b c\n" "" "a\nb\nc\n"

testing "sed N test3" "sed 'N;s/\n/ /'" \
  "a b\nc\n" "" "a\nb\nc\n"

testing "sed address match newline" 'sed "/b/N;/b\\nc/i woo"' \
  "a\nwoo\nb\nc\nd\n" "" "a\nb\nc\nd\n"

# Multiple lines in pattern space
testing "sed N (stops at end of input) and P (prints to first newline only)" \
  "sed -n 'N;P;p'" "a\na\nb\n" "" "a\nb\nc\n"

# Hold space
testing "sed G (append hold space to pattern space)" 'sed G' "a\n\nb\n\nc\n\n" \
  "" "a\nb\nc\n"
# Placeholders for tests that have not been written yet.
#testing "sed g/G (swap/append hold and pattern space)"
#testing "sed g (swap hold/pattern space)"

# "d" must stop the current cycle: commands after it are not run for the
# deleted line.
testing "sed d ends script iteration" \
  "sed -e '/ook/d;s/ook/ping/p;i woot'" "" "" "ook\n"
testing "sed d ends script iteration (2)" \
  "sed -e '/ook/d;a\' -e 'bang'" "woot\nbang\n" "" "ook\nwoot\n"

# Multiple files, with varying newlines and NUL bytes
# The two guarded groups run only when SKIP_KNOWN_BUGS is unset or empty.
test x"$SKIP_KNOWN_BUGS" = x"" && {
testing "sed embedded NUL" "sed -e 's/woo/bang/'" "\0bang\0woo\0" "" \
  "\0woo\0woo\0"
}
testing "sed embedded NUL g" "sed -e 's/woo/bang/g'" "bang\0bang\0" "" \
  "woo\0woo\0"
test x"$SKIP_KNOWN_BUGS" = x"" && {
# Build a script file holding a NUL byte, run it with -f, then remove it.
# ECHO is not assigned in this script; presumably testing.sh provides it.
$ECHO -e "/woo/a he\0llo" > sed.commands
testing "sed NUL in command" "sed -f sed.commands" "woo\nhe\0llo\n" "" "woo"
rm sed.commands
}

# sed has funky behavior with newlines at the end of file. Test lots of
# corner cases with the optional newline appending behavior.
# Most commands read the file "input" (the 4th testing argument) followed
# by stdin (the 5th argument, named as "-").

testing "sed normal newlines" "sed -e 's/woo/bang/' input -" "bang\nbang\n" \
  "woo\n" "woo\n"
testing "sed leave off trailing newline" "sed -e 's/woo/bang/' input -" \
  "bang\nbang" "woo\n" "woo"
testing "sed autoinsert newline" "sed -e 's/woo/bang/' input -" "bang\nbang" \
  "woo" "woo"
testing "sed empty file plus cat" "sed -e 's/nohit//' input -" "one\ntwo" \
  "" "one\ntwo"
testing "sed cat plus empty file" "sed -e 's/nohit//' input -" "one\ntwo" \
  "one\ntwo" ""
# Runs only when SKIP_KNOWN_BUGS is unset or empty.
test x"$SKIP_KNOWN_BUGS" = x"" && {
testing "sed append autoinserts newline" "sed -e '/woot/a woo' -" \
  "woot\nwoo\n" "" "woot"
}
testing "sed insert doesn't autoinsert newline" "sed -e '/woot/i woo' -" \
  "woo\nwoot" "" "woot"
testing "sed print autoinsert newlines" "sed -e 'p' -" "one\none" "" "one"
testing "sed print autoinsert newlines two files" "sed -e 'p' input -" \
  "one\none\ntwo\ntwo" "one" "two"
testing "sed noprint, no match, no newline" "sed -ne 's/woo/bang/' input" \
  "" "no\n" ""
testing "sed selective matches with one nl" "sed -ne 's/woo/bang/p' input -" \
  "a bang\nc bang\n" "a woo\nb no" "c woo\nd no"
testing "sed selective matches insert newline" \
  "sed -ne 's/woo/bang/p' input -" "a bang\nb bang\nd bang" \
  "a woo\nb woo" "c no\nd woo"
testing "sed selective matches noinsert newline" \
  "sed -ne 's/woo/bang/p' input -" "a bang\nb bang" "a woo\nb woo" \
  "c no\nd no"
# Runs only when SKIP_KNOWN_BUGS is unset or empty.
test x"$SKIP_KNOWN_BUGS" = x"" && {
testing "sed clusternewline" \
  "sed -e '/one/a 111' -e '/two/i 222' -e p input -" \
  "one\none\n111\n222\ntwo\ntwo" "one" "two"
}
testing "sed subst+write" \
  "sed -e 's/i/z/' -e 'woutputw' input -; $ECHO -n X; cat outputw" \
  "thzngy\nagaznXthzngy\nagazn" "thingy" "again"
# outputw is produced by the "w" command in the test above; -f keeps the
# cleanup silent if that command never created the file.
rm -f outputw
testing "sed trailing NUL" \
  "sed 's/i/z/' input -" \
  "a\0b\0\nc" "a\0b\0" "c"
testing "sed escaped newline in command" \
  "sed 's/a/z\\
z/' input" \
  "z\nz" "a" ""

# Test end-of-file matching behavior
# The '"'...'"' sequences switch to single quotes so the shell does not
# expand $p / $i as variables.

testing "sed match EOF" "sed -e '"'$p'"'" "hello\nthere\nthere" "" \
  "hello\nthere"
testing "sed match EOF two files" "sed -e '"'$p'"' input -" \
  "one\ntwo\nthree\nfour\nfour" "one\ntwo" "three\nfour"
# sed match EOF inline: gnu sed 4.1.5 outputs this:
#00000000 6f 6e 65 0a 6f 6f 6b 0a 6f 6f 6b 0a 74 77 6f 0a |one.ook.ook.two.|
#00000010 0a 74 68 72 65 65 0a 6f 6f 6b 0a 6f 6f 6b 0a 66 |.three.ook.ook.f|
#00000020 6f 75 72 |our|
# which looks buggy to me.
# Second file for the in-place test; it has no trailing newline.
$ECHO -ne "three\nfour" > input2
testing "sed match EOF inline" \
  "sed -e '"'$i ook'"' -i input input2 && cat input input2" \
  "one\nook\ntwothree\nook\nfour" "one\ntwo" ""
rm input2

# Test lie-to-autoconf
# The --version output must contain the string "GNU sed version ".

testing "sed lie-to-autoconf" "sed --version | grep -o 'GNU sed version '" \
  "GNU sed version \n" "" ""

# Jump to nonexistent label
# Runs only when SKIP_KNOWN_BUGS is unset or empty.
test x"$SKIP_KNOWN_BUGS" = x"" && {
# Incompatibility: illegal jump is not detected if input is ""
# (that is, no lines at all). GNU sed 4.1.5 complains even in this case
testing "sed nonexistent label" "sed -e 'b walrus' 2>/dev/null || echo yes" \
  "yes\n" "" ""
}

# An empty regex in s// reuses the address regex; \0 refers to its match.
testing "sed backref from empty s uses range regex" \
  "sed -e '/woot/s//eep \0 eep/'" "eep woot eep" "" "woot"

testing "sed backref from empty s uses range regex with newline" \
  "sed -e '/woot/s//eep \0 eep/'" "eep woot eep\n" "" "woot\n"

# -i with no filename

touch ./- # Detect gnu failure mode here.
testing "sed -i with no arg [GNUFAIL]" "sed -e '' -i 2> /dev/null || echo yes" \
  "yes\n" "" ""
rm ./- # Clean up

testing "sed s/xxx/[/" "sed -e 's/xxx/[/'" "[\n" "" "xxx\n"

# Ponder this a bit more, why "woo not found" from gnu version?
#testing "sed doesn't substitute in deleted line" \
# "sed -e '/ook/d;s/ook//;t woo;a bang;'" "bang" "" "ook\n"

# This makes both seds very unhappy. Why?
#testing "sed -g (exhaustive)" "sed -e 's/[[:space:]]*/,/g'" ",1,2,3,4,5," \
# "" "12345"

# testing "description" "commands" "result" "infile" "stdin"

testing "sed n command must reset 'substituted' bit" \
  "sed 's/1/x/;T;n;: next;s/3/y/;t quit;n;b next;: quit;q'" \
  "0\nx\n2\ny\n" "" "0\n1\n2\n3\n"

# Deleting lines with "d" must not disturb range addresses that follow it.
testing "sed d does not break n,m matching" \
  "sed -n '1d;1,3p'" \
  "second\nthird\n" "" "first\nsecond\nthird\nfourth\n"

testing "sed d does not break n,regex matching" \
  "sed -n '1d;1,/hir/p'" \
  "second\nthird\n" "" "first\nsecond\nthird\nfourth\n"

testing "sed d does not break n,regex matching #2" \
  "sed -n '1,5d;1,/hir/p'" \
  "second2\nthird2\n" "" \
  "first\nsecond\nthird\nfourth\n""first2\nsecond2\nthird2\nfourth2\n"

testing "sed 2d;2,1p (gnu compat)" \
  "sed -n '2d;2,1p'" \
  "third\n" "" \
  "first\nsecond\nthird\nfourth\n"

# Regex means: "match / at BOL or nothing, then one or more not-slashes".
# The bug was that second slash in /usr/lib was treated as "at BOL" too.
testing "sed beginning (^) matches only once" \
  "sed 's,\(^/\|\)[^/][^/]*,>\0<,g'" \
  ">/usr</>lib<\n" "" \
  "/usr/lib\n"

# "c" with the text given directly after the command letter.
testing "sed c" \
  "sed 'crepl'" \
  "repl\nrepl\n" "" \
  "first\nsecond\n"

# A { } group nested inside another group; "q" stops after the first match.
testing "sed nested {}s" \
  "sed '/asd/ { p; /s/ { s/s/c/ }; p; q }'" \
  "qwe\nasd\nacd\nacd\n" "" \
  "qwe\nasd\nzxc\n"

# Appended text that itself ends in a backslash: the script doubles the
# backslash so it is not taken as a continuation of the "a" text.
# NOTE(review): the blank at the start of each continued line inside the
# quoted strings is part of the data seen by sed; confirm the exact
# whitespace (space vs. tab) against the upstream copy of this test.
testing "sed a cmd ended by double backslash" \
  "sed -e '/| one /a \\
 | three \\\\' -e '/| one-/a \\
 | three-* \\\\'" \
' | one \\
 | three \\
 | two \\
' '' \
' | one \\
 | two \\
'

# first three lines are deleted; 4th line is matched and printed by "2,3" and by "4" ranges
testing "sed with N skipping lines past ranges on next cmds" \
  "sed -n '1{N;N;d};1p;2,3p;3p;4p'" \
  "4\n4\n" "" "1\n2\n3\n4\n"

# The command copies "input" to input2 itself and removes it afterwards.
testing "sed -i with address modifies all files, not only first" \
  "cp input input2; sed -i -e '1s/foo/bar/' input input2 && cat input input2; rm input2" \
  "bar\nbar\n" "foo\n" ""

testing "sed understands \r" \
  "sed 's/r/\r/'" \
  "\rrr\n" "" "rrr\n"

# \$? is escaped so that it is expanded when the command runs, not here.
testing "sed -i finishes ranges correctly" \
  "sed '1,2d' -i input; echo \$?; cat input" \
  "0\n3\n4\n" "1\n2\n3\n4\n" ""

# testing "description" "commands" "result" "infile" "stdin"

# FAILCOUNT is not assigned in this script; presumably the harness sets it.
exit $FAILCOUNT