diff options
author | Denis Vlasenko <vda.linux@googlemail.com> | 2007-11-13 17:13:31 +0000 |
---|---|---|
committer | Denis Vlasenko <vda.linux@googlemail.com> | 2007-11-13 17:13:31 +0000 |
commit | 72cc9641f80b6981cc97fd66feb8d5842ea5ed03 (patch) | |
tree | c8bb972fb90b451faae4dfe60cd3f33a77d40bff /editors | |
parent | 40276648ab31822068c3408ae43a5ecaafd03a5c (diff) | |
download | busybox-w32-72cc9641f80b6981cc97fd66feb8d5842ea5ed03.tar.gz busybox-w32-72cc9641f80b6981cc97fd66feb8d5842ea5ed03.tar.bz2 busybox-w32-72cc9641f80b6981cc97fd66feb8d5842ea5ed03.zip |
add sed mini-doc
Diffstat (limited to 'editors')
-rw-r--r-- | editors/sed1line.txt | 425 | ||||
-rw-r--r-- | editors/sed_summary.htm | 220 |
2 files changed, 645 insertions, 0 deletions
diff --git a/editors/sed1line.txt b/editors/sed1line.txt new file mode 100644 index 000000000..11a2e36be --- /dev/null +++ b/editors/sed1line.txt | |||
@@ -0,0 +1,425 @@ | |||
1 | http://www.student.northpark.edu/pemente/sed/sed1line.txt | ||
2 | ------------------------------------------------------------------------- | ||
3 | HANDY ONE-LINERS FOR SED (Unix stream editor) Apr. 26, 2004 | ||
4 | compiled by Eric Pement - pemente[at]northpark[dot]edu version 5.4 | ||
5 | Latest version of this file is usually at: | ||
6 | http://sed.sourceforge.net/sed1line.txt | ||
7 | http://www.student.northpark.edu/pemente/sed/sed1line.txt | ||
8 | This file is also available in Portuguese at: | ||
9 | http://www.lrv.ufsc.br/wmaker/sed_ptBR.html | ||
10 | |||
11 | FILE SPACING: | ||
12 | |||
13 | # double space a file | ||
14 | sed G | ||
15 | |||
16 | # double space a file which already has blank lines in it. Output file | ||
17 | # should contain no more than one blank line between lines of text. | ||
18 | sed '/^$/d;G' | ||
19 | |||
20 | # triple space a file | ||
21 | sed 'G;G' | ||
22 | |||
23 | # undo double-spacing (assumes even-numbered lines are always blank) | ||
24 | sed 'n;d' | ||
25 | |||
26 | # insert a blank line above every line which matches "regex" | ||
27 | sed '/regex/{x;p;x;}' | ||
28 | |||
29 | # insert a blank line below every line which matches "regex" | ||
30 | sed '/regex/G' | ||
31 | |||
32 | # insert a blank line above and below every line which matches "regex" | ||
33 | sed '/regex/{x;p;x;G;}' | ||
34 | |||
35 | NUMBERING: | ||
36 | |||
37 | # number each line of a file (simple left alignment). Using a tab (see | ||
38 | # note on '\t' at end of file) instead of space will preserve margins. | ||
39 | sed = filename | sed 'N;s/\n/\t/' | ||
40 | |||
41 | # number each line of a file (number on left, right-aligned) | ||
42 | sed = filename | sed 'N; s/^/ /; s/ *\(.\{6,\}\)\n/\1 /' | ||
43 | |||
44 | # number each line of file, but only print numbers if line is not blank | ||
45 | sed '/./=' filename | sed '/./N; s/\n/ /' | ||
46 | |||
47 | # count lines (emulates "wc -l") | ||
48 | sed -n '$=' | ||
49 | |||
50 | TEXT CONVERSION AND SUBSTITUTION: | ||
51 | |||
52 | # IN UNIX ENVIRONMENT: convert DOS newlines (CR/LF) to Unix format | ||
53 | sed 's/.$//' # assumes that all lines end with CR/LF | ||
54 | sed 's/^M$//' # in bash/tcsh, press Ctrl-V then Ctrl-M | ||
55 | sed 's/\x0D$//' # gsed 3.02.80, but top script is easier | ||
56 | |||
57 | # IN UNIX ENVIRONMENT: convert Unix newlines (LF) to DOS format | ||
58 | sed "s/$/`echo -e \\\r`/" # command line under ksh | ||
59 | sed 's/$'"/`echo \\\r`/" # command line under bash | ||
60 | sed "s/$/`echo \\\r`/" # command line under zsh | ||
61 | sed 's/$/\r/' # gsed 3.02.80 | ||
62 | |||
63 | # IN DOS ENVIRONMENT: convert Unix newlines (LF) to DOS format | ||
64 | sed "s/$//" # method 1 | ||
65 | sed -n p # method 2 | ||
66 | |||
67 | # IN DOS ENVIRONMENT: convert DOS newlines (CR/LF) to Unix format | ||
68 | # Can only be done with UnxUtils sed, version 4.0.7 or higher. | ||
69 | # Cannot be done with other DOS versions of sed. Use "tr" instead. | ||
70 | sed "s/\r//" infile >outfile # UnxUtils sed v4.0.7 or higher | ||
71 | tr -d \r <infile >outfile # GNU tr version 1.22 or higher | ||
72 | |||
73 | # delete leading whitespace (spaces, tabs) from front of each line | ||
74 | # aligns all text flush left | ||
75 | sed 's/^[ \t]*//' # see note on '\t' at end of file | ||
76 | |||
77 | # delete trailing whitespace (spaces, tabs) from end of each line | ||
78 | sed 's/[ \t]*$//' # see note on '\t' at end of file | ||
79 | |||
80 | # delete BOTH leading and trailing whitespace from each line | ||
81 | sed 's/^[ \t]*//;s/[ \t]*$//' | ||
82 | |||
83 | # insert 5 blank spaces at beginning of each line (make page offset) | ||
84 | sed 's/^/ /' | ||
85 | |||
86 | # align all text flush right on a 79-column width | ||
87 | sed -e :a -e 's/^.\{1,78\}$/ &/;ta' # set at 78 plus 1 space | ||
88 | |||
89 | # center all text in the middle of 79-column width. In method 1, | ||
90 | # spaces at the beginning of the line are significant, and trailing | ||
91 | # spaces are appended at the end of the line. In method 2, spaces at | ||
92 | # the beginning of the line are discarded in centering the line, and | ||
93 | # no trailing spaces appear at the end of lines. | ||
94 | sed -e :a -e 's/^.\{1,77\}$/ & /;ta' # method 1 | ||
95 | sed -e :a -e 's/^.\{1,77\}$/ &/;ta' -e 's/\( *\)\1/\1/' # method 2 | ||
96 | |||
97 | # substitute (find and replace) "foo" with "bar" on each line | ||
98 | sed 's/foo/bar/' # replaces only 1st instance in a line | ||
99 | sed 's/foo/bar/4' # replaces only 4th instance in a line | ||
100 | sed 's/foo/bar/g' # replaces ALL instances in a line | ||
101 | sed 's/\(.*\)foo\(.*foo\)/\1bar\2/' # replace the next-to-last case | ||
102 | sed 's/\(.*\)foo/\1bar/' # replace only the last case | ||
103 | |||
104 | # substitute "foo" with "bar" ONLY for lines which contain "baz" | ||
105 | sed '/baz/s/foo/bar/g' | ||
106 | |||
107 | # substitute "foo" with "bar" EXCEPT for lines which contain "baz" | ||
108 | sed '/baz/!s/foo/bar/g' | ||
109 | |||
110 | # change "scarlet" or "ruby" or "puce" to "red" | ||
111 | sed 's/scarlet/red/g;s/ruby/red/g;s/puce/red/g' # most seds | ||
112 | gsed 's/scarlet\|ruby\|puce/red/g' # GNU sed only | ||
113 | |||
114 | # reverse order of lines (emulates "tac") | ||
115 | # bug/feature in HHsed v1.5 causes blank lines to be deleted | ||
116 | sed '1!G;h;$!d' # method 1 | ||
117 | sed -n '1!G;h;$p' # method 2 | ||
118 | |||
119 | # reverse each character on the line (emulates "rev") | ||
120 | sed '/\n/!G;s/\(.\)\(.*\n\)/&\2\1/;//D;s/.//' | ||
121 | |||
122 | # join pairs of lines side-by-side (like "paste") | ||
123 | sed '$!N;s/\n/ /' | ||
124 | |||
125 | # if a line ends with a backslash, append the next line to it | ||
126 | sed -e :a -e '/\\$/N; s/\\\n//; ta' | ||
127 | |||
128 | # if a line begins with an equal sign, append it to the previous line | ||
129 | # and replace the "=" with a single space | ||
130 | sed -e :a -e '$!N;s/\n=/ /;ta' -e 'P;D' | ||
131 | |||
132 | # add commas to numeric strings, changing "1234567" to "1,234,567" | ||
133 | gsed ':a;s/\B[0-9]\{3\}\>/,&/;ta' # GNU sed | ||
134 | sed -e :a -e 's/\(.*[0-9]\)\([0-9]\{3\}\)/\1,\2/;ta' # other seds | ||
135 | |||
136 | # add commas to numbers with decimal points and minus signs (GNU sed) | ||
137 | gsed ':a;s/\(^\|[^0-9.]\)\([0-9]\+\)\([0-9]\{3\}\)/\1\2,\3/g;ta' | ||
138 | |||
139 | # add a blank line every 5 lines (after lines 5, 10, 15, 20, etc.) | ||
140 | gsed '0~5G' # GNU sed only | ||
141 | sed 'n;n;n;n;G;' # other seds | ||
142 | |||
143 | SELECTIVE PRINTING OF CERTAIN LINES: | ||
144 | |||
145 | # print first 10 lines of file (emulates behavior of "head") | ||
146 | sed 10q | ||
147 | |||
148 | # print first line of file (emulates "head -1") | ||
149 | sed q | ||
150 | |||
151 | # print the last 10 lines of a file (emulates "tail") | ||
152 | sed -e :a -e '$q;N;11,$D;ba' | ||
153 | |||
154 | # print the last 2 lines of a file (emulates "tail -2") | ||
155 | sed '$!N;$!D' | ||
156 | |||
157 | # print the last line of a file (emulates "tail -1") | ||
158 | sed '$!d' # method 1 | ||
159 | sed -n '$p' # method 2 | ||
160 | |||
161 | # print only lines which match regular expression (emulates "grep") | ||
162 | sed -n '/regexp/p' # method 1 | ||
163 | sed '/regexp/!d' # method 2 | ||
164 | |||
165 | # print only lines which do NOT match regexp (emulates "grep -v") | ||
166 | sed -n '/regexp/!p' # method 1, corresponds to above | ||
167 | sed '/regexp/d' # method 2, simpler syntax | ||
168 | |||
169 | # print the line immediately before a regexp, but not the line | ||
170 | # containing the regexp | ||
171 | sed -n '/regexp/{g;1!p;};h' | ||
172 | |||
173 | # print the line immediately after a regexp, but not the line | ||
174 | # containing the regexp | ||
175 | sed -n '/regexp/{n;p;}' | ||
176 | |||
177 | # print 1 line of context before and after regexp, with line number | ||
178 | # indicating where the regexp occurred (similar to "grep -A1 -B1") | ||
179 | sed -n -e '/regexp/{=;x;1!p;g;$!N;p;D;}' -e h | ||
180 | |||
181 | # grep for AAA and BBB and CCC (in any order) | ||
182 | sed '/AAA/!d; /BBB/!d; /CCC/!d' | ||
183 | |||
184 | # grep for AAA and BBB and CCC (in that order) | ||
185 | sed '/AAA.*BBB.*CCC/!d' | ||
186 | |||
187 | # grep for AAA or BBB or CCC (emulates "egrep") | ||
188 | sed -e '/AAA/b' -e '/BBB/b' -e '/CCC/b' -e d # most seds | ||
189 | gsed '/AAA\|BBB\|CCC/!d' # GNU sed only | ||
190 | |||
191 | # print paragraph if it contains AAA (blank lines separate paragraphs) | ||
192 | # HHsed v1.5 must insert a 'G;' after 'x;' in the next 3 scripts below | ||
193 | sed -e '/./{H;$!d;}' -e 'x;/AAA/!d;' | ||
194 | |||
195 | # print paragraph if it contains AAA and BBB and CCC (in any order) | ||
196 | sed -e '/./{H;$!d;}' -e 'x;/AAA/!d;/BBB/!d;/CCC/!d' | ||
197 | |||
198 | # print paragraph if it contains AAA or BBB or CCC | ||
199 | sed -e '/./{H;$!d;}' -e 'x;/AAA/b' -e '/BBB/b' -e '/CCC/b' -e d | ||
200 | gsed '/./{H;$!d;};x;/AAA\|BBB\|CCC/b;d' # GNU sed only | ||
201 | |||
202 | # print only lines of 65 characters or longer | ||
203 | sed -n '/^.\{65\}/p' | ||
204 | |||
205 | # print only lines of less than 65 characters | ||
206 | sed -n '/^.\{65\}/!p' # method 1, corresponds to above | ||
207 | sed '/^.\{65\}/d' # method 2, simpler syntax | ||
208 | |||
209 | # print section of file from regular expression to end of file | ||
210 | sed -n '/regexp/,$p' | ||
211 | |||
212 | # print section of file based on line numbers (lines 8-12, inclusive) | ||
213 | sed -n '8,12p' # method 1 | ||
214 | sed '8,12!d' # method 2 | ||
215 | |||
216 | # print line number 52 | ||
217 | sed -n '52p' # method 1 | ||
218 | sed '52!d' # method 2 | ||
219 | sed '52q;d' # method 3, efficient on large files | ||
220 | |||
221 | # beginning at line 3, print every 7th line | ||
222 | gsed -n '3~7p' # GNU sed only | ||
223 | sed -n '3,${p;n;n;n;n;n;n;}' # other seds | ||
224 | |||
225 | # print section of file between two regular expressions (inclusive) | ||
226 | sed -n '/Iowa/,/Montana/p' # case sensitive | ||
227 | |||
228 | SELECTIVE DELETION OF CERTAIN LINES: | ||
229 | |||
230 | # print all of file EXCEPT section between 2 regular expressions | ||
231 | sed '/Iowa/,/Montana/d' | ||
232 | |||
233 | # delete duplicate, consecutive lines from a file (emulates "uniq"). | ||
234 | # First line in a set of duplicate lines is kept, rest are deleted. | ||
235 | sed '$!N; /^\(.*\)\n\1$/!P; D' | ||
236 | |||
237 | # delete duplicate, nonconsecutive lines from a file. Beware not to | ||
238 | # overflow the buffer size of the hold space, or else use GNU sed. | ||
239 | sed -n 'G; s/\n/&&/; /^\([ -~]*\n\).*\n\1/d; s/\n//; h; P' | ||
240 | |||
241 | # delete all lines except duplicate lines (emulates "uniq -d"). | ||
242 | sed '$!N; s/^\(.*\)\n\1$/\1/; t; D' | ||
243 | |||
244 | # delete the first 10 lines of a file | ||
245 | sed '1,10d' | ||
246 | |||
247 | # delete the last line of a file | ||
248 | sed '$d' | ||
249 | |||
250 | # delete the last 2 lines of a file | ||
251 | sed 'N;$!P;$!D;$d' | ||
252 | |||
253 | # delete the last 10 lines of a file | ||
254 | sed -e :a -e '$d;N;2,10ba' -e 'P;D' # method 1 | ||
255 | sed -n -e :a -e '1,10!{P;N;D;};N;ba' # method 2 | ||
256 | |||
257 | # delete every 8th line | ||
258 | gsed '0~8d' # GNU sed only | ||
259 | sed 'n;n;n;n;n;n;n;d;' # other seds | ||
260 | |||
261 | # delete ALL blank lines from a file (same as "grep '.' ") | ||
262 | sed '/^$/d' # method 1 | ||
263 | sed '/./!d' # method 2 | ||
264 | |||
265 | # delete all CONSECUTIVE blank lines from file except the first; also | ||
266 | # deletes all blank lines from top and end of file (emulates "cat -s") | ||
267 | sed '/./,/^$/!d' # method 1, allows 0 blanks at top, 1 at EOF | ||
268 | sed '/^$/N;/\n$/D' # method 2, allows 1 blank at top, 0 at EOF | ||
269 | |||
270 | # delete all CONSECUTIVE blank lines from file except the first 2: | ||
271 | sed '/^$/N;/\n$/N;//D' | ||
272 | |||
273 | # delete all leading blank lines at top of file | ||
274 | sed '/./,$!d' | ||
275 | |||
276 | # delete all trailing blank lines at end of file | ||
277 | sed -e :a -e '/^\n*$/{$d;N;ba' -e '}' # works on all seds | ||
278 | sed -e :a -e '/^\n*$/N;/\n$/ba' # ditto, except for gsed 3.02* | ||
279 | |||
280 | # delete the last line of each paragraph | ||
281 | sed -n '/^$/{p;h;};/./{x;/./p;}' | ||
282 | |||
283 | SPECIAL APPLICATIONS: | ||
284 | |||
285 | # remove nroff overstrikes (char, backspace) from man pages. The 'echo' | ||
286 | # command may need an -e switch if you use Unix System V or bash shell. | ||
287 | sed "s/.`echo \\\b`//g" # double quotes required for Unix environment | ||
288 | sed 's/.^H//g' # in bash/tcsh, press Ctrl-V and then Ctrl-H | ||
289 | sed 's/.\x08//g' # hex expression for sed v1.5 | ||
290 | |||
291 | # get Usenet/e-mail message header | ||
292 | sed '/^$/q' # deletes everything after first blank line | ||
293 | |||
294 | # get Usenet/e-mail message body | ||
295 | sed '1,/^$/d' # deletes everything up to first blank line | ||
296 | |||
297 | # get Subject header, but remove initial "Subject: " portion | ||
298 | sed '/^Subject: */!d; s///;q' | ||
299 | |||
300 | # get return address header | ||
301 | sed '/^Reply-To:/q; /^From:/h; /./d;g;q' | ||
302 | |||
303 | # parse out the address proper. Pulls out the e-mail address by itself | ||
304 | # from the 1-line return address header (see preceding script) | ||
305 | sed 's/ *(.*)//; s/>.*//; s/.*[:<] *//' | ||
306 | |||
307 | # add a leading angle bracket and space to each line (quote a message) | ||
308 | sed 's/^/> /' | ||
309 | |||
310 | # delete leading angle bracket & space from each line (unquote a message) | ||
311 | sed 's/^> //' | ||
312 | |||
313 | # remove most HTML tags (accommodates multiple-line tags) | ||
314 | sed -e :a -e 's/<[^>]*>//g;/</N;//ba' | ||
315 | |||
316 | # extract multi-part uuencoded binaries, removing extraneous header | ||
317 | # info, so that only the uuencoded portion remains. Files passed to | ||
318 | # sed must be passed in the proper order. Version 1 can be entered | ||
319 | # from the command line; version 2 can be made into an executable | ||
320 | # Unix shell script. (Modified from a script by Rahul Dhesi.) | ||
321 | sed '/^end/,/^begin/d' file1 file2 ... fileX | uudecode # vers. 1 | ||
322 | sed '/^end/,/^begin/d' "$@" | uudecode # vers. 2 | ||
323 | |||
324 | # zip up each .TXT file individually, deleting the source file and | ||
325 | # setting the name of each .ZIP file to the basename of the .TXT file | ||
326 | # (under DOS: the "dir /b" switch returns bare filenames in all caps). | ||
327 | echo @echo off >zipup.bat | ||
328 | dir /b *.txt | sed "s/^\(.*\)\.TXT/pkzip -mo \1 \1.TXT/" >>zipup.bat | ||
329 | |||
330 | TYPICAL USE: Sed takes one or more editing commands and applies all of | ||
331 | them, in sequence, to each line of input. After all the commands have | ||
332 | been applied to the first input line, that line is output and a second | ||
333 | input line is taken for processing, and the cycle repeats. The | ||
334 | preceding examples assume that input comes from the standard input | ||
335 | device (i.e, the console, normally this will be piped input). One or | ||
336 | more filenames can be appended to the command line if the input does | ||
337 | not come from stdin. Output is sent to stdout (the screen). Thus: | ||
338 | |||
339 | cat filename | sed '10q' # uses piped input | ||
340 | sed '10q' filename # same effect, avoids a useless "cat" | ||
341 | sed '10q' filename > newfile # redirects output to disk | ||
342 | |||
343 | For additional syntax instructions, including the way to apply editing | ||
344 | commands from a disk file instead of the command line, consult "sed & | ||
345 | awk, 2nd Edition," by Dale Dougherty and Arnold Robbins (O'Reilly, | ||
346 | 1997; http://www.ora.com), "UNIX Text Processing," by Dale Dougherty | ||
347 | and Tim O'Reilly (Hayden Books, 1987) or the tutorials by Mike Arst | ||
348 | distributed in U-SEDIT2.ZIP (many sites). To fully exploit the power | ||
349 | of sed, one must understand "regular expressions." For this, see | ||
350 | "Mastering Regular Expressions" by Jeffrey Friedl (O'Reilly, 1997). | ||
351 | The manual ("man") pages on Unix systems may be helpful (try "man | ||
352 | sed", "man regexp", or the subsection on regular expressions in "man | ||
353 | ed"), but man pages are notoriously difficult. They are not written to | ||
354 | teach sed use or regexps to first-time users, but as a reference text | ||
355 | for those already acquainted with these tools. | ||
356 | |||
357 | QUOTING SYNTAX: The preceding examples use single quotes ('...') | ||
358 | instead of double quotes ("...") to enclose editing commands, since | ||
359 | sed is typically used on a Unix platform. Single quotes prevent the | ||
360 | Unix shell from intrepreting the dollar sign ($) and backquotes | ||
361 | (`...`), which are expanded by the shell if they are enclosed in | ||
362 | double quotes. Users of the "csh" shell and derivatives will also need | ||
363 | to quote the exclamation mark (!) with the backslash (i.e., \!) to | ||
364 | properly run the examples listed above, even within single quotes. | ||
365 | Versions of sed written for DOS invariably require double quotes | ||
366 | ("...") instead of single quotes to enclose editing commands. | ||
367 | |||
368 | USE OF '\t' IN SED SCRIPTS: For clarity in documentation, we have used | ||
369 | the expression '\t' to indicate a tab character (0x09) in the scripts. | ||
370 | However, most versions of sed do not recognize the '\t' abbreviation, | ||
371 | so when typing these scripts from the command line, you should press | ||
372 | the TAB key instead. '\t' is supported as a regular expression | ||
373 | metacharacter in awk, perl, and HHsed, sedmod, and GNU sed v3.02.80. | ||
374 | |||
375 | VERSIONS OF SED: Versions of sed do differ, and some slight syntax | ||
376 | variation is to be expected. In particular, most do not support the | ||
377 | use of labels (:name) or branch instructions (b,t) within editing | ||
378 | commands, except at the end of those commands. We have used the syntax | ||
379 | which will be portable to most users of sed, even though the popular | ||
380 | GNU versions of sed allow a more succinct syntax. When the reader sees | ||
381 | a fairly long command such as this: | ||
382 | |||
383 | sed -e '/AAA/b' -e '/BBB/b' -e '/CCC/b' -e d | ||
384 | |||
385 | it is heartening to know that GNU sed will let you reduce it to: | ||
386 | |||
387 | sed '/AAA/b;/BBB/b;/CCC/b;d' # or even | ||
388 | sed '/AAA\|BBB\|CCC/b;d' | ||
389 | |||
390 | In addition, remember that while many versions of sed accept a command | ||
391 | like "/one/ s/RE1/RE2/", some do NOT allow "/one/! s/RE1/RE2/", which | ||
392 | contains space before the 's'. Omit the space when typing the command. | ||
393 | |||
394 | OPTIMIZING FOR SPEED: If execution speed needs to be increased (due to | ||
395 | large input files or slow processors or hard disks), substitution will | ||
396 | be executed more quickly if the "find" expression is specified before | ||
397 | giving the "s/.../.../" instruction. Thus: | ||
398 | |||
399 | sed 's/foo/bar/g' filename # standard replace command | ||
400 | sed '/foo/ s/foo/bar/g' filename # executes more quickly | ||
401 | sed '/foo/ s//bar/g' filename # shorthand sed syntax | ||
402 | |||
403 | On line selection or deletion in which you only need to output lines | ||
404 | from the first part of the file, a "quit" command (q) in the script | ||
405 | will drastically reduce processing time for large files. Thus: | ||
406 | |||
407 | sed -n '45,50p' filename # print line nos. 45-50 of a file | ||
408 | sed -n '51q;45,50p' filename # same, but executes much faster | ||
409 | |||
410 | If you have any additional scripts to contribute or if you find errors | ||
411 | in this document, please send e-mail to the compiler. Indicate the | ||
412 | version of sed you used, the operating system it was compiled for, and | ||
413 | the nature of the problem. Various scripts in this file were written | ||
414 | or contributed by: | ||
415 | |||
416 | Al Aab <af137@freenet.toronto.on.ca> # "seders" list moderator | ||
417 | Edgar Allen <era@sky.net> # various | ||
418 | Yiorgos Adamopoulos <adamo@softlab.ece.ntua.gr> | ||
419 | Dale Dougherty <dale@songline.com> # author of "sed & awk" | ||
420 | Carlos Duarte <cdua@algos.inesc.pt> # author of "do it with sed" | ||
421 | Eric Pement <pemente@northpark.edu> # author of this document | ||
422 | Ken Pizzini <ken@halcyon.com> # author of GNU sed v3.02 | ||
423 | S.G. Ravenhall <stew.ravenhall@totalise.co.uk> # great de-html script | ||
424 | Greg Ubben <gsu@romulus.ncsc.mil> # many contributions & much help | ||
425 | ------------------------------------------------------------------------- | ||
diff --git a/editors/sed_summary.htm b/editors/sed_summary.htm new file mode 100644 index 000000000..4ac9b16f6 --- /dev/null +++ b/editors/sed_summary.htm | |||
@@ -0,0 +1,220 @@ | |||
1 | <html> | ||
2 | |||
3 | <head><title>Command Summary for sed (sed & awk, Second Edition)</title> | ||
4 | </head> | ||
5 | |||
6 | <body> | ||
7 | |||
8 | <h2>Command Summary for sed</h2> | ||
9 | |||
10 | <dl> | ||
11 | |||
12 | <dt><b>: </b> <b> :</b><em>label</em></dt> | ||
13 | <dd>Label a line in the script for the transfer of control by | ||
14 | <b>b</b> or <b>t</b>. | ||
15 | <em>label</em> may contain up to seven characters. | ||
16 | (The POSIX standard says that an implementation can allow longer | ||
17 | labels if it wishes to. GNU sed allows labels to be of any length.) | ||
18 | </p></dd> | ||
19 | |||
20 | |||
21 | <dt><b>=</b> [<em>address</em>]<b>=</b></dt> | ||
22 | <dd>Write to standard output the line number of addressed line.</p></dd> | ||
23 | |||
24 | |||
25 | <dt><b>a</b> [<em>address</em>]<b>a\</b></dt> | ||
26 | <dd><em>text</em></p> | ||
27 | |||
28 | <p>Append <em>text</em> | ||
29 | following each line matched by <em>address</em>. If | ||
30 | <em>text</em> goes over more than one line, newlines | ||
31 | must be "hidden" by preceding them with a backslash. The | ||
32 | <em>text</em> will be terminated by the first | ||
33 | newline that is not hidden in this way. The | ||
34 | <em>text</em> is not available in the pattern space | ||
35 | and subsequent commands cannot be applied to it. The results of this | ||
36 | command are sent to standard output when the list of editing commands | ||
37 | is finished, regardless of what happens to the current line in the | ||
38 | pattern space.</p></dd> | ||
39 | |||
40 | |||
41 | <dt><b>b</b> [<em>address1</em>[,<em>address2</em>]]<b>b</b>[<em>label</em>]</dt> | ||
42 | <dd>Transfer control unconditionally (branch) to | ||
43 | <b>:</b><em>label</em> elsewhere in | ||
44 | script. That is, the command following the | ||
45 | <em>label</em> is the next command applied to the | ||
46 | current line. If no <em>label</em> is specified, | ||
47 | control falls through to the end of the script, so no more commands | ||
48 | are applied to the current line.</p></dd> | ||
49 | |||
50 | |||
51 | <dt><b>c</b> [<em>address1</em>[,<em>address2</em>]]<b>c\</b></dt> | ||
52 | <dd><em>text</em></p> | ||
53 | |||
54 | <p>Replace (change) the lines selected by the address with | ||
55 | <em>text</em>. When a range of lines is specified, | ||
56 | all lines as a group are replaced by a single copy of | ||
57 | <em>text</em>. The newline following each line of | ||
58 | <em>text</em> must be escaped by a backslash, except | ||
59 | the last line. The contents of the pattern space are, in effect, | ||
60 | deleted and no subsequent editing commands can be applied to it (or to | ||
61 | <em>text</em>).</p></dd> | ||
62 | |||
63 | |||
64 | <dt><b>d</b> [<em>address1</em>[,<em>address2</em>]]<b>d</b></dt> | ||
65 | <dd>Delete line(s) from pattern space. Thus, the line is not passed to standard | ||
66 | output. A new line of input is read and editing resumes with first | ||
67 | command in script.</p></dd> | ||
68 | |||
69 | |||
70 | <dt><b>D</b> [<em>address1</em>[,<em>address2</em>]]<b>D</b></dt> | ||
71 | <dd>Delete first part (up to embedded newline) of multiline pattern space created | ||
72 | by <b>N</b> command and resume editing with first command in | ||
73 | script. If this command empties the pattern space, then a new line | ||
74 | of input is read, as if the <b>d</b> command had been executed.</p></dd> | ||
75 | |||
76 | |||
77 | <dt><b>g</b> [<em>address1</em>[,<em>address2</em>]]<b>g</b></dt> | ||
78 | <dd>Copy (get) contents of hold space (see <b>h</b> or | ||
79 | <b>H</b> command) into the pattern space, wiping out | ||
80 | previous contents.</p></dd> | ||
81 | |||
82 | |||
83 | <dt><b>G</b> [<em>address1</em>[,<em>address2</em>]]<b>G</b></dt> | ||
84 | <dd>Append newline followed by contents of hold space (see | ||
85 | <b>h</b> or <b>H</b> command) to contents of | ||
86 | the pattern space. If hold space is empty, a newline is still | ||
87 | appended to the pattern space.</p></dd> | ||
88 | |||
89 | |||
90 | <dt><b>h</b> [<em>address1</em>[,<em>address2</em>]]<b>h</b></dt> | ||
91 | <dd>Copy pattern space into hold space, a special temporary buffer. | ||
92 | Previous contents of hold space are wiped out.</p></dd> | ||
93 | |||
94 | |||
95 | <dt><b>H</b> [<em>address1</em>[,<em>address2</em>]]<b>H</b></dt> | ||
96 | <dd>Append newline and contents of pattern space to contents of the hold | ||
97 | space. Even if hold space is empty, this command still appends the | ||
98 | newline first.</p></dd> | ||
99 | |||
100 | |||
101 | <dt><b>i</b> [<em>address1</em>]<b>i\</b></dt> | ||
102 | <dd><em>text</em></p> | ||
103 | |||
104 | <p>Insert <em>text</em> before each line matched by | ||
105 | <em>address</em>. (See <b>a</b> for | ||
106 | details on <em>text</em>.)</p></dd> | ||
107 | |||
108 | |||
109 | <dt><b>l</b> [<em>address1</em>[,<em>address2</em>]]<b>l</b></dt> | ||
110 | <dd>List the contents of the pattern space, showing nonprinting characters | ||
111 | as ASCII codes. Long lines are wrapped.</p></dd> | ||
112 | |||
113 | |||
114 | <dt><b>n</b> [<em>address1</em>[,<em>address2</em>]]<b>n</b></dt> | ||
115 | <dd>Read next line of input into pattern space. Current line is sent to | ||
116 | standard output. New line becomes current line and increments line | ||
117 | counter. Control passes to command following <b>n</b> | ||
118 | instead of resuming at the top of the script.</p></dd> | ||
119 | |||
120 | |||
121 | <dt><b>N</b> [<em>address1</em>[,<em>address2</em>]]<b>N</b></dt> | ||
122 | <dd>Append next input line to contents of pattern space; the new line is | ||
123 | separated from the previous contents of the pattern space by a newline. | ||
124 | (This command is designed to allow pattern matches across two | ||
125 | lines. Using \n to match the embedded newline, you can match | ||
126 | patterns across multiple lines.)</p></dd> | ||
127 | |||
128 | |||
129 | <dt><b>p</b> [<em>address1</em>[,<em>address2</em>]]<b>p</b></dt> | ||
130 | <dd>Print the addressed line(s). Note that this can result in duplicate | ||
131 | output unless default output is suppressed by using "#n" or | ||
132 | the <span class="option">-n</span> | ||
133 | |||
134 | command-line option. Typically used before commands that change flow | ||
135 | control (<b>d</b>, <b>n</b>, | ||
136 | <b>b</b>) and might prevent the current line from being | ||
137 | output.</p></dd> | ||
138 | |||
139 | |||
140 | <dt><b>P</b> [<em>address1</em>[,<em>address2</em>]]<b>P</b></dt> | ||
141 | <dd>Print first part (up to embedded newline) of multiline pattern space | ||
142 | created by <b>N</b> command. Same as <b>p</b> | ||
143 | if <b>N</b> has not been applied to a line.</p></dd> | ||
144 | |||
145 | |||
146 | <dt><b>q</b> [<em>address</em>]<b>q</b></dt> | ||
147 | <dd>Quit when <em>address</em> is encountered. The | ||
148 | addressed line is first written to output (if default output is not | ||
149 | suppressed), along with any text appended to it by previous | ||
150 | <b>a</b> or <b>r</b> commands.</p></dd> | ||
151 | |||
152 | |||
153 | <dt><b>r</b> [<em>address</em>]<b>r</b> <em>file</em></dt> | ||
154 | <dd>Read contents of <em>file</em> and append after the | ||
155 | contents of the pattern space. Exactly one space must be put between | ||
156 | <b>r</b> and the filename.</p></dd> | ||
157 | |||
158 | |||
159 | <dt><b>s</b> [<em>address1</em>[,<em>address2</em>]]<b>s</b>/<em>pattern</em>/<em>replacement</em>/[<em>flags</em>]</dt> | ||
160 | <dd>Substitute <em>replacement</em> for | ||
161 | <em>pattern</em> on each addressed line. If pattern | ||
162 | addresses are used, the pattern <b>//</b> represents the | ||
163 | last pattern address specified. The following flags can be specified:</p> | ||
164 | |||
165 | <dl> | ||
166 | |||
167 | <dt><b>n</b></dt> | ||
168 | <dd>Replace <em>n</em>th instance of | ||
169 | /<em>pattern</em>/ on each addressed line. | ||
170 | <em>n</em> is any number in the range 1 to 512, and | ||
171 | the default is 1.</p></dd> | ||
172 | |||
173 | <dt><b>g</b></dt> | ||
174 | <dd>Replace all instances of /<em>pattern</em>/ on each | ||
175 | addressed line, not just the first instance.</p></dd> | ||
176 | |||
177 | <dt><b>p</b></dt> | ||
178 | <dd>Print the line if a successful substitution is done. If several | ||
179 | successful substitutions are done, multiple copies of the line will be | ||
180 | printed.</p></dd> | ||
181 | |||
182 | <dt><b>w</b> <em>file</em></dt> | ||
183 | <dd>Write the line to <em>file</em> if a replacement | ||
184 | was done. A maximum of 10 different <em>files</em> can be opened.</p></dd> | ||
185 | |||
186 | </dl> | ||
187 | |||
188 | </dd> | ||
189 | |||
190 | |||
191 | <dt><b>t</b> [<em>address1</em>[,<em>address2</em>]]<b>t </b>[<em>label</em>]</dt> | ||
192 | <dd>Test if successful substitutions have been made on addressed lines, | ||
193 | and if so, branch to line marked by :<em>label</em>. | ||
194 | (See <b>b</b> and <b>:</b>.) If label is not | ||
195 | specified, control falls through to bottom of script.</p></dd> | ||
196 | |||
197 | |||
198 | <dt><b>w</b> [<em>address1</em>[,<em>address2</em>]]<b>w</b> <em>file</em></dt> | ||
199 | <dd>Append contents of pattern space to <em>file</em>. | ||
200 | This action occurs when the command is encountered rather than when | ||
201 | the pattern space is output. Exactly one space must separate the | ||
202 | <b>w</b> and the filename. A maximum of 10 different | ||
203 | files can be opened in a script. This command will create the file if | ||
204 | it does not exist; if the file exists, its contents will be | ||
205 | overwritten each time the script is executed. Multiple write commands | ||
206 | that direct output to the same file append to the end of the file.</p></dd> | ||
207 | |||
208 | |||
209 | <dt><b>x</b> [<em>address1</em>[,<em>address2</em>]]<b>x</b></dt> | ||
210 | <dd>Exchange contents of the pattern space with the contents of the hold | ||
211 | space.</p></dd> | ||
212 | |||
213 | |||
214 | <dt><b>y</b> [<em>address1</em>[,<em>address2</em>]]<b>y</b>/<em>abc</em>/<em>xyz</em>/</dt> | ||
215 | <dd>Transform each character by position in string | ||
216 | <em>abc</em> to its equivalent in string | ||
217 | <em>xyz</em>.</p></dd> | ||
218 | |||
219 | |||
220 | </dl> | ||