blob: 0e7306377d540e761ae21cd6657bfaae892209a8 [file] [log] [blame]
/* vi: set sw=4 ts=4: */
/* fold -- wrap each input line to fit in specified width.

   Written by David MacKenzie, djm@gnu.ai.mit.edu.
   Copyright (C) 91, 1995-2002 Free Software Foundation, Inc.

   Modified for busybox based on coreutils v 5.0
   Copyright (C) 2003 Glenn McGrath

   Licensed under GPLv2 or later, see file LICENSE in this source tree.
*/
Pere Orga34425382011-03-31 14:43:25 +020012
//usage:#define fold_trivial_usage
//usage: "[-bs] [-w WIDTH] [FILE]..."
//usage:#define fold_full_usage "\n\n"
//usage: "Wrap input lines in each FILE (or stdin), writing to stdout\n"
//usage: "\n -b Count bytes rather than columns"
//usage: "\n -s Break at spaces"
//usage: "\n -w Use WIDTH columns instead of 80"
20
Denis Vlasenkob6adbf12007-05-26 19:00:18 +000021#include "libbb.h"
Denys Vlasenko28055022010-01-04 20:49:58 +010022#include "unicode.h"
Glenn L McGrathf01b8052003-04-27 06:02:14 +000023
/* This is a NOEXEC applet. Be very careful! */
25
/* Option bits tested against option_mask32.
 * Must match the getopt32 call in fold_main(): the option string there
 * is "bsw:", so bit 0 is -b, bit 1 is -s and bit 2 is -w. */
#define FLAG_COUNT_BYTES  (1 << 0)  /* -b */
#define FLAG_BREAK_SPACES (1 << 1)  /* -s */
#define FLAG_WIDTH        (1 << 2)  /* -w */
Glenn L McGrathf01b8052003-04-27 06:02:14 +000030
31/* Assuming the current column is COLUMN, return the column that
32 printing C will move the cursor to.
33 The first column is 0. */
Denys Vlasenko28055022010-01-04 20:49:58 +010034static int adjust_column(unsigned column, char c)
Glenn L McGrathf01b8052003-04-27 06:02:14 +000035{
Denys Vlasenko28055022010-01-04 20:49:58 +010036 if (option_mask32 & FLAG_COUNT_BYTES)
37 return ++column;
38
39 if (c == '\t')
40 return column + 8 - column % 8;
41
42 if (c == '\b') {
43 if ((int)--column < 0)
Glenn L McGrathf01b8052003-04-27 06:02:14 +000044 column = 0;
Denys Vlasenko28055022010-01-04 20:49:58 +010045 }
46 else if (c == '\r')
47 column = 0;
48 else { /* just a printable char */
49 if (unicode_status != UNICODE_ON /* every byte is a new char */
50 || (c & 0xc0) != 0x80 /* it isn't a 2nd+ byte of a Unicode char */
51 ) {
Glenn L McGrathf01b8052003-04-27 06:02:14 +000052 column++;
Denys Vlasenko28055022010-01-04 20:49:58 +010053 }
54 }
Glenn L McGrathf01b8052003-04-27 06:02:14 +000055 return column;
56}
57
/* Write exactly SIZE bytes starting at BUF to stdout.
 * Note that this function can write NULs, unlike fputs etc.,
 * because the length is passed explicitly instead of being derived
 * from a terminator. The fwrite result is not checked here. */
static void write2stdout(const void *buf, unsigned size)
{
	fwrite(buf, 1, size, stdout);
}
63
Denis Vlasenko9b49a5e2007-10-11 10:05:36 +000064int fold_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
Denys Vlasenkoded688c2009-11-04 15:31:19 +010065int fold_main(int argc UNUSED_PARAM, char **argv)
Glenn L McGrathf01b8052003-04-27 06:02:14 +000066{
Denis Vlasenko931de892007-06-21 12:43:45 +000067 char *line_out = NULL;
Denys Vlasenko28055022010-01-04 20:49:58 +010068 const char *w_opt = "80";
69 unsigned width;
70 smallint exitcode = EXIT_SUCCESS;
71
72 init_unicode();
Glenn L McGrathf01b8052003-04-27 06:02:14 +000073
Denis Vlasenko08492072006-12-22 13:56:36 +000074 if (ENABLE_INCLUDE_SUSv2) {
Rob Landleyf8fd4db2006-01-30 01:30:39 +000075 /* Turn any numeric options into -w options. */
Denys Vlasenko28055022010-01-04 20:49:58 +010076 int i;
Denys Vlasenkoded688c2009-11-04 15:31:19 +010077 for (i = 1; argv[i]; i++) {
Denys Vlasenko28055022010-01-04 20:49:58 +010078 const char *a = argv[i];
79 if (*a == '-') {
80 a++;
Denis Vlasenko62a90cd2008-03-17 09:07:36 +000081 if (*a == '-' && !a[1]) /* "--" */
Rob Landleyf8fd4db2006-01-30 01:30:39 +000082 break;
Denis Vlasenko62a90cd2008-03-17 09:07:36 +000083 if (isdigit(*a))
Rob Landleyd921b2e2006-08-03 15:41:12 +000084 argv[i] = xasprintf("-w%s", a);
Glenn L McGrathf01b8052003-04-27 06:02:14 +000085 }
86 }
87 }
88
Denis Vlasenko62a90cd2008-03-17 09:07:36 +000089 getopt32(argv, "bsw:", &w_opt);
Denys Vlasenko28055022010-01-04 20:49:58 +010090 width = xatou_range(w_opt, 1, 10000);
Glenn L McGrathf01b8052003-04-27 06:02:14 +000091
92 argv += optind;
Denis Vlasenko62a90cd2008-03-17 09:07:36 +000093 if (!*argv)
Denis Vlasenkoa41fdf32007-01-29 22:51:00 +000094 *--argv = (char*)"-";
Glenn L McGrathf01b8052003-04-27 06:02:14 +000095
96 do {
Denis Vlasenkoddec5af2006-10-26 23:25:17 +000097 FILE *istream = fopen_or_warn_stdin(*argv);
Bernhard Reutner-Fischer4bf31272006-01-30 17:41:06 +000098 int c;
Denys Vlasenko28055022010-01-04 20:49:58 +010099 unsigned column = 0; /* Screen column where next char will go */
100 unsigned offset_out = 0; /* Index in 'line_out' for next char */
Glenn L McGrathf01b8052003-04-27 06:02:14 +0000101
Bernhard Reutner-Fischer4bf31272006-01-30 17:41:06 +0000102 if (istream == NULL) {
Denys Vlasenko28055022010-01-04 20:49:58 +0100103 exitcode = EXIT_FAILURE;
Bernhard Reutner-Fischer4bf31272006-01-30 17:41:06 +0000104 continue;
105 }
Glenn L McGrathf01b8052003-04-27 06:02:14 +0000106
Bernhard Reutner-Fischer4bf31272006-01-30 17:41:06 +0000107 while ((c = getc(istream)) != EOF) {
Denys Vlasenko28055022010-01-04 20:49:58 +0100108 /* We grow line_out in chunks of 0x1000 bytes */
109 if ((offset_out & 0xfff) == 0) {
110 line_out = xrealloc(line_out, offset_out + 0x1000);
Bernhard Reutner-Fischer4bf31272006-01-30 17:41:06 +0000111 }
Denys Vlasenko28055022010-01-04 20:49:58 +0100112 rescan:
113 line_out[offset_out] = c;
Bernhard Reutner-Fischer4bf31272006-01-30 17:41:06 +0000114 if (c == '\n') {
Denys Vlasenko28055022010-01-04 20:49:58 +0100115 write2stdout(line_out, offset_out + 1);
Bernhard Reutner-Fischer4bf31272006-01-30 17:41:06 +0000116 column = offset_out = 0;
117 continue;
118 }
Bernhard Reutner-Fischer4bf31272006-01-30 17:41:06 +0000119 column = adjust_column(column, c);
Denys Vlasenko28055022010-01-04 20:49:58 +0100120 if (column <= width || offset_out == 0) {
121 /* offset_out == 0 case happens
122 * with small width (say, 1) and tabs.
123 * The very first tab already goes to column 8,
124 * but we must not wrap it */
125 offset_out++;
126 continue;
Glenn L McGrathf01b8052003-04-27 06:02:14 +0000127 }
128
Denys Vlasenko28055022010-01-04 20:49:58 +0100129 /* This character would make the line too long.
130 * Print the line plus a newline, and make this character
131 * start the next line */
132 if (option_mask32 & FLAG_BREAK_SPACES) {
133 unsigned i;
134 unsigned logical_end;
135
136 /* Look for the last blank. */
137 for (logical_end = offset_out - 1; (int)logical_end >= 0; logical_end--) {
138 if (!isblank(line_out[logical_end]))
139 continue;
140
141 /* Found a space or tab.
142 * Output up to and including it, and start a new line */
143 logical_end++;
144 /*line_out[logical_end] = '\n'; - NO! this nukes one buffered character */
145 write2stdout(line_out, logical_end);
146 putchar('\n');
147 /* Move the remainder to the beginning of the next line.
148 * The areas being copied here might overlap. */
149 memmove(line_out, line_out + logical_end, offset_out - logical_end);
150 offset_out -= logical_end;
151 for (column = i = 0; i < offset_out; i++) {
152 column = adjust_column(column, line_out[i]);
153 }
154 goto rescan;
155 }
156 /* No blank found, wrap will split the overlong word */
157 }
158 /* Output what we accumulated up to now, and start a new line */
159 line_out[offset_out] = '\n';
160 write2stdout(line_out, offset_out + 1);
161 column = offset_out = 0;
162 goto rescan;
163 } /* while (not EOF) */
Bernhard Reutner-Fischer4bf31272006-01-30 17:41:06 +0000164
165 if (offset_out) {
Denys Vlasenko28055022010-01-04 20:49:58 +0100166 write2stdout(line_out, offset_out);
Bernhard Reutner-Fischer4bf31272006-01-30 17:41:06 +0000167 }
168
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000169 if (fclose_if_not_stdin(istream)) {
Denys Vlasenko28055022010-01-04 20:49:58 +0100170 bb_simple_perror_msg(*argv);
171 exitcode = EXIT_FAILURE;
Glenn L McGrathf01b8052003-04-27 06:02:14 +0000172 }
173 } while (*++argv);
174
Denys Vlasenko28055022010-01-04 20:49:58 +0100175 fflush_stdout_and_exit(exitcode);
Glenn L McGrathf01b8052003-04-27 06:02:14 +0000176}