blob: 73ab0ece326e8aeef970ba5139fc2c6f94c275e5 [file] [log] [blame]
/* expand - convert tabs to spaces
 * unexpand - convert spaces to tabs
 *
 * Copyright (C) 89, 91, 1995-2006 Free Software Foundation, Inc.
 *
 * Licensed under GPLv2 or later, see file LICENSE in this source tree.
 *
 * David MacKenzie <djm@gnu.ai.mit.edu>
 *
 * Options for expand:
 * -t num  --tabs=NUM      Convert tabs to num spaces (default 8 spaces).
 * -i      --initial       Only convert initial tabs on each line to spaces.
 *
 * Options for unexpand:
 * -a      --all           Convert all blanks, instead of just initial blanks.
 * -f      --first-only    Convert only leading sequences of blanks (default).
 * -t num  --tabs=NUM      Have tabs num characters apart instead of 8.
 *
 * Busybox version (C) 2007 by Tito Ragusa <farmatito@tiscali.it>
 *
 * Caveat: these versions of expand and unexpand don't accept tab lists.
 */
Pere Orga34425382011-03-31 14:43:25 +020023
24//usage:#define expand_trivial_usage
25//usage: "[-i] [-t N] [FILE]..."
26//usage:#define expand_full_usage "\n\n"
27//usage: "Convert tabs to spaces, writing to stdout\n"
28//usage: "\nOptions:"
29//usage: IF_FEATURE_EXPAND_LONG_OPTIONS(
30//usage: "\n -i,--initial Don't convert tabs after non blanks"
31//usage: "\n -t,--tabs=N Tabstops every N chars"
32//usage: )
33//usage: IF_NOT_FEATURE_EXPAND_LONG_OPTIONS(
34//usage: "\n -i Don't convert tabs after non blanks"
35//usage: "\n -t Tabstops every N chars"
36//usage: )
37
38//usage:#define unexpand_trivial_usage
39//usage: "[-fa][-t N] [FILE]..."
40//usage:#define unexpand_full_usage "\n\n"
41//usage: "Convert spaces to tabs, writing to stdout\n"
42//usage: "\nOptions:"
43//usage: IF_FEATURE_UNEXPAND_LONG_OPTIONS(
44//usage: "\n -a,--all Convert all blanks"
45//usage: "\n -f,--first-only Convert only leading blanks"
46//usage: "\n -t,--tabs=N Tabstops every N chars"
47//usage: )
48//usage: IF_NOT_FEATURE_UNEXPAND_LONG_OPTIONS(
49//usage: "\n -a Convert all blanks"
50//usage: "\n -f Convert only leading blanks"
51//usage: "\n -t N Tabstops every N chars"
52//usage: )
53
Denis Vlasenko3952f202007-08-13 14:10:24 +000054#include "libbb.h"
Tomas Heinrichd2b1ba62010-01-04 16:21:31 +010055#include "unicode.h"
Denis Vlasenko3952f202007-08-13 14:10:24 +000056
/*
 * Option bit masks tested against the value returned by getopt32().
 * They have to line up with the order of the options in the option
 * strings used by expand_main(): "it:" for expand, "ft:a" for unexpand.
 */
enum {
	OPT_INITIAL = 1 << 0, /* expand -i / unexpand -f: leading blanks only */
	OPT_TABS    = 1 << 1, /* -t N: tab stop distance given */
	OPT_ALL     = 1 << 2, /* unexpand -a: convert all blanks */
};
62
#if ENABLE_EXPAND
/*
 * Copy FILE to stdout line by line, replacing every tab with the number
 * of spaces needed to reach the next multiple of tab_size.
 *
 * file     - input stream; read with xmalloc_fgets() until it returns NULL
 * tab_size - distance between tab stops; must be non-zero (it is a divisor)
 * opt      - option bits; with OPT_INITIAL, conversion stops at the first
 *            character of a line that is not a blank and the rest of the
 *            line is copied unchanged
 */
static void expand(FILE *file, unsigned tab_size, unsigned opt)
{
	char *line;

	while ((line = xmalloc_fgets(file)) != NULL) {
		unsigned char c;
		char *ptr;
		char *ptr_strbeg; /* start of the part of the line not yet printed */

		ptr = ptr_strbeg = line;
		while ((c = *ptr) != '\0') {
			if ((opt & OPT_INITIAL) && !isblank(c)) {
				/* not space or tab */
				break;
			}
			if (c == '\t') {
				unsigned len;

				/* Cut the pending segment off at the tab */
				*ptr = '\0';
# if ENABLE_UNICODE_SUPPORT
				{
					uni_stat_t uni_stat;
					printable_string(&uni_stat, ptr_strbeg);
					len = uni_stat.unicode_width;
				}
# else
				len = ptr - ptr_strbeg;
# endif
				/*
				 * The segment begins either at the line start or right
				 * after a previous tab, i.e. on a tab stop, so its width
				 * alone determines how much padding is needed.
				 */
				len = tab_size - (len % tab_size);
				fputs(ptr_strbeg, stdout);
				/*
				 * Emit the padding one space at a time: printf's "%*s"
				 * takes an int width, which an unsigned value above
				 * INT_MAX would turn into a negative (wrong) width.
				 */
				while (len--)
					putchar(' ');
				ptr_strbeg = ptr + 1;
			}
			ptr++;
		}
		/* Whatever follows the last converted tab is copied verbatim */
		fputs(ptr_strbeg, stdout);
		free(line);
	}
}
#endif
103
#if ENABLE_UNEXPAND
/*
 * Copy FILE to stdout line by line, replacing runs of blanks that reach
 * a tab stop with tab characters.
 *
 * file     - input stream; read with xmalloc_fgets() until it returns NULL
 * tab_size - distance between tab stops; must be non-zero (it is a divisor)
 * opt      - option bits; with OPT_INITIAL the remainder of the line is
 *            copied unchanged once a non-blank character has been reached
 *            past the start of the line
 *
 * "column" holds the offset of the already printed text within the
 * current tab stop plus the width of the blanks that were read but not
 * yet written.
 */
static void unexpand(FILE *file, unsigned tab_size, unsigned opt)
{
	char *line;

	while ((line = xmalloc_fgets(file)) != NULL) {
		char *ptr = line;
		unsigned column = 0;

		while (*ptr) {
			unsigned n;
			unsigned len = 0;

			/* Collect a run of spaces without printing it yet */
			while (*ptr == ' ') {
				ptr++;
				len++;
			}
			column += len;
			if (*ptr == '\t') {
				/* A tab advances to the next tab stop; keep collecting */
				column += tab_size - (column % tab_size);
				ptr++;
				continue;
			}

			/* Non-blank (or end of line): emit the collected blanks */
			n = column / tab_size;
			if (n) {
				/* Full tab stops become tabs, the remainder stays spaces */
				len = column = column % tab_size;
				while (n--)
					putchar('\t');
			}

			if ((opt & OPT_INITIAL) && ptr != line) {
				/* "%*s" requires an int argument, hence the cast */
				printf("%*s%s", (int)len, "", ptr);
				break;
			}
			n = strcspn(ptr, "\t ");
			/* "%*s" and "%.*s" require int arguments, hence the casts */
			printf("%*s%.*s", (int)len, "", (int)n, ptr);
# if ENABLE_UNICODE_SUPPORT
			{
				char c;
				uni_stat_t uni_stat;
				/* Temporarily terminate the word to measure its width */
				c = ptr[n];
				ptr[n] = '\0';
				printable_string(&uni_stat, ptr);
				len = uni_stat.unicode_width;
				ptr[n] = c;
			}
# else
			len = n;
# endif
			ptr += n;
			column = (column + len) % tab_size;
		}
		/*
		 * If the line ended right after a tab (possible only when the
		 * input lacks a final newline), the blanks collected above were
		 * never written. In every other case column is already below
		 * tab_size here, so this loop does nothing.
		 */
		while (column >= tab_size) {
			putchar('\t');
			column -= tab_size;
		}
		free(line);
	}
}
#endif
161
Denis Vlasenko9b49a5e2007-10-11 10:05:36 +0000162int expand_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
Denis Vlasenkoa60f84e2008-07-05 09:18:54 +0000163int expand_main(int argc UNUSED_PARAM, char **argv)
Denis Vlasenko3952f202007-08-13 14:10:24 +0000164{
165 /* Default 8 spaces for 1 tab */
166 const char *opt_t = "8";
167 FILE *file;
168 unsigned tab_size;
169 unsigned opt;
170 int exit_status = EXIT_SUCCESS;
171
172#if ENABLE_FEATURE_EXPAND_LONG_OPTIONS
173 static const char expand_longopts[] ALIGN1 =
174 /* name, has_arg, val */
175 "initial\0" No_argument "i"
176 "tabs\0" Required_argument "t"
177 ;
178#endif
179#if ENABLE_FEATURE_UNEXPAND_LONG_OPTIONS
180 static const char unexpand_longopts[] ALIGN1 =
181 /* name, has_arg, val */
182 "first-only\0" No_argument "i"
183 "tabs\0" Required_argument "t"
184 "all\0" No_argument "a"
185 ;
186#endif
Denys Vlasenko28055022010-01-04 20:49:58 +0100187 init_unicode();
Denis Vlasenko3952f202007-08-13 14:10:24 +0000188
189 if (ENABLE_EXPAND && (!ENABLE_UNEXPAND || applet_name[0] == 'e')) {
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000190 IF_FEATURE_EXPAND_LONG_OPTIONS(applet_long_options = expand_longopts);
Denis Vlasenkofe7cd642007-08-18 15:32:12 +0000191 opt = getopt32(argv, "it:", &opt_t);
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000192 } else {
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000193 IF_FEATURE_UNEXPAND_LONG_OPTIONS(applet_long_options = unexpand_longopts);
Denis Vlasenko3952f202007-08-13 14:10:24 +0000194 /* -t NUM sets also -a */
195 opt_complementary = "ta";
Denis Vlasenkofe7cd642007-08-18 15:32:12 +0000196 opt = getopt32(argv, "ft:a", &opt_t);
Denis Vlasenko3952f202007-08-13 14:10:24 +0000197 /* -f --first-only is the default */
198 if (!(opt & OPT_ALL)) opt |= OPT_INITIAL;
199 }
200 tab_size = xatou_range(opt_t, 1, UINT_MAX);
201
202 argv += optind;
203
Denis Vlasenko3952f202007-08-13 14:10:24 +0000204 if (!*argv) {
205 *--argv = (char*)bb_msg_standard_input;
Denis Vlasenko3952f202007-08-13 14:10:24 +0000206 }
Denis Vlasenko3952f202007-08-13 14:10:24 +0000207 do {
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000208 file = fopen_or_warn_stdin(*argv);
209 if (!file) {
210 exit_status = EXIT_FAILURE;
211 continue;
Denis Vlasenko3952f202007-08-13 14:10:24 +0000212 }
213
214 if (ENABLE_EXPAND && (!ENABLE_UNEXPAND || applet_name[0] == 'e'))
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000215 IF_EXPAND(expand(file, tab_size, opt));
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000216 else
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000217 IF_UNEXPAND(unexpand(file, tab_size, opt));
Denis Vlasenko3952f202007-08-13 14:10:24 +0000218
219 /* Check and close the file */
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000220 if (fclose_if_not_stdin(file)) {
Denis Vlasenko0c97c9d2007-10-01 11:58:38 +0000221 bb_simple_perror_msg(*argv);
Denis Vlasenko3952f202007-08-13 14:10:24 +0000222 exit_status = EXIT_FAILURE;
223 }
224 /* If stdin also clear EOF */
Denis Vlasenko6a2f7f42007-08-16 10:35:17 +0000225 if (file == stdin)
Denis Vlasenko3952f202007-08-13 14:10:24 +0000226 clearerr(file);
227 } while (*++argv);
228
229 /* Now close stdin also */
230 /* (if we didn't read from it, it's a no-op) */
231 if (fclose(stdin))
232 bb_perror_msg_and_die(bb_msg_standard_input);
233
234 fflush_stdout_and_exit(exit_status);
235}