blob: 29affc932bf16781bcb789812897357997afac82 [file] [log] [blame]
Denis Vlasenko3952f202007-08-13 14:10:24 +00001/* expand - convert tabs to spaces
2 * unexpand - convert spaces to tabs
3 *
4 * Copyright (C) 89, 91, 1995-2006 Free Software Foundation, Inc.
5 *
Denys Vlasenko0ef64bd2010-08-16 20:14:46 +02006 * Licensed under GPLv2 or later, see file LICENSE in this source tree.
Denis Vlasenko3952f202007-08-13 14:10:24 +00007 *
8 * David MacKenzie <djm@gnu.ai.mit.edu>
9 *
10 * Options for expand:
11 * -t num --tabs=NUM Convert tabs to num spaces (default 8 spaces).
12 * -i --initial Only convert initial tabs on each line to spaces.
13 *
14 * Options for unexpand:
15 * -a --all Convert all blanks, instead of just initial blanks.
16 * -f --first-only Convert only leading sequences of blanks (default).
17 * -t num --tabs=NUM Have tabs num characters apart instead of 8.
18 *
19 * Busybox version (C) 2007 by Tito Ragusa <farmatito@tiscali.it>
20 *
 * Caveat: these versions of expand and unexpand don't accept tab lists.
22 */
Denys Vlasenkoaf3f4202016-11-23 14:46:56 +010023//config:config EXPAND
24//config: bool "expand"
25//config: default y
26//config: help
27//config: By default, convert all tabs to spaces.
28//config:
29//config:config FEATURE_EXPAND_LONG_OPTIONS
30//config: bool "Enable long options"
31//config: default y
32//config: depends on EXPAND && LONG_OPTS
Denys Vlasenkoaf3f4202016-11-23 14:46:56 +010033//config:
34//config:config UNEXPAND
35//config: bool "unexpand"
36//config: default y
37//config: help
38//config: By default, convert only leading sequences of blanks to tabs.
39//config:
40//config:config FEATURE_UNEXPAND_LONG_OPTIONS
41//config: bool "Enable long options"
42//config: default y
43//config: depends on UNEXPAND && LONG_OPTS
Denys Vlasenkoaf3f4202016-11-23 14:46:56 +010044
45//applet:IF_EXPAND(APPLET(expand, BB_DIR_USR_BIN, BB_SUID_DROP))
46//applet:IF_UNEXPAND(APPLET_ODDNAME(unexpand, expand, BB_DIR_USR_BIN, BB_SUID_DROP, unexpand))
47
48//kbuild:lib-$(CONFIG_EXPAND) += expand.o
49//kbuild:lib-$(CONFIG_UNEXPAND) += expand.o
Pere Orga34425382011-03-31 14:43:25 +020050
51//usage:#define expand_trivial_usage
52//usage: "[-i] [-t N] [FILE]..."
53//usage:#define expand_full_usage "\n\n"
54//usage: "Convert tabs to spaces, writing to stdout\n"
Pere Orga34425382011-03-31 14:43:25 +020055//usage: IF_FEATURE_EXPAND_LONG_OPTIONS(
56//usage: "\n -i,--initial Don't convert tabs after non blanks"
57//usage: "\n -t,--tabs=N Tabstops every N chars"
58//usage: )
59//usage: IF_NOT_FEATURE_EXPAND_LONG_OPTIONS(
60//usage: "\n -i Don't convert tabs after non blanks"
61//usage: "\n -t Tabstops every N chars"
62//usage: )
63
64//usage:#define unexpand_trivial_usage
65//usage: "[-fa][-t N] [FILE]..."
66//usage:#define unexpand_full_usage "\n\n"
67//usage: "Convert spaces to tabs, writing to stdout\n"
Pere Orga34425382011-03-31 14:43:25 +020068//usage: IF_FEATURE_UNEXPAND_LONG_OPTIONS(
69//usage: "\n -a,--all Convert all blanks"
70//usage: "\n -f,--first-only Convert only leading blanks"
71//usage: "\n -t,--tabs=N Tabstops every N chars"
72//usage: )
73//usage: IF_NOT_FEATURE_UNEXPAND_LONG_OPTIONS(
74//usage: "\n -a Convert all blanks"
75//usage: "\n -f Convert only leading blanks"
76//usage: "\n -t N Tabstops every N chars"
77//usage: )
78
Denis Vlasenko3952f202007-08-13 14:10:24 +000079#include "libbb.h"
Tomas Heinrichd2b1ba62010-01-04 16:21:31 +010080#include "unicode.h"
Denis Vlasenko3952f202007-08-13 14:10:24 +000081
/* Option bit masks tested against the value returned by getopt32() */
enum {
	OPT_INITIAL = 0x1, /* only handle blanks at the start of a line */
	OPT_TABS    = 0x2, /* -t N was given */
	OPT_ALL     = 0x4, /* unexpand -a */
};
87
#if ENABLE_EXPAND
/*
 * Copy FILE to stdout one line at a time, replacing each converted tab
 * with enough spaces to reach the next multiple of tab_size.
 *
 * file:     stream read via xmalloc_fgets() until it returns NULL
 * tab_size: distance between tab stops
 * opt:      option bits; with OPT_INITIAL set, conversion stops at the
 *           first character of a line that is neither space nor tab
 */
static void expand(FILE *file, unsigned tab_size, unsigned opt)
{
	char *line;

	while ((line = xmalloc_fgets(file)) != NULL) {
		/* First character of the line that has not been written yet */
		char *seg = line;
		char *cur;

		for (cur = line; *cur != '\0'; cur++) {
			unsigned width;
			unsigned pad;

			if ((opt & OPT_INITIAL) && !isblank((unsigned char)*cur)) {
				/* leading blanks are over: the rest is copied as is */
				break;
			}
			if (*cur != '\t')
				continue;

			/* Cut the line at the tab so [seg, cur) is a string */
			*cur = '\0';
# if ENABLE_UNICODE_SUPPORT
			width = unicode_strwidth(seg);
# else
			width = cur - seg;
# endif
			/*
			 * seg starts either at the beginning of the line or
			 * right after a tab, so its width modulo tab_size is
			 * the offset from the previous tab stop.
			 * Consecutive tabs are simply handled one at a time.
			 */
			pad = tab_size - (width % tab_size);
			printf("%s%*s", seg, pad, "");
			seg = cur + 1;
		}
		/* Whatever follows the last converted tab goes out untouched */
		fputs(seg, stdout);
		free(line);
	}
}
#endif
124
#if ENABLE_UNEXPAND
/*
 * Copy FILE to stdout one line at a time, replacing runs of blanks
 * (spaces and tabs) with tabs where a run reaches a tab stop.
 *
 * file:     stream read via xmalloc_fgets() until it returns NULL
 * tab_size: distance between tab stops
 * opt:      option bits; with OPT_INITIAL set, the remainder of the line
 *           is printed unchanged as soon as a blank run has been flushed
 *           and the scan is no longer at the very start of the line
 */
static void unexpand(FILE *file, unsigned tab_size, unsigned opt)
{
	char *line;

	while ((line = xmalloc_fgets(file)) != NULL) {
		char *ptr = line;
		/*
		 * Current column, counted from a tab stop at or before the
		 * start of the blank run that is pending (not printed yet).
		 */
		unsigned column = 0;

		while (*ptr) {
			unsigned n;
			unsigned len = 0;

			/* Swallow spaces; they are only counted for now */
			while (*ptr == ' ') {
				ptr++;
				len++;
			}
			column += len;
			if (*ptr == '\t') {
				/* A tab moves to the next tab stop */
				column += tab_size - (column % tab_size);
				ptr++;
				/*
				 * Keep accumulating blanks while there is more
				 * input. If the line ends right here (last line
				 * of a file without trailing newline), fall
				 * through so that the pending blanks are
				 * written instead of being silently dropped.
				 */
				if (*ptr != '\0')
					continue;
			}

			/* Emit one tab per tab stop crossed by the blank run... */
			n = column / tab_size;
			if (n) {
				/* ...and keep only the spaces past the last stop */
				len = column = column % tab_size;
				while (n--)
					putchar('\t');
			}

			if ((opt & OPT_INITIAL) && ptr != line) {
				/* leftover spaces, then the rest of the line verbatim */
				printf("%*s%s", (int)len, "", ptr);
				break;
			}
			/* Leftover spaces, then the text up to the next blank */
			n = strcspn(ptr, "\t ");
			printf("%*s%.*s", (int)len, "", (int)n, ptr);
# if ENABLE_UNICODE_SUPPORT
			{
				/* Temporarily terminate the word to measure its width */
				char c = ptr[n];
				ptr[n] = '\0';
				len = unicode_strwidth(ptr);
				ptr[n] = c;
			}
# else
			len = n;
# endif
			ptr += n;
			column = (column + len) % tab_size;
		}
		free(line);
	}
}
#endif
179
Denis Vlasenko9b49a5e2007-10-11 10:05:36 +0000180int expand_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
Denis Vlasenkoa60f84e2008-07-05 09:18:54 +0000181int expand_main(int argc UNUSED_PARAM, char **argv)
Denis Vlasenko3952f202007-08-13 14:10:24 +0000182{
183 /* Default 8 spaces for 1 tab */
184 const char *opt_t = "8";
185 FILE *file;
186 unsigned tab_size;
187 unsigned opt;
188 int exit_status = EXIT_SUCCESS;
189
190#if ENABLE_FEATURE_EXPAND_LONG_OPTIONS
191 static const char expand_longopts[] ALIGN1 =
192 /* name, has_arg, val */
193 "initial\0" No_argument "i"
194 "tabs\0" Required_argument "t"
195 ;
196#endif
197#if ENABLE_FEATURE_UNEXPAND_LONG_OPTIONS
198 static const char unexpand_longopts[] ALIGN1 =
199 /* name, has_arg, val */
200 "first-only\0" No_argument "i"
201 "tabs\0" Required_argument "t"
202 "all\0" No_argument "a"
203 ;
204#endif
Denys Vlasenko28055022010-01-04 20:49:58 +0100205 init_unicode();
Denis Vlasenko3952f202007-08-13 14:10:24 +0000206
207 if (ENABLE_EXPAND && (!ENABLE_UNEXPAND || applet_name[0] == 'e')) {
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000208 IF_FEATURE_EXPAND_LONG_OPTIONS(applet_long_options = expand_longopts);
Denis Vlasenkofe7cd642007-08-18 15:32:12 +0000209 opt = getopt32(argv, "it:", &opt_t);
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000210 } else {
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000211 IF_FEATURE_UNEXPAND_LONG_OPTIONS(applet_long_options = unexpand_longopts);
Denis Vlasenko3952f202007-08-13 14:10:24 +0000212 /* -t NUM sets also -a */
213 opt_complementary = "ta";
Denis Vlasenkofe7cd642007-08-18 15:32:12 +0000214 opt = getopt32(argv, "ft:a", &opt_t);
Denis Vlasenko3952f202007-08-13 14:10:24 +0000215 /* -f --first-only is the default */
216 if (!(opt & OPT_ALL)) opt |= OPT_INITIAL;
217 }
218 tab_size = xatou_range(opt_t, 1, UINT_MAX);
219
220 argv += optind;
221
Denis Vlasenko3952f202007-08-13 14:10:24 +0000222 if (!*argv) {
223 *--argv = (char*)bb_msg_standard_input;
Denis Vlasenko3952f202007-08-13 14:10:24 +0000224 }
Denis Vlasenko3952f202007-08-13 14:10:24 +0000225 do {
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000226 file = fopen_or_warn_stdin(*argv);
227 if (!file) {
228 exit_status = EXIT_FAILURE;
229 continue;
Denis Vlasenko3952f202007-08-13 14:10:24 +0000230 }
231
232 if (ENABLE_EXPAND && (!ENABLE_UNEXPAND || applet_name[0] == 'e'))
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000233 IF_EXPAND(expand(file, tab_size, opt));
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000234 else
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000235 IF_UNEXPAND(unexpand(file, tab_size, opt));
Denis Vlasenko3952f202007-08-13 14:10:24 +0000236
237 /* Check and close the file */
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000238 if (fclose_if_not_stdin(file)) {
Denis Vlasenko0c97c9d2007-10-01 11:58:38 +0000239 bb_simple_perror_msg(*argv);
Denis Vlasenko3952f202007-08-13 14:10:24 +0000240 exit_status = EXIT_FAILURE;
241 }
242 /* If stdin also clear EOF */
Denis Vlasenko6a2f7f42007-08-16 10:35:17 +0000243 if (file == stdin)
Denis Vlasenko3952f202007-08-13 14:10:24 +0000244 clearerr(file);
245 } while (*++argv);
246
247 /* Now close stdin also */
248 /* (if we didn't read from it, it's a no-op) */
249 if (fclose(stdin))
250 bb_perror_msg_and_die(bb_msg_standard_input);
251
252 fflush_stdout_and_exit(exit_status);
253}