blob: 91084b80b1638d84402529d7851b9c440384011c [file] [log] [blame]
/* expand - convert tabs to spaces
 * unexpand - convert spaces to tabs
 *
 * Copyright (C) 89, 91, 1995-2006 Free Software Foundation, Inc.
 *
 * Licensed under GPLv2 or later, see file LICENSE in this source tree.
 *
 * David MacKenzie <djm@gnu.ai.mit.edu>
 *
 * Options for expand:
 * -t num  --tabs NUM      Convert tabs to num spaces (default 8 spaces).
 * -i      --initial       Only convert initial tabs on each line to spaces.
 *
 * Options for unexpand:
 * -a      --all           Convert all blanks, instead of just initial blanks.
 * -f      --first-only    Convert only leading sequences of blanks (default).
 * -t num  --tabs NUM      Have tabs num characters apart instead of 8.
 *
 * Busybox version (C) 2007 by Tito Ragusa <farmatito@tiscali.it>
 *
 * Caveat: these versions of expand and unexpand don't accept tab lists.
 */
Denys Vlasenkoaf3f4202016-11-23 14:46:56 +010023//config:config EXPAND
Denys Vlasenko4eed2c62017-07-18 22:01:24 +020024//config: bool "expand (5.8 kb)"
Denys Vlasenkoaf3f4202016-11-23 14:46:56 +010025//config: default y
26//config: help
Denys Vlasenko72089cf2017-07-21 09:50:55 +020027//config: By default, convert all tabs to spaces.
Denys Vlasenkoaf3f4202016-11-23 14:46:56 +010028//config:
Denys Vlasenkoaf3f4202016-11-23 14:46:56 +010029//config:config UNEXPAND
Denys Vlasenko4eed2c62017-07-18 22:01:24 +020030//config: bool "unexpand (6 kb)"
Denys Vlasenkoaf3f4202016-11-23 14:46:56 +010031//config: default y
32//config: help
Denys Vlasenko72089cf2017-07-21 09:50:55 +020033//config: By default, convert only leading sequences of blanks to tabs.
Denys Vlasenkoaf3f4202016-11-23 14:46:56 +010034
35//applet:IF_EXPAND(APPLET(expand, BB_DIR_USR_BIN, BB_SUID_DROP))
Denys Vlasenko205d48e2017-01-29 14:57:33 +010036// APPLET_ODDNAME:name main location suid_type help
Denys Vlasenkoaf3f4202016-11-23 14:46:56 +010037//applet:IF_UNEXPAND(APPLET_ODDNAME(unexpand, expand, BB_DIR_USR_BIN, BB_SUID_DROP, unexpand))
38
39//kbuild:lib-$(CONFIG_EXPAND) += expand.o
40//kbuild:lib-$(CONFIG_UNEXPAND) += expand.o
Pere Orga34425382011-03-31 14:43:25 +020041
42//usage:#define expand_trivial_usage
43//usage: "[-i] [-t N] [FILE]..."
44//usage:#define expand_full_usage "\n\n"
45//usage: "Convert tabs to spaces, writing to stdout\n"
Pere Orga34425382011-03-31 14:43:25 +020046//usage: "\n -i Don't convert tabs after non blanks"
47//usage: "\n -t Tabstops every N chars"
Pere Orga34425382011-03-31 14:43:25 +020048
49//usage:#define unexpand_trivial_usage
50//usage: "[-fa][-t N] [FILE]..."
51//usage:#define unexpand_full_usage "\n\n"
52//usage: "Convert spaces to tabs, writing to stdout\n"
Pere Orga34425382011-03-31 14:43:25 +020053//usage: "\n -a Convert all blanks"
54//usage: "\n -f Convert only leading blanks"
55//usage: "\n -t N Tabstops every N chars"
Pere Orga34425382011-03-31 14:43:25 +020056
Denis Vlasenko3952f202007-08-13 14:10:24 +000057#include "libbb.h"
Tomas Heinrichd2b1ba62010-01-04 16:21:31 +010058#include "unicode.h"
Denis Vlasenko3952f202007-08-13 14:10:24 +000059
/*
 * Option bits as stored in the mask returned by getopt32long().
 * The bit positions are expected to follow the order of the short
 * options in the option strings used by expand_main()
 * ("it:" for expand, "ft:a" for unexpand).
 */
enum {
	OPT_INITIAL = 1 << 0,	/* expand -i / unexpand -f: leading blanks only */
	OPT_TABS    = 1 << 1,	/* -t N: tab stop distance given explicitly */
	OPT_ALL     = 1 << 2,	/* unexpand -a: convert all blanks */
};
65
#if ENABLE_EXPAND
/*
 * Copy FILE to stdout one line at a time, replacing every tab with the
 * number of spaces needed to reach the next multiple of tab_size.
 *
 * file     - input stream, read with xmalloc_fgets() until it returns NULL
 * tab_size - distance between tab stops; used as a divisor, so it must
 *            be non-zero
 * opt      - option mask; when OPT_INITIAL is set, conversion stops at the
 *            first character that is not a blank and the remainder of the
 *            line is copied unchanged
 */
static void expand(FILE *file, unsigned tab_size, unsigned opt)
{
	char *line;

	while ((line = xmalloc_fgets(file)) != NULL) {
		unsigned char c;
		char *ptr;
		char *ptr_strbeg; /* start of the text not yet written out */

		ptr = ptr_strbeg = line;
		while ((c = *ptr) != '\0') {
			if ((opt & OPT_INITIAL) && !isblank(c)) {
				/* not space or tab */
				break;
			}
			if (c == '\t') {
				unsigned len;

				/* Terminate the pending text in place so it can be
				 * measured and printed as a string. */
				*ptr = '\0';
				/* ptr_strbeg is either the line start or just past the
				 * previous tab (a tab stop), so the width of the pending
				 * text is enough to find the distance to the next stop. */
# if ENABLE_UNICODE_SUPPORT
				len = unicode_strwidth(ptr_strbeg);
# else
				len = ptr - ptr_strbeg;
# endif
				len = tab_size - (len % tab_size);
				/*while (ptr[1] == '\t') { ptr++; len += tab_size; } - can handle many tabs at once */
				/* printf's '*' width takes an int, not an unsigned */
				printf("%s%*s", ptr_strbeg, (int)len, "");
				ptr_strbeg = ptr + 1;
			}
			ptr++;
		}
		/* Whatever follows the last converted tab goes out verbatim */
		fputs(ptr_strbeg, stdout);
		free(line);
	}
}
#endif
102
#if ENABLE_UNEXPAND
/*
 * Copy FILE to stdout one line at a time, replacing runs of blanks
 * (spaces and tabs) that reach a tab stop with tab characters.
 *
 * file     - input stream, read with xmalloc_fgets() until it returns NULL
 * tab_size - distance between tab stops; used as a divisor, so it must
 *            be non-zero
 * opt      - option mask; when OPT_INITIAL is set, the rest of the line is
 *            copied unchanged once a blank run that does not start the
 *            scan at the beginning of the line has been handled
 *
 * "column" holds the current column modulo tab_size, plus one whole
 * tab_size for every tab stop crossed by blanks that have been consumed
 * but not written yet.
 */
static void unexpand(FILE *file, unsigned tab_size, unsigned opt)
{
	char *line;

	while ((line = xmalloc_fgets(file)) != NULL) {
		char *ptr = line;
		unsigned column = 0;
		unsigned pending;

		while (*ptr) {
			unsigned n;
			unsigned len = 0; /* spaces to emit before the next text */

			while (*ptr == ' ') {
				ptr++;
				len++;
			}
			column += len;
			if (*ptr == '\t') {
				/* Advance to the next tab stop; output is deferred
				 * until non-blank text (or end of line) is seen. */
				column += tab_size - (column % tab_size);
				ptr++;
				continue;
			}

			/* Emit one tab per tab stop crossed by the blank run;
			 * only the remainder is written as spaces. */
			n = column / tab_size;
			if (n) {
				len = column = column % tab_size;
				while (n--)
					putchar('\t');
			}

			if ((opt & OPT_INITIAL) && ptr != line) {
				/* printf's '*' width takes an int, not an unsigned */
				printf("%*s%s", (int)len, "", ptr);
				break;
			}
			/* Length of the text up to the next blank */
			n = strcspn(ptr, "\t ");
			printf("%*s%.*s", (int)len, "", (int)n, ptr);
# if ENABLE_UNICODE_SUPPORT
			{
				/* Measure the display width of just this text chunk */
				char c = ptr[n];
				ptr[n] = '\0';
				len = unicode_strwidth(ptr);
				ptr[n] = c;
			}
# else
			len = n;
# endif
			ptr += n;
			column = (column + len) % tab_size;
		}

		/* A line that ends in a tab without a trailing newline leaves the
		 * loop with tab stops still pending in "column"; write them out
		 * instead of dropping them. On every other exit path column is
		 * already below tab_size, so this emits nothing. */
		pending = column / tab_size;
		while (pending--)
			putchar('\t');

		free(line);
	}
}
#endif
157
Denis Vlasenko9b49a5e2007-10-11 10:05:36 +0000158int expand_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
Denis Vlasenkoa60f84e2008-07-05 09:18:54 +0000159int expand_main(int argc UNUSED_PARAM, char **argv)
Denis Vlasenko3952f202007-08-13 14:10:24 +0000160{
161 /* Default 8 spaces for 1 tab */
162 const char *opt_t = "8";
163 FILE *file;
164 unsigned tab_size;
165 unsigned opt;
166 int exit_status = EXIT_SUCCESS;
167
Denys Vlasenko28055022010-01-04 20:49:58 +0100168 init_unicode();
Denis Vlasenko3952f202007-08-13 14:10:24 +0000169
170 if (ENABLE_EXPAND && (!ENABLE_UNEXPAND || applet_name[0] == 'e')) {
Denys Vlasenko036585a2017-08-08 16:38:18 +0200171 opt = getopt32long(argv, "it:",
172 "initial\0" No_argument "i"
173 "tabs\0" Required_argument "t"
174 , &opt_t
175 );
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000176 } else {
Denys Vlasenko22542ec2017-08-08 21:55:02 +0200177 opt = getopt32long(argv, "^"
178 "ft:a"
179 "\0"
180 "ta" /* -t NUM sets -a */,
Denys Vlasenko036585a2017-08-08 16:38:18 +0200181 "first-only\0" No_argument "i"
182 "tabs\0" Required_argument "t"
183 "all\0" No_argument "a"
184 , &opt_t
185 );
Denis Vlasenko3952f202007-08-13 14:10:24 +0000186 /* -f --first-only is the default */
187 if (!(opt & OPT_ALL)) opt |= OPT_INITIAL;
188 }
189 tab_size = xatou_range(opt_t, 1, UINT_MAX);
190
191 argv += optind;
192
Denis Vlasenko3952f202007-08-13 14:10:24 +0000193 if (!*argv) {
194 *--argv = (char*)bb_msg_standard_input;
Denis Vlasenko3952f202007-08-13 14:10:24 +0000195 }
Denis Vlasenko3952f202007-08-13 14:10:24 +0000196 do {
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000197 file = fopen_or_warn_stdin(*argv);
198 if (!file) {
199 exit_status = EXIT_FAILURE;
200 continue;
Denis Vlasenko3952f202007-08-13 14:10:24 +0000201 }
202
203 if (ENABLE_EXPAND && (!ENABLE_UNEXPAND || applet_name[0] == 'e'))
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000204 IF_EXPAND(expand(file, tab_size, opt));
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000205 else
Denis Vlasenko5e34ff22009-04-21 11:09:40 +0000206 IF_UNEXPAND(unexpand(file, tab_size, opt));
Denis Vlasenko3952f202007-08-13 14:10:24 +0000207
208 /* Check and close the file */
Denis Vlasenko62a90cd2008-03-17 09:07:36 +0000209 if (fclose_if_not_stdin(file)) {
Denis Vlasenko0c97c9d2007-10-01 11:58:38 +0000210 bb_simple_perror_msg(*argv);
Denis Vlasenko3952f202007-08-13 14:10:24 +0000211 exit_status = EXIT_FAILURE;
212 }
213 /* If stdin also clear EOF */
Denis Vlasenko6a2f7f42007-08-16 10:35:17 +0000214 if (file == stdin)
Denis Vlasenko3952f202007-08-13 14:10:24 +0000215 clearerr(file);
216 } while (*++argv);
217
218 /* Now close stdin also */
219 /* (if we didn't read from it, it's a no-op) */
220 if (fclose(stdin))
221 bb_perror_msg_and_die(bb_msg_standard_input);
222
223 fflush_stdout_and_exit(exit_status);
224}