Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 1 | /* expand - convert tabs to spaces |
| 2 | * unexpand - convert spaces to tabs |
| 3 | * |
| 4 | * Copyright (C) 89, 91, 1995-2006 Free Software Foundation, Inc. |
| 5 | * |
| 6 | * Licensed under GPLv2 or later, see file LICENSE in this tarball for details. |
| 7 | * |
| 8 | * David MacKenzie <djm@gnu.ai.mit.edu> |
| 9 | * |
| 10 | * Options for expand: |
| 11 | * -t num --tabs=NUM Convert tabs to num spaces (default 8 spaces). |
| 12 | * -i --initial Only convert initial tabs on each line to spaces. |
| 13 | * |
| 14 | * Options for unexpand: |
| 15 | * -a --all Convert all blanks, instead of just initial blanks. |
| 16 | * -f --first-only Convert only leading sequences of blanks (default). |
| 17 | * -t num --tabs=NUM Have tabs num characters apart instead of 8. |
| 18 | * |
| 19 | * Busybox version (C) 2007 by Tito Ragusa <farmatito@tiscali.it> |
| 20 | * |
| 21 | * Caveat: these versions of expand and unexpand don't accept tab lists. |
| 22 | */ |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 23 | #include "libbb.h" |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 24 | #include "unicode.h" |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 25 | |
/* Option flag bits tested in the "opt" mask by expand(), unexpand() and expand_main() */
enum {
	OPT_INITIAL = 0x1, /* only convert blanks at the start of a line */
	OPT_TABS    = 0x2, /* a tab size was given */
	OPT_ALL     = 0x4, /* unexpand: convert all blanks */
};
| 31 | |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 32 | #if ENABLE_EXPAND |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 33 | static void expand(FILE *file, unsigned tab_size, unsigned opt) |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 34 | { |
| 35 | char *line; |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 36 | |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 37 | while ((line = xmalloc_fgets(file)) != NULL) { |
Denis Vlasenko | 3139ea7 | 2008-12-14 15:45:25 +0000 | [diff] [blame] | 38 | unsigned char c; |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 39 | char *ptr; |
| 40 | char *ptr_strbeg; |
Denis Vlasenko | 3139ea7 | 2008-12-14 15:45:25 +0000 | [diff] [blame] | 41 | |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 42 | ptr = ptr_strbeg = line; |
Denis Vlasenko | 3139ea7 | 2008-12-14 15:45:25 +0000 | [diff] [blame] | 43 | while ((c = *ptr) != '\0') { |
| 44 | if ((opt & OPT_INITIAL) && !isblank(c)) { |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 45 | /* not space or tab */ |
Denis Vlasenko | 3139ea7 | 2008-12-14 15:45:25 +0000 | [diff] [blame] | 46 | break; |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 47 | } |
Denis Vlasenko | 3139ea7 | 2008-12-14 15:45:25 +0000 | [diff] [blame] | 48 | if (c == '\t') { |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 49 | unsigned len; |
| 50 | *ptr = '\0'; |
Denys Vlasenko | 19158a8 | 2010-03-26 14:06:56 +0100 | [diff] [blame^] | 51 | # if ENABLE_UNICODE_SUPPORT |
Tomas Heinrich | 1abc07d | 2010-03-26 09:40:47 +0100 | [diff] [blame] | 52 | { |
| 53 | uni_stat_t uni_stat; |
| 54 | printable_string(&uni_stat, ptr_strbeg); |
| 55 | len = uni_stat.unicode_width; |
| 56 | } |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 57 | # else |
| 58 | len = ptr - ptr_strbeg; |
| 59 | # endif |
| 60 | len = tab_size - (len % tab_size); |
| 61 | /*while (ptr[1] == '\t') { ptr++; len += tab_size; } - can handle many tabs at once */ |
| 62 | printf("%s%*s", ptr_strbeg, len, ""); |
| 63 | ptr_strbeg = ptr + 1; |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 64 | } |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 65 | ptr++; |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 66 | } |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 67 | fputs(ptr_strbeg, stdout); |
Denis Vlasenko | 3139ea7 | 2008-12-14 15:45:25 +0000 | [diff] [blame] | 68 | free(line); |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 69 | } |
| 70 | } |
| 71 | #endif |
| 72 | |
| 73 | #if ENABLE_UNEXPAND |
Denis Vlasenko | 3139ea7 | 2008-12-14 15:45:25 +0000 | [diff] [blame] | 74 | static void unexpand(FILE *file, unsigned tab_size, unsigned opt) |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 75 | { |
| 76 | char *line; |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 77 | |
| 78 | while ((line = xmalloc_fgets(file)) != NULL) { |
Denis Vlasenko | e40e76f | 2008-12-26 14:56:03 +0000 | [diff] [blame] | 79 | char *ptr = line; |
| 80 | unsigned column = 0; |
| 81 | |
| 82 | while (*ptr) { |
| 83 | unsigned n; |
Tomas Heinrich | 968951f | 2010-03-26 09:46:07 +0100 | [diff] [blame] | 84 | unsigned len = 0; |
Denis Vlasenko | e40e76f | 2008-12-26 14:56:03 +0000 | [diff] [blame] | 85 | |
| 86 | while (*ptr == ' ') { |
Denis Vlasenko | e40e76f | 2008-12-26 14:56:03 +0000 | [diff] [blame] | 87 | ptr++; |
Tomas Heinrich | 968951f | 2010-03-26 09:46:07 +0100 | [diff] [blame] | 88 | len++; |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 89 | } |
Tomas Heinrich | 968951f | 2010-03-26 09:46:07 +0100 | [diff] [blame] | 90 | column += len; |
Denis Vlasenko | e40e76f | 2008-12-26 14:56:03 +0000 | [diff] [blame] | 91 | if (*ptr == '\t') { |
| 92 | column += tab_size - (column % tab_size); |
| 93 | ptr++; |
| 94 | continue; |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 95 | } |
Denis Vlasenko | e40e76f | 2008-12-26 14:56:03 +0000 | [diff] [blame] | 96 | |
| 97 | n = column / tab_size; |
Tomas Heinrich | 968951f | 2010-03-26 09:46:07 +0100 | [diff] [blame] | 98 | if (n) { |
| 99 | len = column = column % tab_size; |
| 100 | while (n--) |
| 101 | putchar('\t'); |
| 102 | } |
Denis Vlasenko | e40e76f | 2008-12-26 14:56:03 +0000 | [diff] [blame] | 103 | |
| 104 | if ((opt & OPT_INITIAL) && ptr != line) { |
Tomas Heinrich | 968951f | 2010-03-26 09:46:07 +0100 | [diff] [blame] | 105 | printf("%*s%s", len, "", ptr); |
Denis Vlasenko | e40e76f | 2008-12-26 14:56:03 +0000 | [diff] [blame] | 106 | break; |
| 107 | } |
| 108 | n = strcspn(ptr, "\t "); |
Tomas Heinrich | 968951f | 2010-03-26 09:46:07 +0100 | [diff] [blame] | 109 | printf("%*s%.*s", len, "", n, ptr); |
Denys Vlasenko | 19158a8 | 2010-03-26 14:06:56 +0100 | [diff] [blame^] | 110 | # if ENABLE_UNICODE_SUPPORT |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 111 | { |
| 112 | char c; |
Tomas Heinrich | 1abc07d | 2010-03-26 09:40:47 +0100 | [diff] [blame] | 113 | uni_stat_t uni_stat; |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 114 | c = ptr[n]; |
| 115 | ptr[n] = '\0'; |
Tomas Heinrich | 1abc07d | 2010-03-26 09:40:47 +0100 | [diff] [blame] | 116 | printable_string(&uni_stat, ptr); |
| 117 | len = uni_stat.unicode_width; |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 118 | ptr[n] = c; |
| 119 | } |
| 120 | # else |
| 121 | len = n; |
| 122 | # endif |
Denis Vlasenko | e40e76f | 2008-12-26 14:56:03 +0000 | [diff] [blame] | 123 | ptr += n; |
Tomas Heinrich | d2b1ba6 | 2010-01-04 16:21:31 +0100 | [diff] [blame] | 124 | column = (column + len) % tab_size; |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 125 | } |
Denis Vlasenko | e40e76f | 2008-12-26 14:56:03 +0000 | [diff] [blame] | 126 | free(line); |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 127 | } |
| 128 | } |
| 129 | #endif |
| 130 | |
Denis Vlasenko | 9b49a5e | 2007-10-11 10:05:36 +0000 | [diff] [blame] | 131 | int expand_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE; |
Denis Vlasenko | a60f84e | 2008-07-05 09:18:54 +0000 | [diff] [blame] | 132 | int expand_main(int argc UNUSED_PARAM, char **argv) |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 133 | { |
| 134 | /* Default 8 spaces for 1 tab */ |
| 135 | const char *opt_t = "8"; |
| 136 | FILE *file; |
| 137 | unsigned tab_size; |
| 138 | unsigned opt; |
| 139 | int exit_status = EXIT_SUCCESS; |
| 140 | |
| 141 | #if ENABLE_FEATURE_EXPAND_LONG_OPTIONS |
| 142 | static const char expand_longopts[] ALIGN1 = |
| 143 | /* name, has_arg, val */ |
| 144 | "initial\0" No_argument "i" |
| 145 | "tabs\0" Required_argument "t" |
| 146 | ; |
| 147 | #endif |
| 148 | #if ENABLE_FEATURE_UNEXPAND_LONG_OPTIONS |
| 149 | static const char unexpand_longopts[] ALIGN1 = |
| 150 | /* name, has_arg, val */ |
| 151 | "first-only\0" No_argument "i" |
| 152 | "tabs\0" Required_argument "t" |
| 153 | "all\0" No_argument "a" |
| 154 | ; |
| 155 | #endif |
Denys Vlasenko | 2805502 | 2010-01-04 20:49:58 +0100 | [diff] [blame] | 156 | init_unicode(); |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 157 | |
| 158 | if (ENABLE_EXPAND && (!ENABLE_UNEXPAND || applet_name[0] == 'e')) { |
Denis Vlasenko | 5e34ff2 | 2009-04-21 11:09:40 +0000 | [diff] [blame] | 159 | IF_FEATURE_EXPAND_LONG_OPTIONS(applet_long_options = expand_longopts); |
Denis Vlasenko | fe7cd64 | 2007-08-18 15:32:12 +0000 | [diff] [blame] | 160 | opt = getopt32(argv, "it:", &opt_t); |
Denis Vlasenko | 62a90cd | 2008-03-17 09:07:36 +0000 | [diff] [blame] | 161 | } else { |
Denis Vlasenko | 5e34ff2 | 2009-04-21 11:09:40 +0000 | [diff] [blame] | 162 | IF_FEATURE_UNEXPAND_LONG_OPTIONS(applet_long_options = unexpand_longopts); |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 163 | /* -t NUM sets also -a */ |
| 164 | opt_complementary = "ta"; |
Denis Vlasenko | fe7cd64 | 2007-08-18 15:32:12 +0000 | [diff] [blame] | 165 | opt = getopt32(argv, "ft:a", &opt_t); |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 166 | /* -f --first-only is the default */ |
| 167 | if (!(opt & OPT_ALL)) opt |= OPT_INITIAL; |
| 168 | } |
| 169 | tab_size = xatou_range(opt_t, 1, UINT_MAX); |
| 170 | |
| 171 | argv += optind; |
| 172 | |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 173 | if (!*argv) { |
| 174 | *--argv = (char*)bb_msg_standard_input; |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 175 | } |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 176 | do { |
Denis Vlasenko | 62a90cd | 2008-03-17 09:07:36 +0000 | [diff] [blame] | 177 | file = fopen_or_warn_stdin(*argv); |
| 178 | if (!file) { |
| 179 | exit_status = EXIT_FAILURE; |
| 180 | continue; |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 181 | } |
| 182 | |
| 183 | if (ENABLE_EXPAND && (!ENABLE_UNEXPAND || applet_name[0] == 'e')) |
Denis Vlasenko | 5e34ff2 | 2009-04-21 11:09:40 +0000 | [diff] [blame] | 184 | IF_EXPAND(expand(file, tab_size, opt)); |
Denis Vlasenko | 62a90cd | 2008-03-17 09:07:36 +0000 | [diff] [blame] | 185 | else |
Denis Vlasenko | 5e34ff2 | 2009-04-21 11:09:40 +0000 | [diff] [blame] | 186 | IF_UNEXPAND(unexpand(file, tab_size, opt)); |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 187 | |
| 188 | /* Check and close the file */ |
Denis Vlasenko | 62a90cd | 2008-03-17 09:07:36 +0000 | [diff] [blame] | 189 | if (fclose_if_not_stdin(file)) { |
Denis Vlasenko | 0c97c9d | 2007-10-01 11:58:38 +0000 | [diff] [blame] | 190 | bb_simple_perror_msg(*argv); |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 191 | exit_status = EXIT_FAILURE; |
| 192 | } |
| 193 | /* If stdin also clear EOF */ |
Denis Vlasenko | 6a2f7f4 | 2007-08-16 10:35:17 +0000 | [diff] [blame] | 194 | if (file == stdin) |
Denis Vlasenko | 3952f20 | 2007-08-13 14:10:24 +0000 | [diff] [blame] | 195 | clearerr(file); |
| 196 | } while (*++argv); |
| 197 | |
| 198 | /* Now close stdin also */ |
| 199 | /* (if we didn't read from it, it's a no-op) */ |
| 200 | if (fclose(stdin)) |
| 201 | bb_perror_msg_and_die(bb_msg_standard_input); |
| 202 | |
| 203 | fflush_stdout_and_exit(exit_status); |
| 204 | } |