blob: a5d068262bb636488e1ed6adf7ffb70a1bc3ef3f [file] [log] [blame]
Erik Andersenfb002d02000-03-05 08:07:00 +00001/* vi: set sw=4 ts=4: */
2/*
Erik Andersen8f8d6d52000-05-01 22:30:37 +00003 * Mini tr implementation for busybox
Erik Andersenfb002d02000-03-05 08:07:00 +00004 *
Erik Andersen5afc8642000-05-02 00:07:56 +00005 * Copyright (c) Michiel Huisjes
6 *
7 * This version of tr is adapted from Minix tr and was modified
8 * by Erik Andersen <andersee@debian.org> to be used in busybox.
Erik Andersenfb002d02000-03-05 08:07:00 +00009 *
Erik Andersen8f8d6d52000-05-01 22:30:37 +000010 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18 * General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to the Free Software
22 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 *
24 * Original copyright notice is retained at the end of this file.
Erik Andersenfb002d02000-03-05 08:07:00 +000025 */
26
Erik Andersenfb002d02000-03-05 08:07:00 +000027#include <stdio.h>
Erik Andersenfb002d02000-03-05 08:07:00 +000028#include <string.h>
Erik Andersen8f8d6d52000-05-01 22:30:37 +000029#include <stdlib.h>
Erik Andersenfb002d02000-03-05 08:07:00 +000030#include <unistd.h>
Erik Andersen8f8d6d52000-05-01 22:30:37 +000031#include <sys/types.h>
Eric Andersencbe31da2001-02-20 06:14:08 +000032#include "busybox.h"
Erik Andersen330fd2b2000-05-19 05:35:19 +000033
/* This must be a #define, since when DODEBUG and BUFFERS_GO_IN_BSS are
 * enabled, we otherwise get a "storage size isn't constant" error. */
36#define ASCII 0377
Erik Andersenfb002d02000-03-05 08:07:00 +000037
/* File-scope state shared by the helpers in this file. */

/* Option flags; tr_main sets them to TRUE for -c, -d and -s respectively. */
static char com_fl;
static char del_fl;
static char sq_fl;

/* Read cursor into the input buffer and write cursor into the output buffer. */
static short in_index;
static short out_index;

/* The remaining pointers refer to buffers that tr_main reserves. */
static unsigned char *pinput;	/* bytes read from stdin by convert() */
static unsigned char *poutput;	/* translated bytes waiting to be written */
static unsigned char *pvector;	/* translation table: input byte -> output byte */
static char *pinvec;		/* nonzero for every byte in the expanded STRING1 */
static char *poutvec;		/* nonzero for every byte in the expanded STRING2 */
Erik Andersenfb002d02000-03-05 08:07:00 +000045
Erik Andersenfb002d02000-03-05 08:07:00 +000046
Erik Andersen8f8d6d52000-05-01 22:30:37 +000047static void convert()
Erik Andersenfb002d02000-03-05 08:07:00 +000048{
Erik Andersen8f8d6d52000-05-01 22:30:37 +000049 short read_chars = 0;
50 short c, coded;
51 short last = -1;
Erik Andersenfb002d02000-03-05 08:07:00 +000052
Erik Andersen8f8d6d52000-05-01 22:30:37 +000053 for (;;) {
54 if (in_index == read_chars) {
Mark Whitley59ab0252001-01-23 22:30:04 +000055 if ((read_chars = read(0, (char *) pinput, BUFSIZ)) <= 0) {
56 if (write(1, (char *) poutput, out_index) != out_index)
Erik Andersen330fd2b2000-05-19 05:35:19 +000057 write(2, write_error, strlen(write_error));
Erik Andersen8f8d6d52000-05-01 22:30:37 +000058 exit(0);
Erik Andersenfb002d02000-03-05 08:07:00 +000059 }
Erik Andersen8f8d6d52000-05-01 22:30:37 +000060 in_index = 0;
61 }
Mark Whitley59ab0252001-01-23 22:30:04 +000062 c = pinput[in_index++];
63 coded = pvector[c];
64 if (del_fl && pinvec[c])
Erik Andersen8f8d6d52000-05-01 22:30:37 +000065 continue;
Mark Whitley59ab0252001-01-23 22:30:04 +000066 if (sq_fl && last == coded && (pinvec[c] || poutvec[coded]))
Erik Andersen8f8d6d52000-05-01 22:30:37 +000067 continue;
Mark Whitley59ab0252001-01-23 22:30:04 +000068 poutput[out_index++] = last = coded;
Erik Andersen8f8d6d52000-05-01 22:30:37 +000069 if (out_index == BUFSIZ) {
Mark Whitley59ab0252001-01-23 22:30:04 +000070 if (write(1, (char *) poutput, out_index) != out_index) {
Erik Andersen330fd2b2000-05-19 05:35:19 +000071 write(2, write_error, strlen(write_error));
Erik Andersen8f8d6d52000-05-01 22:30:37 +000072 exit(1);
Erik Andersenfb002d02000-03-05 08:07:00 +000073 }
Erik Andersen8f8d6d52000-05-01 22:30:37 +000074 out_index = 0;
75 }
Erik Andersenfb002d02000-03-05 08:07:00 +000076 }
77
Erik Andersenfb002d02000-03-05 08:07:00 +000078 /* NOTREACHED */
Erik Andersen8f8d6d52000-05-01 22:30:37 +000079}
80
Eric Andersen00143ba2000-07-13 16:40:41 +000081static void map(register unsigned char *string1, unsigned int string1_len,
82 register unsigned char *string2, unsigned int string2_len)
Erik Andersen8f8d6d52000-05-01 22:30:37 +000083{
84 unsigned char last = '0';
Eric Andersen00143ba2000-07-13 16:40:41 +000085 unsigned int i, j;
Erik Andersen8f8d6d52000-05-01 22:30:37 +000086
Eric Andersen00143ba2000-07-13 16:40:41 +000087 for (j = 0, i = 0; i < string1_len; i++) {
88 if (string2_len <= j)
Mark Whitley59ab0252001-01-23 22:30:04 +000089 pvector[string1[i]] = last;
Erik Andersen8f8d6d52000-05-01 22:30:37 +000090 else
Mark Whitley59ab0252001-01-23 22:30:04 +000091 pvector[string1[i]] = last = string2[j++];
Erik Andersen8f8d6d52000-05-01 22:30:37 +000092 }
93}
94
/*
 * Expand a set specification into the literal bytes it denotes and
 * store them in `buffer`.  Returns the number of bytes stored.
 *
 * Supported constructs:
 *   Ranges,  e.g., [0-9] ==> 0123456789
 *   Escapes, e.g., \a    ==> Control-G
 *
 * A '[' that does not start a complete "[x-y" range is copied literally.
 * Range endpoints are compared as unsigned bytes, so a range whose upper
 * bound is below its lower bound expands to nothing.
 *
 * NOTE(review): no bounds checking is done on `buffer`; the caller has to
 * supply enough room for the fully expanded set.
 */
static unsigned int expand(const char *arg, register unsigned char *buffer)
{
	unsigned char *buffer_start = buffer;
	int lo, hi;

	while (*arg) {
		if (*arg == '\\') {
			arg++;
			*buffer++ = process_escape_sequence(&arg);
		} else if (*arg == '[' && arg[1] != '\0' && arg[2] == '-'
				   && arg[3] != '\0') {
			/* The checks above are ordered so that no byte beyond the
			 * terminating NUL is ever inspected. */
			lo = (unsigned char) arg[1];
			hi = (unsigned char) arg[3];
			while (lo <= hi)
				*buffer++ = lo++;
			arg += 4;
			if (*arg != '\0')
				arg++;			/* Skip the assumed ']' */
		} else
			*buffer++ = *arg++;
	}

	return (unsigned int) (buffer - buffer_start);
}
126
Eric Andersenfad04fd2000-07-14 06:49:52 +0000127static int complement(unsigned char *buffer, int buffer_len)
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000128{
Eric Andersen1ca20a72001-03-21 07:34:27 +0000129 register short i, j, ix;
Eric Andersenfad04fd2000-07-14 06:49:52 +0000130 char conv[ASCII + 2];
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000131
Eric Andersen1ca20a72001-03-21 07:34:27 +0000132 ix = 0;
Eric Andersen00143ba2000-07-13 16:40:41 +0000133 for (i = 0; i <= ASCII; i++) {
134 for (j = 0; j < buffer_len; j++)
135 if (buffer[j] == i)
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000136 break;
Eric Andersen00143ba2000-07-13 16:40:41 +0000137 if (j == buffer_len)
Eric Andersen1ca20a72001-03-21 07:34:27 +0000138 conv[ix++] = i & ASCII;
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000139 }
Eric Andersen1ca20a72001-03-21 07:34:27 +0000140 memcpy(buffer, conv, ix);
141 return ix;
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000142}
143
144extern int tr_main(int argc, char **argv)
145{
146 register unsigned char *ptr;
Eric Andersenfad04fd2000-07-14 06:49:52 +0000147 int output_length=0, input_length;
Eric Andersenf6aa13d2001-03-23 17:08:21 +0000148 int idx = 1;
Eric Andersenfad04fd2000-07-14 06:49:52 +0000149 int i;
Eric Andersend35c2152001-01-25 23:49:09 +0000150 RESERVE_BB_BUFFER(output, BUFSIZ);
151 RESERVE_BB_BUFFER(input, BUFSIZ);
152 RESERVE_BB_UBUFFER(vector, ASCII+1);
153 RESERVE_BB_BUFFER(invec, ASCII+1);
154 RESERVE_BB_BUFFER(outvec, ASCII+1);
Mark Whitley59ab0252001-01-23 22:30:04 +0000155
156 /* ... but make them available globally */
157 poutput = output;
158 pinput = input;
159 pvector = vector;
160 pinvec = invec;
161 poutvec = outvec;
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000162
Eric Andersenf6aa13d2001-03-23 17:08:21 +0000163 if (argc > 1 && argv[idx][0] == '-') {
164 for (ptr = (unsigned char *) &argv[idx][1]; *ptr; ptr++) {
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000165 switch (*ptr) {
166 case 'c':
167 com_fl = TRUE;
168 break;
169 case 'd':
170 del_fl = TRUE;
171 break;
172 case 's':
173 sq_fl = TRUE;
174 break;
175 default:
Eric Andersen67991cf2001-02-14 21:23:06 +0000176 show_usage();
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000177 }
178 }
Eric Andersenf6aa13d2001-03-23 17:08:21 +0000179 idx++;
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000180 }
181 for (i = 0; i <= ASCII; i++) {
182 vector[i] = i;
183 invec[i] = outvec[i] = FALSE;
184 }
185
Eric Andersenf6aa13d2001-03-23 17:08:21 +0000186 if (argv[idx] != NULL) {
187 input_length = expand(argv[idx++], input);
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000188 if (com_fl)
Eric Andersen00143ba2000-07-13 16:40:41 +0000189 input_length = complement(input, input_length);
Eric Andersenf6aa13d2001-03-23 17:08:21 +0000190 if (argv[idx] != NULL) {
191 if (*argv[idx] == '\0')
Matt Kraaidd19c692001-01-31 19:00:21 +0000192 error_msg_and_die("STRING2 cannot be empty");
Eric Andersenf6aa13d2001-03-23 17:08:21 +0000193 output_length = expand(argv[idx], output);
Eric Andersen00143ba2000-07-13 16:40:41 +0000194 map(input, input_length, output, output_length);
Eric Andersena03d86c2000-07-10 16:38:50 +0000195 }
Eric Andersen00143ba2000-07-13 16:40:41 +0000196 for (i = 0; i < input_length; i++)
Eric Andersened3ef502001-01-27 08:24:39 +0000197 invec[(int)input[i]] = TRUE;
Eric Andersen00143ba2000-07-13 16:40:41 +0000198 for (i = 0; i < output_length; i++)
Eric Andersened3ef502001-01-27 08:24:39 +0000199 outvec[(int)output[i]] = TRUE;
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000200 }
201 convert();
Erik Andersenfb002d02000-03-05 08:07:00 +0000202 return (0);
203}
204
Erik Andersenfb002d02000-03-05 08:07:00 +0000205/*
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000206 * Copyright (c) 1987,1997, Prentice Hall
207 * All rights reserved.
208 *
209 * Redistribution and use of the MINIX operating system in source and
210 * binary forms, with or without modification, are permitted provided
211 * that the following conditions are met:
212 *
213 * Redistributions of source code must retain the above copyright
214 * notice, this list of conditions and the following disclaimer.
215 *
216 * Redistributions in binary form must reproduce the above
217 * copyright notice, this list of conditions and the following
218 * disclaimer in the documentation and/or other materials provided
219 * with the distribution.
220 *
221 * Neither the name of Prentice Hall nor the names of the software
222 * authors or contributors may be used to endorse or promote
223 * products derived from this software without specific prior
224 * written permission.
225 *
226 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS, AUTHORS, AND
227 * CONTRIBUTORS ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES,
228 * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
229 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
230 * IN NO EVENT SHALL PRENTICE HALL OR ANY AUTHORS OR CONTRIBUTORS BE
231 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
232 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
233 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
234 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
235 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
236 * OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
237 * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
238 *
Erik Andersenfb002d02000-03-05 08:07:00 +0000239 */
Erik Andersenfb002d02000-03-05 08:07:00 +0000240