blob: 563ee0837803240ced790b9201e90ada9e64ab82 [file] [log] [blame]
Erik Andersenfb002d02000-03-05 08:07:00 +00001/* vi: set sw=4 ts=4: */
2/*
Erik Andersen8f8d6d52000-05-01 22:30:37 +00003 * Mini tr implementation for busybox
Erik Andersenfb002d02000-03-05 08:07:00 +00004 *
Erik Andersen5afc8642000-05-02 00:07:56 +00005 * Copyright (c) Michiel Huisjes
6 *
7 * This version of tr is adapted from Minix tr and was modified
8 * by Erik Andersen <andersee@debian.org> to be used in busybox.
Erik Andersenfb002d02000-03-05 08:07:00 +00009 *
Erik Andersen8f8d6d52000-05-01 22:30:37 +000010 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18 * General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to the Free Software
22 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 *
24 * Original copyright notice is retained at the end of this file.
Erik Andersenfb002d02000-03-05 08:07:00 +000025 */
26
Erik Andersenfb002d02000-03-05 08:07:00 +000027#include "internal.h"
Erik Andersenfb002d02000-03-05 08:07:00 +000028#include <stdio.h>
Erik Andersenfb002d02000-03-05 08:07:00 +000029#include <string.h>
Erik Andersen8f8d6d52000-05-01 22:30:37 +000030#include <stdlib.h>
Erik Andersenfb002d02000-03-05 08:07:00 +000031#include <unistd.h>
Erik Andersen8f8d6d52000-05-01 22:30:37 +000032#include <sys/types.h>
Erik Andersen330fd2b2000-05-19 05:35:19 +000033#define BB_DECLARE_EXTERN
34#define bb_need_write_error
35#include "messages.c"
36
/*
 * Usage/help text for the tr applet.  Only the one-line synopsis is kept
 * when BB_FEATURE_TRIVIAL_HELP is defined.
 */
const char *tr_usage =
	"tr [-cds] STRING1 [STRING2]\n"
#ifndef BB_FEATURE_TRIVIAL_HELP
	"\n"
	"Translate, squeeze, and/or delete characters from\n"
	"standard input, writing to standard output.\n"
	"\n"
	"Options:\n"
	"\t-c\ttake complement of STRING1\n"
	"\t-d\tdelete input characters coded STRING1\n"
	"\t-s\tsqueeze multiple output characters of STRING2 into one character\n"
#endif
	;
Erik Andersenfb002d02000-03-05 08:07:00 +000047
Erik Andersenfb002d02000-03-05 08:07:00 +000048
Erik Andersenfb002d02000-03-05 08:07:00 +000049
/*
 * This file uses TRUE and FALSE as ordinary C truth values (1 and 0).
 * Force those values unconditionally: #undef of a name that is not a macro
 * is harmless, so this works whether or not an earlier header defined them.
 */
#undef TRUE
#undef FALSE
#define TRUE 1
#define FALSE 0

/*
 * Largest value of an 8-bit character (octal 0377 == 255).  The per-character
 * lookup tables in this file are declared with ASCII + 1 entries.
 */
#define ASCII 0377
Erik Andersenfb002d02000-03-05 08:07:00 +000058
Erik Andersen8f8d6d52000-05-01 22:30:37 +000059/* some glabals shared across this file */
60static char com_fl, del_fl, sq_fl;
61static unsigned char output[BUFSIZ], input[BUFSIZ];
62static unsigned char vector[ASCII + 1];
63static char invec[ASCII + 1], outvec[ASCII + 1];
64static short in_index, out_index;
Erik Andersenfb002d02000-03-05 08:07:00 +000065
Erik Andersenfb002d02000-03-05 08:07:00 +000066
Erik Andersen8f8d6d52000-05-01 22:30:37 +000067static void convert()
Erik Andersenfb002d02000-03-05 08:07:00 +000068{
Erik Andersen8f8d6d52000-05-01 22:30:37 +000069 short read_chars = 0;
70 short c, coded;
71 short last = -1;
Erik Andersenfb002d02000-03-05 08:07:00 +000072
Erik Andersen8f8d6d52000-05-01 22:30:37 +000073 for (;;) {
74 if (in_index == read_chars) {
75 if ((read_chars = read(0, (char *) input, BUFSIZ)) <= 0) {
76 if (write(1, (char *) output, out_index) != out_index)
Erik Andersen330fd2b2000-05-19 05:35:19 +000077 write(2, write_error, strlen(write_error));
Erik Andersen8f8d6d52000-05-01 22:30:37 +000078 exit(0);
Erik Andersenfb002d02000-03-05 08:07:00 +000079 }
Erik Andersen8f8d6d52000-05-01 22:30:37 +000080 in_index = 0;
81 }
82 c = input[in_index++];
83 coded = vector[c];
84 if (del_fl && invec[c])
85 continue;
86 if (sq_fl && last == coded && outvec[coded])
87 continue;
88 output[out_index++] = last = coded;
89 if (out_index == BUFSIZ) {
90 if (write(1, (char *) output, out_index) != out_index) {
Erik Andersen330fd2b2000-05-19 05:35:19 +000091 write(2, write_error, strlen(write_error));
Erik Andersen8f8d6d52000-05-01 22:30:37 +000092 exit(1);
Erik Andersenfb002d02000-03-05 08:07:00 +000093 }
Erik Andersen8f8d6d52000-05-01 22:30:37 +000094 out_index = 0;
95 }
Erik Andersenfb002d02000-03-05 08:07:00 +000096 }
97
Erik Andersenfb002d02000-03-05 08:07:00 +000098 /* NOTREACHED */
Erik Andersen8f8d6d52000-05-01 22:30:37 +000099}
100
Eric Andersen00143ba2000-07-13 16:40:41 +0000101static void map(register unsigned char *string1, unsigned int string1_len,
102 register unsigned char *string2, unsigned int string2_len)
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000103{
104 unsigned char last = '0';
Eric Andersen00143ba2000-07-13 16:40:41 +0000105 unsigned int i, j;
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000106
Eric Andersen00143ba2000-07-13 16:40:41 +0000107 for (j = 0, i = 0; i < string1_len; i++) {
108 if (string2_len <= j)
109 vector[string1[i]] = last;
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000110 else
Eric Andersen00143ba2000-07-13 16:40:41 +0000111 vector[string1[i]] = last = string2[j++];
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000112 }
113}
114
/*
 * Expand a set specification into the plain list of characters it denotes.
 *
 *   \...    an escape, decoded by process_escape_sequence()
 *   [a-b]   every character from a through b inclusive; the character
 *           following b (normally ']') is skipped
 *   other   copied through unchanged
 *
 * A '[' that does not start a complete "[a-b" sequence is copied through as
 * a literal character; the scan never moves past the terminating NUL of arg.
 * Range end points are compared as unsigned character values.
 *
 * arg     NUL-terminated set specification
 * buffer  receives the expanded characters; it must have room for at least
 *         BUFSIZ bytes (the callers in this file pass BUFSIZ-sized arrays)
 *
 * Returns the number of characters stored in buffer.  Expansion stops
 * silently once BUFSIZ characters have been stored, so buffer is never
 * overrun.
 */
static unsigned int expand(char *arg, register unsigned char *buffer)
{
	unsigned char *buffer_start = buffer;
	unsigned char *buffer_end = buffer + BUFSIZ;
	int i, ac;

	while (*arg && buffer < buffer_end) {
		if (*arg == '\\') {
			arg++;
			*buffer++ = process_escape_sequence(&arg);
		} else if (*arg == '[' && arg[1] != '\0' && arg[2] == '-'
				   && arg[3] != '\0') {
			/* arg[1] is tested first so arg[2]/arg[3] are never read past NUL */
			i = (unsigned char) arg[1];
			ac = (unsigned char) arg[3];
			while (i <= ac && buffer < buffer_end)
				*buffer++ = i++;
			arg += 4;
			if (*arg)
				arg++;			/* Skip ']' */
		} else
			*buffer++ = *arg++;
	}

	return (buffer - buffer_start);
}
142
/*
 * Replace the character set held in buffer by its complement: every
 * character value from 0 through 255 that does not occur among the first
 * buffer_len bytes, stored in ascending order.
 *
 * buffer      on entry the set to complement, on return the complemented
 *             set; must have room for up to 256 bytes
 * buffer_len  number of valid bytes in buffer on entry
 *
 * Returns the number of characters in the complemented set.
 */
static int complement(unsigned char *buffer, unsigned int buffer_len)
{
	/* One slot per 8-bit character value (the same range as ASCII + 1). */
	enum { NUM_CHARS = 256 };
	unsigned char present[NUM_CHARS];
	unsigned int pos;
	int ch;
	int index = 0;

	/* Record which characters occur in the set: one pass over buffer... */
	memset(present, 0, sizeof(present));
	for (pos = 0; pos < buffer_len; pos++)
		present[buffer[pos]] = 1;

	/*
	 * ...then emit the missing ones.  The membership information now lives
	 * in present[], so buffer can be overwritten in place.
	 */
	for (ch = 0; ch < NUM_CHARS; ch++) {
		if (!present[ch])
			buffer[index++] = ch;
	}
	return index;
}
159
160extern int tr_main(int argc, char **argv)
161{
162 register unsigned char *ptr;
Eric Andersen00143ba2000-07-13 16:40:41 +0000163 unsigned int output_length, input_length;
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000164 int index = 1;
165 short i;
166
167 if (argc > 1 && argv[index][0] == '-') {
168 for (ptr = (unsigned char *) &argv[index][1]; *ptr; ptr++) {
169 switch (*ptr) {
170 case 'c':
171 com_fl = TRUE;
172 break;
173 case 'd':
174 del_fl = TRUE;
175 break;
176 case 's':
177 sq_fl = TRUE;
178 break;
179 default:
Erik Andersen330fd2b2000-05-19 05:35:19 +0000180 usage(tr_usage);
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000181 }
182 }
183 index++;
184 }
185 for (i = 0; i <= ASCII; i++) {
186 vector[i] = i;
187 invec[i] = outvec[i] = FALSE;
188 }
189
190 if (argv[index] != NULL) {
Eric Andersen00143ba2000-07-13 16:40:41 +0000191 input_length = expand(argv[index++], input);
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000192 if (com_fl)
Eric Andersen00143ba2000-07-13 16:40:41 +0000193 input_length = complement(input, input_length);
Eric Andersena03d86c2000-07-10 16:38:50 +0000194 if (argv[index] != NULL) {
195 if (*argv[index] == '\0')
Matt Kraaibe84cd42000-07-12 17:02:35 +0000196 fatalError("STRING2 cannot be empty\n");
Eric Andersen00143ba2000-07-13 16:40:41 +0000197 output_length = expand(argv[index], output);
198 map(input, input_length, output, output_length);
Eric Andersena03d86c2000-07-10 16:38:50 +0000199 }
Eric Andersen00143ba2000-07-13 16:40:41 +0000200 for (i = 0; i < input_length; i++)
201 invec[input[i]] = TRUE;
202 for (i = 0; i < output_length; i++)
203 outvec[output[i]] = TRUE;
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000204 }
205 convert();
Erik Andersenfb002d02000-03-05 08:07:00 +0000206 return (0);
207}
208
Erik Andersenfb002d02000-03-05 08:07:00 +0000209/*
Erik Andersen8f8d6d52000-05-01 22:30:37 +0000210 * Copyright (c) 1987,1997, Prentice Hall
211 * All rights reserved.
212 *
213 * Redistribution and use of the MINIX operating system in source and
214 * binary forms, with or without modification, are permitted provided
215 * that the following conditions are met:
216 *
217 * Redistributions of source code must retain the above copyright
218 * notice, this list of conditions and the following disclaimer.
219 *
220 * Redistributions in binary form must reproduce the above
221 * copyright notice, this list of conditions and the following
222 * disclaimer in the documentation and/or other materials provided
223 * with the distribution.
224 *
225 * Neither the name of Prentice Hall nor the names of the software
226 * authors or contributors may be used to endorse or promote
227 * products derived from this software without specific prior
228 * written permission.
229 *
230 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS, AUTHORS, AND
231 * CONTRIBUTORS ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES,
232 * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
233 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
234 * IN NO EVENT SHALL PRENTICE HALL OR ANY AUTHORS OR CONTRIBUTORS BE
235 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
236 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
237 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
238 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
239 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
240 * OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
241 * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
242 *
Erik Andersenfb002d02000-03-05 08:07:00 +0000243 */
Erik Andersenfb002d02000-03-05 08:07:00 +0000244