xref: /openbsd/usr.bin/tr/tr.c (revision 09467b48)
1 /*	$OpenBSD: tr.c,v 1.19 2015/10/09 01:37:09 deraadt Exp $	*/
2 /*	$NetBSD: tr.c,v 1.5 1995/08/31 22:13:48 jtc Exp $	*/
3 
4 /*
5  * Copyright (c) 1988, 1993
6  *	The Regents of the University of California.  All rights reserved.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  * 3. Neither the name of the University nor the names of its contributors
17  *    may be used to endorse or promote products derived from this software
18  *    without specific prior written permission.
19  *
20  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
21  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
24  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30  * SUCH DAMAGE.
31  */
32 
33 #include <sys/types.h>
34 
35 #include <stdio.h>
36 #include <stdlib.h>
37 #include <string.h>
38 #include <unistd.h>
39 #include <err.h>
40 
41 #include "extern.h"
42 
43 static int string1[NCHARS] = {
44 	0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,		/* ASCII */
45 	0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
46 	0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
47 	0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f,
48 	0x20, 0x21, 0x22, 0x23, 0x24, 0x25, 0x26, 0x27,
49 	0x28, 0x29, 0x2a, 0x2b, 0x2c, 0x2d, 0x2e, 0x2f,
50 	0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37,
51 	0x38, 0x39, 0x3a, 0x3b, 0x3c, 0x3d, 0x3e, 0x3f,
52 	0x40, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47,
53 	0x48, 0x49, 0x4a, 0x4b, 0x4c, 0x4d, 0x4e, 0x4f,
54 	0x50, 0x51, 0x52, 0x53, 0x54, 0x55, 0x56, 0x57,
55 	0x58, 0x59, 0x5a, 0x5b, 0x5c, 0x5d, 0x5e, 0x5f,
56 	0x60, 0x61, 0x62, 0x63, 0x64, 0x65, 0x66, 0x67,
57 	0x68, 0x69, 0x6a, 0x6b, 0x6c, 0x6d, 0x6e, 0x6f,
58 	0x70, 0x71, 0x72, 0x73, 0x74, 0x75, 0x76, 0x77,
59 	0x78, 0x79, 0x7a, 0x7b, 0x7c, 0x7d, 0x7e, 0x7f,
60 	0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
61 	0x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f,
62 	0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97,
63 	0x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f,
64 	0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
65 	0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf,
66 	0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7,
67 	0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf,
68 	0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7,
69 	0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf,
70 	0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7,
71 	0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf,
72 	0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7,
73 	0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef,
74 	0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7,
75 	0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff,
76 }, string2[NCHARS];
77 
78 STR s1 = { STRING1, NORMAL, 0, OOBCH, { 0, OOBCH }, NULL, NULL };
79 STR s2 = { STRING2, NORMAL, 0, OOBCH, { 0, OOBCH }, NULL, NULL };
80 
81 static void setup(int *, char *, STR *, int);
82 static void usage(void);
83 
84 int
85 main(int argc, char *argv[])
86 {
87 	int ch, cnt, lastch, *p;
88 	int cflag, dflag, sflag, isstring2;
89 
90 	if (pledge("stdio", NULL) == -1)
91 		err(1, "pledge");
92 
93 	cflag = dflag = sflag = 0;
94 	while ((ch = getopt(argc, argv, "Ccds")) != -1)
95 		switch(ch) {
96 		case 'C':
97 		case 'c':
98 			cflag = 1;
99 			break;
100 		case 'd':
101 			dflag = 1;
102 			break;
103 		case 's':
104 			sflag = 1;
105 			break;
106 		case '?':
107 		default:
108 			usage();
109 		}
110 	argc -= optind;
111 	argv += optind;
112 
113 	switch(argc) {
114 	case 0:
115 	default:
116 		usage();
117 		/* NOTREACHED */
118 	case 1:
119 		isstring2 = 0;
120 		break;
121 	case 2:
122 		isstring2 = 1;
123 		break;
124 	}
125 
126 	/*
127 	 * tr -ds [-Cc] string1 string2
128 	 * Delete all characters (or complemented characters) in string1.
129 	 * Squeeze all characters in string2.
130 	 */
131 	if (dflag && sflag) {
132 		if (!isstring2)
133 			usage();
134 
135 		setup(string1, argv[0], &s1, cflag);
136 		setup(string2, argv[1], &s2, 0);
137 
138 		for (lastch = OOBCH; (ch = getchar()) != EOF;)
139 			if (!string1[ch] && (!string2[ch] || lastch != ch)) {
140 				lastch = ch;
141 				(void)putchar(ch);
142 			}
143 		exit(0);
144 	}
145 
146 	/*
147 	 * tr -d [-Cc] string1
148 	 * Delete all characters (or complemented characters) in string1.
149 	 */
150 	if (dflag) {
151 		if (isstring2)
152 			usage();
153 
154 		setup(string1, argv[0], &s1, cflag);
155 
156 		while ((ch = getchar()) != EOF)
157 			if (!string1[ch])
158 				(void)putchar(ch);
159 		exit(0);
160 	}
161 
162 	/*
163 	 * tr -s [-Cc] string1
164 	 * Squeeze all characters (or complemented characters) in string1.
165 	 */
166 	if (sflag && !isstring2) {
167 		setup(string1, argv[0], &s1, cflag);
168 
169 		for (lastch = OOBCH; (ch = getchar()) != EOF;)
170 			if (!string1[ch] || lastch != ch) {
171 				lastch = ch;
172 				(void)putchar(ch);
173 			}
174 		exit(0);
175 	}
176 
177 	/*
178 	 * tr [-Ccs] string1 string2
179 	 * Replace all characters (or complemented characters) in string1 with
180 	 * the character in the same position in string2.  If the -s option is
181 	 * specified, squeeze all the characters in string2.
182 	 */
183 	if (!isstring2)
184 		usage();
185 
186 	s1.str = (unsigned char *)argv[0];
187 	s2.str = (unsigned char *)argv[1];
188 
189 	if (cflag)
190 		for (cnt = NCHARS, p = string1; cnt--;)
191 			*p++ = OOBCH;
192 
193 	if (!next(&s2))
194 		errx(1, "empty string2");
195 
196 	/* If string2 runs out of characters, use the last one specified. */
197 	ch = s2.lastch;
198 	if (sflag)
199 		while (next(&s1)) {
200 			string1[s1.lastch] = ch = s2.lastch;
201 			string2[ch] = 1;
202 			(void)next(&s2);
203 		}
204 	else
205 		while (next(&s1)) {
206 			string1[s1.lastch] = ch = s2.lastch;
207 			(void)next(&s2);
208 		}
209 
210 	if (cflag)
211 		for (cnt = 0, p = string1; cnt < NCHARS; ++p, ++cnt)
212 			*p = *p == OOBCH ? ch : cnt;
213 
214 	if (sflag)
215 		for (lastch = OOBCH; (ch = getchar()) != EOF;) {
216 			ch = string1[ch];
217 			if (!string2[ch] || lastch != ch) {
218 				lastch = ch;
219 				(void)putchar(ch);
220 			}
221 		}
222 	else
223 		while ((ch = getchar()) != EOF)
224 			(void)putchar(string1[ch]);
225 	exit (0);
226 }
227 
228 static void
229 setup(int *string, char *arg, STR *str, int cflag)
230 {
231 	int cnt, *p;
232 
233 	str->str = (unsigned char *)arg;
234 	bzero(string, NCHARS * sizeof(int));
235 	while (next(str))
236 		string[str->lastch] = 1;
237 	if (cflag)
238 		for (p = string, cnt = NCHARS; cnt--; ++p)
239 			*p = !*p;
240 }
241 
/*
 * Write the synopsis of all four invocation forms to standard error and
 * terminate the process with exit status 1.  Does not return.
 */
static void
usage(void)
{
	static const char synopsis[] =
	    "usage: tr [-Ccs] string1 string2\n"
	    "       tr [-Cc] -d string1\n"
	    "       tr [-Cc] -s string1\n"
	    "       tr [-Cc] -ds string1 string2\n";

	(void)fputs(synopsis, stderr);
	exit(1);
}
252