xref: /freebsd/bin/dd/conv_tab.c (revision 0957b409)
1 /*-
2  * SPDX-License-Identifier: BSD-3-Clause
3  *
4  * Copyright (c) 1991, 1993
5  *	The Regents of the University of California.  All rights reserved.
6  *
7  * This code is derived from software contributed to Berkeley by
8  * Keith Muller of the University of California, San Diego and Lance
9  * Visser of Convex Computer Corporation.
10  *
11  * Redistribution and use in source and binary forms, with or without
12  * modification, are permitted provided that the following conditions
13  * are met:
14  * 1. Redistributions of source code must retain the above copyright
15  *    notice, this list of conditions and the following disclaimer.
16  * 2. Redistributions in binary form must reproduce the above copyright
17  *    notice, this list of conditions and the following disclaimer in the
18  *    documentation and/or other materials provided with the distribution.
19  * 3. Neither the name of the University nor the names of its contributors
20  *    may be used to endorse or promote products derived from this software
21  *    without specific prior written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33  * SUCH DAMAGE.
34  */
35 
36 #ifndef lint
37 #if 0
38 static char sccsid[] = "@(#)conv_tab.c	8.1 (Berkeley) 5/31/93";
39 #endif
40 #endif /* not lint */
41 #include <sys/cdefs.h>
42 __FBSDID("$FreeBSD$");
43 
44 #include <sys/types.h>
45 
46 #include <signal.h>
47 #include <stdint.h>
48 
49 #include "dd.h"
50 #include "extern.h"
51 
52 /*
53  * There are currently six tables:
54  *
55  *	ebcdic		-> ascii	32V		conv=oldascii
56  *	ascii		-> ebcdic	32V		conv=oldebcdic
57  *	ascii		-> ibm ebcdic	32V		conv=oldibm
58  *
59  *	ebcdic		-> ascii	POSIX/S5	conv=ascii
60  *	ascii		-> ebcdic	POSIX/S5	conv=ebcdic
61  *	ascii		-> ibm ebcdic	POSIX/S5	conv=ibm
62  *
63  * Other tables are built from these if multiple conversions are being
64  * done.
65  *
66  * Tables used for conversions to/from IBM and EBCDIC to support an extension
67  * to POSIX P1003.2/D11. The tables referencing POSIX contain data extracted
68  * from tables 4-3 and 4-4 in P1003.2/Draft 11.  The historic tables were
 * constructed by running the historic conversions against a file containing
 * all possible byte values.
70  *
71  * More information can be obtained in "Correspondences of 8-Bit and Hollerith
72  * Codes for Computer Environments-A USASI Tutorial", Communications of the
73  * ACM, Volume 11, Number 11, November 1968, pp. 783-789.
74  */
75 
/*
 * Writable 256-entry byte table, one slot per possible u_char value.
 * It has static storage duration and no initializer, so it starts out
 * all zero; nothing in this file fills it in.
 * NOTE(review): presumably populated elsewhere as a case-folding /
 * combined translation table -- confirm against the callers.
 */
u_char casetab[256];
77 
/*
 * EBCDIC to ASCII -- 32V compatible (conv=oldascii).
 *
 * Entry i holds the ASCII code that EBCDIC byte i translates to.  All
 * values are written in octal, and the trailing comment on each row is
 * the octal index of that row's first entry.
 *
 * The bound is spelled out (matching casetab) so the table always spans
 * every possible u_char index and a surplus initializer is diagnosed at
 * compile time.
 */
const u_char e2a_32V[256] = {
	0000, 0001, 0002, 0003, 0234, 0011, 0206, 0177,		/* 0000 */
	0227, 0215, 0216, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
	0020, 0021, 0022, 0023, 0235, 0205, 0010, 0207,		/* 0020 */
	0030, 0031, 0222, 0217, 0034, 0035, 0036, 0037,		/* 0030 */
	0200, 0201, 0202, 0203, 0204, 0012, 0027, 0033,		/* 0040 */
	0210, 0211, 0212, 0213, 0214, 0005, 0006, 0007,		/* 0050 */
	0220, 0221, 0026, 0223, 0224, 0225, 0226, 0004,		/* 0060 */
	0230, 0231, 0232, 0233, 0024, 0025, 0236, 0032,		/* 0070 */
	0040, 0240, 0241, 0242, 0243, 0244, 0245, 0246,		/* 0100 */
	0247, 0250, 0133, 0056, 0074, 0050, 0053, 0041,		/* 0110 */
	0046, 0251, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0120 */
	0260, 0261, 0135, 0044, 0052, 0051, 0073, 0136,		/* 0130 */
	0055, 0057, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0140 */
	0270, 0271, 0174, 0054, 0045, 0137, 0076, 0077,		/* 0150 */
	0272, 0273, 0274, 0275, 0276, 0277, 0300, 0301,		/* 0160 */
	0302, 0140, 0072, 0043, 0100, 0047, 0075, 0042,		/* 0170 */
	0303, 0141, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0200 */
	0150, 0151, 0304, 0305, 0306, 0307, 0310, 0311,		/* 0210 */
	0312, 0152, 0153, 0154, 0155, 0156, 0157, 0160,		/* 0220 */
	0161, 0162, 0313, 0314, 0315, 0316, 0317, 0320,		/* 0230 */
	0321, 0176, 0163, 0164, 0165, 0166, 0167, 0170,		/* 0240 */
	0171, 0172, 0322, 0323, 0324, 0325, 0326, 0327,		/* 0250 */
	0330, 0331, 0332, 0333, 0334, 0335, 0336, 0337,		/* 0260 */
	0340, 0341, 0342, 0343, 0344, 0345, 0346, 0347,		/* 0270 */
	0173, 0101, 0102, 0103, 0104, 0105, 0106, 0107,		/* 0300 */
	0110, 0111, 0350, 0351, 0352, 0353, 0354, 0355,		/* 0310 */
	0175, 0112, 0113, 0114, 0115, 0116, 0117, 0120,		/* 0320 */
	0121, 0122, 0356, 0357, 0360, 0361, 0362, 0363,		/* 0330 */
	0134, 0237, 0123, 0124, 0125, 0126, 0127, 0130,		/* 0340 */
	0131, 0132, 0364, 0365, 0366, 0367, 0370, 0371,		/* 0350 */
	0060, 0061, 0062, 0063, 0064, 0065, 0066, 0067,		/* 0360 */
	0070, 0071, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
};
113 
/*
 * ASCII to EBCDIC -- 32V compatible (conv=oldebcdic).
 *
 * Entry i holds the EBCDIC code that ASCII byte i translates to.  All
 * values are written in octal, and the trailing comment on each row is
 * the octal index of that row's first entry.
 *
 * The bound is spelled out (matching casetab) so the table always spans
 * every possible u_char index and a surplus initializer is diagnosed at
 * compile time.
 */
const u_char a2e_32V[256] = {
	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
	0100, 0117, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
	0347, 0350, 0351, 0112, 0340, 0132, 0137, 0155,		/* 0130 */
	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
	0247, 0250, 0251, 0300, 0152, 0320, 0241, 0007,		/* 0170 */
	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
};
149 
/*
 * ASCII to IBM EBCDIC -- 32V compatible (conv=oldibm).
 *
 * Entry i holds the IBM EBCDIC code that ASCII byte i translates to.
 * All values are written in octal, and the trailing comment on each row
 * is the octal index of that row's first entry.
 *
 * Compared with a2e_32V only four entries differ: indices 0041 ('!'),
 * 0133 ('['), 0135 (']') and 0174 ('|').
 *
 * The bound is spelled out (matching casetab) so the table always spans
 * every possible u_char index and a surplus initializer is diagnosed at
 * compile time.
 */
const u_char a2ibm_32V[256] = {
	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
	0347, 0350, 0351, 0255, 0340, 0275, 0137, 0155,		/* 0130 */
	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
	0247, 0250, 0251, 0300, 0117, 0320, 0241, 0007,		/* 0170 */
	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
};
185 
/*
 * EBCDIC to ASCII -- POSIX and System V compatible (conv=ascii).
 *
 * Entry i holds the ASCII code that EBCDIC byte i translates to.  All
 * values are written in octal, and the trailing comment on each row is
 * the octal index of that row's first entry.
 *
 * The bound is spelled out (matching casetab) so the table always spans
 * every possible u_char index and a surplus initializer is diagnosed at
 * compile time.
 */
const u_char e2a_POSIX[256] = {
	0000, 0001, 0002, 0003, 0234, 0011, 0206, 0177,		/* 0000 */
	0227, 0215, 0216, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
	0020, 0021, 0022, 0023, 0235, 0205, 0010, 0207,		/* 0020 */
	0030, 0031, 0222, 0217, 0034, 0035, 0036, 0037,		/* 0030 */
	0200, 0201, 0202, 0203, 0204, 0012, 0027, 0033,		/* 0040 */
	0210, 0211, 0212, 0213, 0214, 0005, 0006, 0007,		/* 0050 */
	0220, 0221, 0026, 0223, 0224, 0225, 0226, 0004,		/* 0060 */
	0230, 0231, 0232, 0233, 0024, 0025, 0236, 0032,		/* 0070 */
	0040, 0240, 0241, 0242, 0243, 0244, 0245, 0246,		/* 0100 */
	0247, 0250, 0325, 0056, 0074, 0050, 0053, 0174,		/* 0110 */
	0046, 0251, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0120 */
	0260, 0261, 0041, 0044, 0052, 0051, 0073, 0176,		/* 0130 */
	0055, 0057, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0140 */
	0270, 0271, 0313, 0054, 0045, 0137, 0076, 0077,		/* 0150 */
	0272, 0273, 0274, 0275, 0276, 0277, 0300, 0301,		/* 0160 */
	0302, 0140, 0072, 0043, 0100, 0047, 0075, 0042,		/* 0170 */
	0303, 0141, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0200 */
	0150, 0151, 0304, 0305, 0306, 0307, 0310, 0311,		/* 0210 */
	0312, 0152, 0153, 0154, 0155, 0156, 0157, 0160,		/* 0220 */
	0161, 0162, 0136, 0314, 0315, 0316, 0317, 0320,		/* 0230 */
	0321, 0345, 0163, 0164, 0165, 0166, 0167, 0170,		/* 0240 */
	0171, 0172, 0322, 0323, 0324, 0133, 0326, 0327,		/* 0250 */
	0330, 0331, 0332, 0333, 0334, 0335, 0336, 0337,		/* 0260 */
	0340, 0341, 0342, 0343, 0344, 0135, 0346, 0347,		/* 0270 */
	0173, 0101, 0102, 0103, 0104, 0105, 0106, 0107,		/* 0300 */
	0110, 0111, 0350, 0351, 0352, 0353, 0354, 0355,		/* 0310 */
	0175, 0112, 0113, 0114, 0115, 0116, 0117, 0120,		/* 0320 */
	0121, 0122, 0356, 0357, 0360, 0361, 0362, 0363,		/* 0330 */
	0134, 0237, 0123, 0124, 0125, 0126, 0127, 0130,		/* 0340 */
	0131, 0132, 0364, 0365, 0366, 0367, 0370, 0371,		/* 0350 */
	0060, 0061, 0062, 0063, 0064, 0065, 0066, 0067,		/* 0360 */
	0070, 0071, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
};
221 
/*
 * ASCII to EBCDIC -- POSIX and System V compatible (conv=ebcdic).
 *
 * Entry i holds the EBCDIC code that ASCII byte i translates to.  All
 * values are written in octal, and the trailing comment on each row is
 * the octal index of that row's first entry.
 *
 * The bound is spelled out (matching casetab) so the table always spans
 * every possible u_char index and a surplus initializer is diagnosed at
 * compile time.
 */
const u_char a2e_POSIX[256] = {
	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
	0347, 0350, 0351, 0255, 0340, 0275, 0232, 0155,		/* 0130 */
	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
	0247, 0250, 0251, 0300, 0117, 0320, 0137, 0007,		/* 0170 */
	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
	0216, 0217, 0220, 0152, 0233, 0234, 0235, 0236,		/* 0310 */
	0237, 0240, 0252, 0253, 0254, 0112, 0256, 0257,		/* 0320 */
	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
	0270, 0271, 0272, 0273, 0274, 0241, 0276, 0277,		/* 0340 */
	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
};
257 
/*
 * ASCII to IBM EBCDIC -- POSIX and System V compatible (conv=ibm).
 *
 * Entry i holds the IBM EBCDIC code that ASCII byte i translates to.
 * All values are written in octal, and the trailing comment on each row
 * is the octal index of that row's first entry.
 *
 * In this revision every entry is the same as the corresponding entry
 * of a2ibm_32V.
 *
 * The bound is spelled out (matching casetab) so the table always spans
 * every possible u_char index and a surplus initializer is diagnosed at
 * compile time.
 */
const u_char a2ibm_POSIX[256] = {
	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
	0347, 0350, 0351, 0255, 0340, 0275, 0137, 0155,		/* 0130 */
	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
	0247, 0250, 0251, 0300, 0117, 0320, 0241, 0007,		/* 0170 */
	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
};
293