xref: /freebsd/bin/dd/conv_tab.c (revision bdcbfde31e8e9b343f113a1956384bdf30d1ed62)
1 /*-
2  * SPDX-License-Identifier: BSD-3-Clause
3  *
4  * Copyright (c) 1991, 1993
5  *	The Regents of the University of California.  All rights reserved.
6  *
7  * This code is derived from software contributed to Berkeley by
8  * Keith Muller of the University of California, San Diego and Lance
9  * Visser of Convex Computer Corporation.
10  *
11  * Redistribution and use in source and binary forms, with or without
12  * modification, are permitted provided that the following conditions
13  * are met:
14  * 1. Redistributions of source code must retain the above copyright
15  *    notice, this list of conditions and the following disclaimer.
16  * 2. Redistributions in binary form must reproduce the above copyright
17  *    notice, this list of conditions and the following disclaimer in the
18  *    documentation and/or other materials provided with the distribution.
19  * 3. Neither the name of the University nor the names of its contributors
20  *    may be used to endorse or promote products derived from this software
21  *    without specific prior written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33  * SUCH DAMAGE.
34  */
35 
36 #ifndef lint
37 #endif /* not lint */
38 #include <sys/cdefs.h>
39 #include <sys/types.h>
40 
41 #include <signal.h>
42 #include <stdint.h>
43 
44 #include "dd.h"
45 #include "extern.h"
46 
47 /*
48  * There are currently six tables:
49  *
50  *	ebcdic		-> ascii	32V		conv=oldascii
51  *	ascii		-> ebcdic	32V		conv=oldebcdic
52  *	ascii		-> ibm ebcdic	32V		conv=oldibm
53  *
54  *	ebcdic		-> ascii	POSIX/S5	conv=ascii
55  *	ascii		-> ebcdic	POSIX/S5	conv=ebcdic
56  *	ascii		-> ibm ebcdic	POSIX/S5	conv=ibm
57  *
58  * Other tables are built from these if multiple conversions are being
59  * done.
60  *
61  * The tables convert to/from IBM and EBCDIC in order to support an extension
62  * to POSIX P1003.2/D11. The tables referencing POSIX contain data extracted
63  * from tables 4-3 and 4-4 in P1003.2/Draft 11.  The historic tables were
64  * constructed by running against a file with all possible byte values.
65  *
66  * More information can be obtained in "Correspondences of 8-Bit and Hollerith
67  * Codes for Computer Environments-A USASI Tutorial", Communications of the
68  * ACM, Volume 11, Number 11, November 1968, pp. 783-789.
69  */
70 
/*
 * Writable 256-entry byte table.  It has no initializer, so it starts out
 * all zero, and nothing in this file stores into it.
 * NOTE(review): presumably the upper/lower-case mapping that is filled in
 * elsewhere at run time -- confirm against the code that writes it.
 */
71 u_char casetab[256];
72 
73 /*
 * EBCDIC to ASCII -- 32V compatible (listed above as conv=oldascii).
 *
 * 256 octal entries: entry i holds the ASCII code for EBCDIC byte i
 * (e.g. entry 0100 is 0040, space; entry 0301 is 0101, 'A').  The comment
 * ending each row is the octal index of that row's first entry.
 */
74 const u_char e2a_32V[] = {
75 	0000, 0001, 0002, 0003, 0234, 0011, 0206, 0177,		/* 0000 */
76 	0227, 0215, 0216, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
77 	0020, 0021, 0022, 0023, 0235, 0205, 0010, 0207,		/* 0020 */
78 	0030, 0031, 0222, 0217, 0034, 0035, 0036, 0037,		/* 0030 */
79 	0200, 0201, 0202, 0203, 0204, 0012, 0027, 0033,		/* 0040 */
80 	0210, 0211, 0212, 0213, 0214, 0005, 0006, 0007,		/* 0050 */
81 	0220, 0221, 0026, 0223, 0224, 0225, 0226, 0004,		/* 0060 */
82 	0230, 0231, 0232, 0233, 0024, 0025, 0236, 0032,		/* 0070 */
83 	0040, 0240, 0241, 0242, 0243, 0244, 0245, 0246,		/* 0100 */
84 	0247, 0250, 0133, 0056, 0074, 0050, 0053, 0041,		/* 0110 */
85 	0046, 0251, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0120 */
86 	0260, 0261, 0135, 0044, 0052, 0051, 0073, 0136,		/* 0130 */
87 	0055, 0057, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0140 */
88 	0270, 0271, 0174, 0054, 0045, 0137, 0076, 0077,		/* 0150 */
89 	0272, 0273, 0274, 0275, 0276, 0277, 0300, 0301,		/* 0160 */
90 	0302, 0140, 0072, 0043, 0100, 0047, 0075, 0042,		/* 0170 */
91 	0303, 0141, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0200 */
92 	0150, 0151, 0304, 0305, 0306, 0307, 0310, 0311,		/* 0210 */
93 	0312, 0152, 0153, 0154, 0155, 0156, 0157, 0160,		/* 0220 */
94 	0161, 0162, 0313, 0314, 0315, 0316, 0317, 0320,		/* 0230 */
95 	0321, 0176, 0163, 0164, 0165, 0166, 0167, 0170,		/* 0240 */
96 	0171, 0172, 0322, 0323, 0324, 0325, 0326, 0327,		/* 0250 */
97 	0330, 0331, 0332, 0333, 0334, 0335, 0336, 0337,		/* 0260 */
98 	0340, 0341, 0342, 0343, 0344, 0345, 0346, 0347,		/* 0270 */
99 	0173, 0101, 0102, 0103, 0104, 0105, 0106, 0107,		/* 0300 */
100 	0110, 0111, 0350, 0351, 0352, 0353, 0354, 0355,		/* 0310 */
101 	0175, 0112, 0113, 0114, 0115, 0116, 0117, 0120,		/* 0320 */
102 	0121, 0122, 0356, 0357, 0360, 0361, 0362, 0363,		/* 0330 */
103 	0134, 0237, 0123, 0124, 0125, 0126, 0127, 0130,		/* 0340 */
104 	0131, 0132, 0364, 0365, 0366, 0367, 0370, 0371,		/* 0350 */
105 	0060, 0061, 0062, 0063, 0064, 0065, 0066, 0067,		/* 0360 */
106 	0070, 0071, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
107 };
108 
109 /*
 * ASCII to EBCDIC -- 32V compatible (listed above as conv=oldebcdic).
 *
 * 256 octal entries: entry i holds the EBCDIC code for ASCII byte i
 * (e.g. entry 0040, space, is 0100; entry 0101, 'A', is 0301).  The comment
 * ending each row is the octal index of that row's first entry.
 */
110 const u_char a2e_32V[] = {
111 	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
112 	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
113 	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
114 	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
115 	0100, 0117, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
116 	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
117 	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
118 	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
119 	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
120 	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
121 	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
122 	0347, 0350, 0351, 0112, 0340, 0132, 0137, 0155,		/* 0130 */
123 	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
124 	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
125 	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
126 	0247, 0250, 0251, 0300, 0152, 0320, 0241, 0007,		/* 0170 */
127 	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
128 	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
129 	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
130 	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
131 	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
132 	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
133 	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
134 	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
135 	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
136 	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
137 	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
138 	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
139 	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
140 	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
141 	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
142 	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
143 };
144 
145 /*
 * ASCII to IBM EBCDIC -- 32V compatible (listed above as conv=oldibm).
 *
 * 256 octal entries: entry i holds the IBM EBCDIC code for ASCII byte i.
 * The comment ending each row is the octal index of that row's first entry.
 * Differs from a2e_32V only at indices 041 ('!'), 0133 ('['), 0135 (']')
 * and 0174 ('|').
 */
146 const u_char a2ibm_32V[] = {
147 	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
148 	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
149 	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
150 	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
151 	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
152 	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
153 	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
154 	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
155 	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
156 	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
157 	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
158 	0347, 0350, 0351, 0255, 0340, 0275, 0137, 0155,		/* 0130 */
159 	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
160 	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
161 	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
162 	0247, 0250, 0251, 0300, 0117, 0320, 0241, 0007,		/* 0170 */
163 	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
164 	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
165 	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
166 	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
167 	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
168 	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
169 	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
170 	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
171 	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
172 	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
173 	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
174 	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
175 	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
176 	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
177 	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
178 	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
179 };
180 
181 /*
 * EBCDIC to ASCII -- POSIX and System V compatible (listed above as
 * conv=ascii).
 *
 * 256 octal entries: entry i holds the ASCII code for EBCDIC byte i.
 * The comment ending each row is the octal index of that row's first entry.
 * Differs from e2a_32V at nine indices: 0112, 0117, 0132, 0137, 0152,
 * 0232, 0241, 0255 and 0275.
 */
182 const u_char e2a_POSIX[] = {
183 	0000, 0001, 0002, 0003, 0234, 0011, 0206, 0177,		/* 0000 */
184 	0227, 0215, 0216, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
185 	0020, 0021, 0022, 0023, 0235, 0205, 0010, 0207,		/* 0020 */
186 	0030, 0031, 0222, 0217, 0034, 0035, 0036, 0037,		/* 0030 */
187 	0200, 0201, 0202, 0203, 0204, 0012, 0027, 0033,		/* 0040 */
188 	0210, 0211, 0212, 0213, 0214, 0005, 0006, 0007,		/* 0050 */
189 	0220, 0221, 0026, 0223, 0224, 0225, 0226, 0004,		/* 0060 */
190 	0230, 0231, 0232, 0233, 0024, 0025, 0236, 0032,		/* 0070 */
191 	0040, 0240, 0241, 0242, 0243, 0244, 0245, 0246,		/* 0100 */
192 	0247, 0250, 0325, 0056, 0074, 0050, 0053, 0174,		/* 0110 */
193 	0046, 0251, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0120 */
194 	0260, 0261, 0041, 0044, 0052, 0051, 0073, 0176,		/* 0130 */
195 	0055, 0057, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0140 */
196 	0270, 0271, 0313, 0054, 0045, 0137, 0076, 0077,		/* 0150 */
197 	0272, 0273, 0274, 0275, 0276, 0277, 0300, 0301,		/* 0160 */
198 	0302, 0140, 0072, 0043, 0100, 0047, 0075, 0042,		/* 0170 */
199 	0303, 0141, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0200 */
200 	0150, 0151, 0304, 0305, 0306, 0307, 0310, 0311,		/* 0210 */
201 	0312, 0152, 0153, 0154, 0155, 0156, 0157, 0160,		/* 0220 */
202 	0161, 0162, 0136, 0314, 0315, 0316, 0317, 0320,		/* 0230 */
203 	0321, 0345, 0163, 0164, 0165, 0166, 0167, 0170,		/* 0240 */
204 	0171, 0172, 0322, 0323, 0324, 0133, 0326, 0327,		/* 0250 */
205 	0330, 0331, 0332, 0333, 0334, 0335, 0336, 0337,		/* 0260 */
206 	0340, 0341, 0342, 0343, 0344, 0135, 0346, 0347,		/* 0270 */
207 	0173, 0101, 0102, 0103, 0104, 0105, 0106, 0107,		/* 0300 */
208 	0110, 0111, 0350, 0351, 0352, 0353, 0354, 0355,		/* 0310 */
209 	0175, 0112, 0113, 0114, 0115, 0116, 0117, 0120,		/* 0320 */
210 	0121, 0122, 0356, 0357, 0360, 0361, 0362, 0363,		/* 0330 */
211 	0134, 0237, 0123, 0124, 0125, 0126, 0127, 0130,		/* 0340 */
212 	0131, 0132, 0364, 0365, 0366, 0367, 0370, 0371,		/* 0350 */
213 	0060, 0061, 0062, 0063, 0064, 0065, 0066, 0067,		/* 0360 */
214 	0070, 0071, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
215 };
216 
217 /*
 * ASCII to EBCDIC -- POSIX and System V compatible (listed above as
 * conv=ebcdic).
 *
 * 256 octal entries: entry i holds the EBCDIC code for ASCII byte i.
 * The comment ending each row is the octal index of that row's first entry.
 * Differs from a2ibm_POSIX at five indices: 0136 ('^'), 0176 ('~'), 0313,
 * 0325 and 0345.
 */
218 const u_char a2e_POSIX[] = {
219 	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
220 	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
221 	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
222 	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
223 	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
224 	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
225 	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
226 	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
227 	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
228 	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
229 	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
230 	0347, 0350, 0351, 0255, 0340, 0275, 0232, 0155,		/* 0130 */
231 	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
232 	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
233 	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
234 	0247, 0250, 0251, 0300, 0117, 0320, 0137, 0007,		/* 0170 */
235 	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
236 	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
237 	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
238 	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
239 	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
240 	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
241 	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
242 	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
243 	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
244 	0216, 0217, 0220, 0152, 0233, 0234, 0235, 0236,		/* 0310 */
245 	0237, 0240, 0252, 0253, 0254, 0112, 0256, 0257,		/* 0320 */
246 	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
247 	0270, 0271, 0272, 0273, 0274, 0241, 0276, 0277,		/* 0340 */
248 	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
249 	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
250 	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
251 };
252 
253 /*
 * ASCII to IBM EBCDIC -- POSIX and System V compatible (listed above as
 * conv=ibm).
 *
 * 256 octal entries: entry i holds the IBM EBCDIC code for ASCII byte i.
 * The comment ending each row is the octal index of that row's first entry.
 * As written here, every entry has the same value as the corresponding
 * entry of a2ibm_32V.
 */
254 const u_char a2ibm_POSIX[] = {
255 	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
256 	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
257 	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
258 	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
259 	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
260 	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
261 	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
262 	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
263 	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
264 	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
265 	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
266 	0347, 0350, 0351, 0255, 0340, 0275, 0137, 0155,		/* 0130 */
267 	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
268 	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
269 	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
270 	0247, 0250, 0251, 0300, 0117, 0320, 0241, 0007,		/* 0170 */
271 	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
272 	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
273 	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
274 	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
275 	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
276 	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
277 	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
278 	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
279 	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
280 	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
281 	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
282 	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
283 	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
284 	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
285 	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
286 	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
287 };
288