xref: /freebsd/bin/dd/conv_tab.c (revision 35b53f8c989f62286aad075ef2e97bba358144f8)
1 /*-
2  * SPDX-License-Identifier: BSD-3-Clause
3  *
4  * Copyright (c) 1991, 1993
5  *	The Regents of the University of California.  All rights reserved.
6  *
7  * This code is derived from software contributed to Berkeley by
8  * Keith Muller of the University of California, San Diego and Lance
9  * Visser of Convex Computer Corporation.
10  *
11  * Redistribution and use in source and binary forms, with or without
12  * modification, are permitted provided that the following conditions
13  * are met:
14  * 1. Redistributions of source code must retain the above copyright
15  *    notice, this list of conditions and the following disclaimer.
16  * 2. Redistributions in binary form must reproduce the above copyright
17  *    notice, this list of conditions and the following disclaimer in the
18  *    documentation and/or other materials provided with the distribution.
19  * 3. Neither the name of the University nor the names of its contributors
20  *    may be used to endorse or promote products derived from this software
21  *    without specific prior written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33  * SUCH DAMAGE.
34  */
35 
36 #include <sys/types.h>
37 
38 #include <signal.h>
39 #include <stdint.h>
40 
41 #include "dd.h"
42 #include "extern.h"
43 
44 /*
45  * There are currently six tables:
46  *
47  *	ebcdic		-> ascii	32V		conv=oldascii
48  *	ascii		-> ebcdic	32V		conv=oldebcdic
49  *	ascii		-> ibm ebcdic	32V		conv=oldibm
50  *
51  *	ebcdic		-> ascii	POSIX/S5	conv=ascii
52  *	ascii		-> ebcdic	POSIX/S5	conv=ebcdic
53  *	ascii		-> ibm ebcdic	POSIX/S5	conv=ibm
54  *
55  * Other tables are built from these if multiple conversions are being
56  * done.
57  *
58  * Tables used for conversions to/from IBM and EBCDIC to support an extension
59  * to POSIX P1003.2/D11. The tables referencing POSIX contain data extracted
60  * from tables 4-3 and 4-4 in P1003.2/Draft 11.  The historic tables were
61  * constructed by running against a file with all possible byte values.
62  *
63  * More information can be obtained in "Correspondences of 8-Bit and Hollerith
64  * Codes for Computer Environments-A USASI Tutorial", Communications of the
65  * ACM, Volume 11, Number 11, November 1968, pp. 783-789.
66  */
67 
68 u_char casetab[256];
69 
70 /* EBCDIC to ASCII -- 32V compatible. */
71 const u_char e2a_32V[] = {
72 	0000, 0001, 0002, 0003, 0234, 0011, 0206, 0177,		/* 0000 */
73 	0227, 0215, 0216, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
74 	0020, 0021, 0022, 0023, 0235, 0205, 0010, 0207,		/* 0020 */
75 	0030, 0031, 0222, 0217, 0034, 0035, 0036, 0037,		/* 0030 */
76 	0200, 0201, 0202, 0203, 0204, 0012, 0027, 0033,		/* 0040 */
77 	0210, 0211, 0212, 0213, 0214, 0005, 0006, 0007,		/* 0050 */
78 	0220, 0221, 0026, 0223, 0224, 0225, 0226, 0004,		/* 0060 */
79 	0230, 0231, 0232, 0233, 0024, 0025, 0236, 0032,		/* 0070 */
80 	0040, 0240, 0241, 0242, 0243, 0244, 0245, 0246,		/* 0100 */
81 	0247, 0250, 0133, 0056, 0074, 0050, 0053, 0041,		/* 0110 */
82 	0046, 0251, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0120 */
83 	0260, 0261, 0135, 0044, 0052, 0051, 0073, 0136,		/* 0130 */
84 	0055, 0057, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0140 */
85 	0270, 0271, 0174, 0054, 0045, 0137, 0076, 0077,		/* 0150 */
86 	0272, 0273, 0274, 0275, 0276, 0277, 0300, 0301,		/* 0160 */
87 	0302, 0140, 0072, 0043, 0100, 0047, 0075, 0042,		/* 0170 */
88 	0303, 0141, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0200 */
89 	0150, 0151, 0304, 0305, 0306, 0307, 0310, 0311,		/* 0210 */
90 	0312, 0152, 0153, 0154, 0155, 0156, 0157, 0160,		/* 0220 */
91 	0161, 0162, 0313, 0314, 0315, 0316, 0317, 0320,		/* 0230 */
92 	0321, 0176, 0163, 0164, 0165, 0166, 0167, 0170,		/* 0240 */
93 	0171, 0172, 0322, 0323, 0324, 0325, 0326, 0327,		/* 0250 */
94 	0330, 0331, 0332, 0333, 0334, 0335, 0336, 0337,		/* 0260 */
95 	0340, 0341, 0342, 0343, 0344, 0345, 0346, 0347,		/* 0270 */
96 	0173, 0101, 0102, 0103, 0104, 0105, 0106, 0107,		/* 0300 */
97 	0110, 0111, 0350, 0351, 0352, 0353, 0354, 0355,		/* 0310 */
98 	0175, 0112, 0113, 0114, 0115, 0116, 0117, 0120,		/* 0320 */
99 	0121, 0122, 0356, 0357, 0360, 0361, 0362, 0363,		/* 0330 */
100 	0134, 0237, 0123, 0124, 0125, 0126, 0127, 0130,		/* 0340 */
101 	0131, 0132, 0364, 0365, 0366, 0367, 0370, 0371,		/* 0350 */
102 	0060, 0061, 0062, 0063, 0064, 0065, 0066, 0067,		/* 0360 */
103 	0070, 0071, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
104 };
105 
106 /* ASCII to EBCDIC -- 32V compatible. */
107 const u_char a2e_32V[] = {
108 	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
109 	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
110 	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
111 	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
112 	0100, 0117, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
113 	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
114 	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
115 	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
116 	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
117 	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
118 	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
119 	0347, 0350, 0351, 0112, 0340, 0132, 0137, 0155,		/* 0130 */
120 	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
121 	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
122 	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
123 	0247, 0250, 0251, 0300, 0152, 0320, 0241, 0007,		/* 0170 */
124 	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
125 	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
126 	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
127 	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
128 	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
129 	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
130 	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
131 	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
132 	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
133 	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
134 	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
135 	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
136 	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
137 	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
138 	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
139 	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
140 };
141 
142 /* ASCII to IBM EBCDIC -- 32V compatible. */
143 const u_char a2ibm_32V[] = {
144 	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
145 	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
146 	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
147 	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
148 	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
149 	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
150 	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
151 	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
152 	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
153 	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
154 	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
155 	0347, 0350, 0351, 0255, 0340, 0275, 0137, 0155,		/* 0130 */
156 	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
157 	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
158 	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
159 	0247, 0250, 0251, 0300, 0117, 0320, 0241, 0007,		/* 0170 */
160 	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
161 	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
162 	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
163 	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
164 	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
165 	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
166 	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
167 	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
168 	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
169 	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
170 	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
171 	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
172 	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
173 	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
174 	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
175 	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
176 };
177 
178 /* EBCDIC to ASCII -- POSIX and System V compatible. */
179 const u_char e2a_POSIX[] = {
180 	0000, 0001, 0002, 0003, 0234, 0011, 0206, 0177,		/* 0000 */
181 	0227, 0215, 0216, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
182 	0020, 0021, 0022, 0023, 0235, 0205, 0010, 0207,		/* 0020 */
183 	0030, 0031, 0222, 0217, 0034, 0035, 0036, 0037,		/* 0030 */
184 	0200, 0201, 0202, 0203, 0204, 0012, 0027, 0033,		/* 0040 */
185 	0210, 0211, 0212, 0213, 0214, 0005, 0006, 0007,		/* 0050 */
186 	0220, 0221, 0026, 0223, 0224, 0225, 0226, 0004,		/* 0060 */
187 	0230, 0231, 0232, 0233, 0024, 0025, 0236, 0032,		/* 0070 */
188 	0040, 0240, 0241, 0242, 0243, 0244, 0245, 0246,		/* 0100 */
189 	0247, 0250, 0325, 0056, 0074, 0050, 0053, 0174,		/* 0110 */
190 	0046, 0251, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0120 */
191 	0260, 0261, 0041, 0044, 0052, 0051, 0073, 0176,		/* 0130 */
192 	0055, 0057, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0140 */
193 	0270, 0271, 0313, 0054, 0045, 0137, 0076, 0077,		/* 0150 */
194 	0272, 0273, 0274, 0275, 0276, 0277, 0300, 0301,		/* 0160 */
195 	0302, 0140, 0072, 0043, 0100, 0047, 0075, 0042,		/* 0170 */
196 	0303, 0141, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0200 */
197 	0150, 0151, 0304, 0305, 0306, 0307, 0310, 0311,		/* 0210 */
198 	0312, 0152, 0153, 0154, 0155, 0156, 0157, 0160,		/* 0220 */
199 	0161, 0162, 0136, 0314, 0315, 0316, 0317, 0320,		/* 0230 */
200 	0321, 0345, 0163, 0164, 0165, 0166, 0167, 0170,		/* 0240 */
201 	0171, 0172, 0322, 0323, 0324, 0133, 0326, 0327,		/* 0250 */
202 	0330, 0331, 0332, 0333, 0334, 0335, 0336, 0337,		/* 0260 */
203 	0340, 0341, 0342, 0343, 0344, 0135, 0346, 0347,		/* 0270 */
204 	0173, 0101, 0102, 0103, 0104, 0105, 0106, 0107,		/* 0300 */
205 	0110, 0111, 0350, 0351, 0352, 0353, 0354, 0355,		/* 0310 */
206 	0175, 0112, 0113, 0114, 0115, 0116, 0117, 0120,		/* 0320 */
207 	0121, 0122, 0356, 0357, 0360, 0361, 0362, 0363,		/* 0330 */
208 	0134, 0237, 0123, 0124, 0125, 0126, 0127, 0130,		/* 0340 */
209 	0131, 0132, 0364, 0365, 0366, 0367, 0370, 0371,		/* 0350 */
210 	0060, 0061, 0062, 0063, 0064, 0065, 0066, 0067,		/* 0360 */
211 	0070, 0071, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
212 };
213 
214 /* ASCII to EBCDIC -- POSIX and System V compatible. */
215 const u_char a2e_POSIX[] = {
216 	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
217 	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
218 	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
219 	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
220 	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
221 	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
222 	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
223 	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
224 	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
225 	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
226 	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
227 	0347, 0350, 0351, 0255, 0340, 0275, 0232, 0155,		/* 0130 */
228 	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
229 	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
230 	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
231 	0247, 0250, 0251, 0300, 0117, 0320, 0137, 0007,		/* 0170 */
232 	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
233 	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
234 	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
235 	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
236 	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
237 	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
238 	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
239 	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
240 	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
241 	0216, 0217, 0220, 0152, 0233, 0234, 0235, 0236,		/* 0310 */
242 	0237, 0240, 0252, 0253, 0254, 0112, 0256, 0257,		/* 0320 */
243 	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
244 	0270, 0271, 0272, 0273, 0274, 0241, 0276, 0277,		/* 0340 */
245 	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
246 	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
247 	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
248 };
249 
250 /* ASCII to IBM EBCDIC -- POSIX and System V compatible. */
251 const u_char a2ibm_POSIX[] = {
252 	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
253 	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
254 	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
255 	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
256 	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
257 	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
258 	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
259 	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
260 	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
261 	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
262 	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
263 	0347, 0350, 0351, 0255, 0340, 0275, 0137, 0155,		/* 0130 */
264 	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
265 	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
266 	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
267 	0247, 0250, 0251, 0300, 0117, 0320, 0241, 0007,		/* 0170 */
268 	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
269 	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
270 	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
271 	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
272 	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
273 	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
274 	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
275 	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
276 	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
277 	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
278 	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
279 	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
280 	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
281 	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
282 	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
283 	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
284 };
285