xref: /freebsd/bin/dd/conv_tab.c (revision 3f0164abf32b9b761e0a2cb4bdca3a8b84f156d4)
1 /*-
2  * Copyright (c) 1991, 1993
3  *	The Regents of the University of California.  All rights reserved.
4  *
5  * This code is derived from software contributed to Berkeley by
6  * Keith Muller of the University of California, San Diego and Lance
7  * Visser of Convex Computer Corporation.
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  * 1. Redistributions of source code must retain the above copyright
13  *    notice, this list of conditions and the following disclaimer.
14  * 2. Redistributions in binary form must reproduce the above copyright
15  *    notice, this list of conditions and the following disclaimer in the
16  *    documentation and/or other materials provided with the distribution.
17  * 4. Neither the name of the University nor the names of its contributors
18  *    may be used to endorse or promote products derived from this software
19  *    without specific prior written permission.
20  *
21  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31  * SUCH DAMAGE.
32  */
33 
34 #ifndef lint
35 #if 0
36 static char sccsid[] = "@(#)conv_tab.c	8.1 (Berkeley) 5/31/93";
37 #endif
38 #endif /* not lint */
39 #include <sys/cdefs.h>
40 __FBSDID("$FreeBSD$");
41 
42 #include <sys/types.h>
43 
44 #include <signal.h>
45 #include <stdint.h>
46 
47 #include "dd.h"
48 #include "extern.h"
49 
50 /*
51  * There are currently six tables:
52  *
53  *	ebcdic		-> ascii	32V		conv=oldascii
54  *	ascii		-> ebcdic	32V		conv=oldebcdic
55  *	ascii		-> ibm ebcdic	32V		conv=oldibm
56  *
57  *	ebcdic		-> ascii	POSIX/S5	conv=ascii
58  *	ascii		-> ebcdic	POSIX/S5	conv=ebcdic
59  *	ascii		-> ibm ebcdic	POSIX/S5	conv=ibm
60  *
61  * Other tables are built from these if multiple conversions are being
62  * done.
63  *
64  * Tables used for conversions to/from IBM and EBCDIC to support an extension
65  * to POSIX P1003.2/D11. The tables referencing POSIX contain data extracted
66  * from tables 4-3 and 4-4 in P1003.2/Draft 11.  The historic tables were
67  * constructed by running against a file with all possible byte values.
68  *
69  * More information can be obtained in "Correspondences of 8-Bit and Hollerith
70  * Codes for Computer Environments-A USASI Tutorial", Communications of the
71  * ACM, Volume 11, Number 11, November 1968, pp. 783-789.
72  */
73 
74 u_char casetab[256];
75 
76 /* EBCDIC to ASCII -- 32V compatible. */
77 const u_char e2a_32V[] = {
78 	0000, 0001, 0002, 0003, 0234, 0011, 0206, 0177,		/* 0000 */
79 	0227, 0215, 0216, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
80 	0020, 0021, 0022, 0023, 0235, 0205, 0010, 0207,		/* 0020 */
81 	0030, 0031, 0222, 0217, 0034, 0035, 0036, 0037,		/* 0030 */
82 	0200, 0201, 0202, 0203, 0204, 0012, 0027, 0033,		/* 0040 */
83 	0210, 0211, 0212, 0213, 0214, 0005, 0006, 0007,		/* 0050 */
84 	0220, 0221, 0026, 0223, 0224, 0225, 0226, 0004,		/* 0060 */
85 	0230, 0231, 0232, 0233, 0024, 0025, 0236, 0032,		/* 0070 */
86 	0040, 0240, 0241, 0242, 0243, 0244, 0245, 0246,		/* 0100 */
87 	0247, 0250, 0133, 0056, 0074, 0050, 0053, 0041,		/* 0110 */
88 	0046, 0251, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0120 */
89 	0260, 0261, 0135, 0044, 0052, 0051, 0073, 0136,		/* 0130 */
90 	0055, 0057, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0140 */
91 	0270, 0271, 0174, 0054, 0045, 0137, 0076, 0077,		/* 0150 */
92 	0272, 0273, 0274, 0275, 0276, 0277, 0300, 0301,		/* 0160 */
93 	0302, 0140, 0072, 0043, 0100, 0047, 0075, 0042,		/* 0170 */
94 	0303, 0141, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0200 */
95 	0150, 0151, 0304, 0305, 0306, 0307, 0310, 0311,		/* 0210 */
96 	0312, 0152, 0153, 0154, 0155, 0156, 0157, 0160,		/* 0220 */
97 	0161, 0162, 0313, 0314, 0315, 0316, 0317, 0320,		/* 0230 */
98 	0321, 0176, 0163, 0164, 0165, 0166, 0167, 0170,		/* 0240 */
99 	0171, 0172, 0322, 0323, 0324, 0325, 0326, 0327,		/* 0250 */
100 	0330, 0331, 0332, 0333, 0334, 0335, 0336, 0337,		/* 0260 */
101 	0340, 0341, 0342, 0343, 0344, 0345, 0346, 0347,		/* 0270 */
102 	0173, 0101, 0102, 0103, 0104, 0105, 0106, 0107,		/* 0300 */
103 	0110, 0111, 0350, 0351, 0352, 0353, 0354, 0355,		/* 0310 */
104 	0175, 0112, 0113, 0114, 0115, 0116, 0117, 0120,		/* 0320 */
105 	0121, 0122, 0356, 0357, 0360, 0361, 0362, 0363,		/* 0330 */
106 	0134, 0237, 0123, 0124, 0125, 0126, 0127, 0130,		/* 0340 */
107 	0131, 0132, 0364, 0365, 0366, 0367, 0370, 0371,		/* 0350 */
108 	0060, 0061, 0062, 0063, 0064, 0065, 0066, 0067,		/* 0360 */
109 	0070, 0071, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
110 };
111 
112 /* ASCII to EBCDIC -- 32V compatible. */
113 const u_char a2e_32V[] = {
114 	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
115 	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
116 	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
117 	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
118 	0100, 0117, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
119 	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
120 	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
121 	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
122 	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
123 	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
124 	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
125 	0347, 0350, 0351, 0112, 0340, 0132, 0137, 0155,		/* 0130 */
126 	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
127 	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
128 	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
129 	0247, 0250, 0251, 0300, 0152, 0320, 0241, 0007,		/* 0170 */
130 	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
131 	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
132 	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
133 	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
134 	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
135 	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
136 	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
137 	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
138 	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
139 	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
140 	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
141 	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
142 	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
143 	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
144 	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
145 	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
146 };
147 
148 /* ASCII to IBM EBCDIC -- 32V compatible. */
149 const u_char a2ibm_32V[] = {
150 	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
151 	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
152 	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
153 	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
154 	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
155 	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
156 	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
157 	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
158 	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
159 	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
160 	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
161 	0347, 0350, 0351, 0255, 0340, 0275, 0137, 0155,		/* 0130 */
162 	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
163 	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
164 	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
165 	0247, 0250, 0251, 0300, 0117, 0320, 0241, 0007,		/* 0170 */
166 	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
167 	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
168 	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
169 	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
170 	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
171 	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
172 	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
173 	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
174 	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
175 	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
176 	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
177 	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
178 	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
179 	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
180 	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
181 	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
182 };
183 
184 /* EBCDIC to ASCII -- POSIX and System V compatible. */
185 const u_char e2a_POSIX[] = {
186 	0000, 0001, 0002, 0003, 0234, 0011, 0206, 0177,		/* 0000 */
187 	0227, 0215, 0216, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
188 	0020, 0021, 0022, 0023, 0235, 0205, 0010, 0207,		/* 0020 */
189 	0030, 0031, 0222, 0217, 0034, 0035, 0036, 0037,		/* 0030 */
190 	0200, 0201, 0202, 0203, 0204, 0012, 0027, 0033,		/* 0040 */
191 	0210, 0211, 0212, 0213, 0214, 0005, 0006, 0007,		/* 0050 */
192 	0220, 0221, 0026, 0223, 0224, 0225, 0226, 0004,		/* 0060 */
193 	0230, 0231, 0232, 0233, 0024, 0025, 0236, 0032,		/* 0070 */
194 	0040, 0240, 0241, 0242, 0243, 0244, 0245, 0246,		/* 0100 */
195 	0247, 0250, 0325, 0056, 0074, 0050, 0053, 0174,		/* 0110 */
196 	0046, 0251, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0120 */
197 	0260, 0261, 0041, 0044, 0052, 0051, 0073, 0176,		/* 0130 */
198 	0055, 0057, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0140 */
199 	0270, 0271, 0313, 0054, 0045, 0137, 0076, 0077,		/* 0150 */
200 	0272, 0273, 0274, 0275, 0276, 0277, 0300, 0301,		/* 0160 */
201 	0302, 0140, 0072, 0043, 0100, 0047, 0075, 0042,		/* 0170 */
202 	0303, 0141, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0200 */
203 	0150, 0151, 0304, 0305, 0306, 0307, 0310, 0311,		/* 0210 */
204 	0312, 0152, 0153, 0154, 0155, 0156, 0157, 0160,		/* 0220 */
205 	0161, 0162, 0136, 0314, 0315, 0316, 0317, 0320,		/* 0230 */
206 	0321, 0345, 0163, 0164, 0165, 0166, 0167, 0170,		/* 0240 */
207 	0171, 0172, 0322, 0323, 0324, 0133, 0326, 0327,		/* 0250 */
208 	0330, 0331, 0332, 0333, 0334, 0335, 0336, 0337,		/* 0260 */
209 	0340, 0341, 0342, 0343, 0344, 0135, 0346, 0347,		/* 0270 */
210 	0173, 0101, 0102, 0103, 0104, 0105, 0106, 0107,		/* 0300 */
211 	0110, 0111, 0350, 0351, 0352, 0353, 0354, 0355,		/* 0310 */
212 	0175, 0112, 0113, 0114, 0115, 0116, 0117, 0120,		/* 0320 */
213 	0121, 0122, 0356, 0357, 0360, 0361, 0362, 0363,		/* 0330 */
214 	0134, 0237, 0123, 0124, 0125, 0126, 0127, 0130,		/* 0340 */
215 	0131, 0132, 0364, 0365, 0366, 0367, 0370, 0371,		/* 0350 */
216 	0060, 0061, 0062, 0063, 0064, 0065, 0066, 0067,		/* 0360 */
217 	0070, 0071, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
218 };
219 
220 /* ASCII to EBCDIC -- POSIX and System V compatible. */
221 const u_char a2e_POSIX[] = {
222 	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
223 	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
224 	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
225 	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
226 	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
227 	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
228 	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
229 	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
230 	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
231 	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
232 	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
233 	0347, 0350, 0351, 0255, 0340, 0275, 0232, 0155,		/* 0130 */
234 	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
235 	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
236 	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
237 	0247, 0250, 0251, 0300, 0117, 0320, 0137, 0007,		/* 0170 */
238 	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
239 	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
240 	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
241 	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
242 	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
243 	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
244 	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
245 	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
246 	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
247 	0216, 0217, 0220, 0152, 0233, 0234, 0235, 0236,		/* 0310 */
248 	0237, 0240, 0252, 0253, 0254, 0112, 0256, 0257,		/* 0320 */
249 	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
250 	0270, 0271, 0272, 0273, 0274, 0241, 0276, 0277,		/* 0340 */
251 	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
252 	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
253 	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
254 };
255 
256 /* ASCII to IBM EBCDIC -- POSIX and System V compatible. */
257 const u_char a2ibm_POSIX[] = {
258 	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
259 	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
260 	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
261 	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
262 	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
263 	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
264 	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
265 	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
266 	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
267 	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
268 	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
269 	0347, 0350, 0351, 0255, 0340, 0275, 0137, 0155,		/* 0130 */
270 	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
271 	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
272 	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
273 	0247, 0250, 0251, 0300, 0117, 0320, 0241, 0007,		/* 0170 */
274 	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
275 	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
276 	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
277 	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
278 	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
279 	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
280 	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
281 	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
282 	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
283 	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
284 	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
285 	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
286 	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
287 	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
288 	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
289 	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
290 };
291