1/*-
2 * SPDX-License-Identifier: BSD-3-Clause
3 *
4 * Copyright (c) 1991, 1993
5 *	The Regents of the University of California.  All rights reserved.
6 *
7 * This code is derived from software contributed to Berkeley by
8 * Keith Muller of the University of California, San Diego and Lance
9 * Visser of Convex Computer Corporation.
10 *
11 * Redistribution and use in source and binary forms, with or without
12 * modification, are permitted provided that the following conditions
13 * are met:
14 * 1. Redistributions of source code must retain the above copyright
15 *    notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 *    notice, this list of conditions and the following disclaimer in the
18 *    documentation and/or other materials provided with the distribution.
19 * 3. Neither the name of the University nor the names of its contributors
20 *    may be used to endorse or promote products derived from this software
21 *    without specific prior written permission.
22 *
23 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 * SUCH DAMAGE.
34 */
35
36#include <sys/types.h>
37
38#include <signal.h>
39#include <stdint.h>
40
41#include "dd.h"
42#include "extern.h"
43
44/*
45 * There are currently six tables:
46 *
47 *	ebcdic		-> ascii	32V		conv=oldascii
48 *	ascii		-> ebcdic	32V		conv=oldebcdic
49 *	ascii		-> ibm ebcdic	32V		conv=oldibm
50 *
51 *	ebcdic		-> ascii	POSIX/S5	conv=ascii
52 *	ascii		-> ebcdic	POSIX/S5	conv=ebcdic
53 *	ascii		-> ibm ebcdic	POSIX/S5	conv=ibm
54 *
55 * Other tables are built from these if multiple conversions are being
56 * done.
57 *
58 * Tables used for conversions to/from IBM and EBCDIC to support an extension
59 * to POSIX P1003.2/D11. The tables referencing POSIX contain data extracted
60 * from tables 4-3 and 4-4 in P1003.2/Draft 11.  The historic tables were
61 * constructed by running against a file with all possible byte values.
62 *
63 * More information can be obtained in "Correspondences of 8-Bit and Hollerith
64 * Codes for Computer Environments-A USASI Tutorial", Communications of the
65 * ACM, Volume 11, Number 11, November 1968, pp. 783-789.
66 */
67
68u_char casetab[256];
69
70/* EBCDIC to ASCII -- 32V compatible. */
71const u_char e2a_32V[] = {
72	0000, 0001, 0002, 0003, 0234, 0011, 0206, 0177,		/* 0000 */
73	0227, 0215, 0216, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
74	0020, 0021, 0022, 0023, 0235, 0205, 0010, 0207,		/* 0020 */
75	0030, 0031, 0222, 0217, 0034, 0035, 0036, 0037,		/* 0030 */
76	0200, 0201, 0202, 0203, 0204, 0012, 0027, 0033,		/* 0040 */
77	0210, 0211, 0212, 0213, 0214, 0005, 0006, 0007,		/* 0050 */
78	0220, 0221, 0026, 0223, 0224, 0225, 0226, 0004,		/* 0060 */
79	0230, 0231, 0232, 0233, 0024, 0025, 0236, 0032,		/* 0070 */
80	0040, 0240, 0241, 0242, 0243, 0244, 0245, 0246,		/* 0100 */
81	0247, 0250, 0133, 0056, 0074, 0050, 0053, 0041,		/* 0110 */
82	0046, 0251, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0120 */
83	0260, 0261, 0135, 0044, 0052, 0051, 0073, 0136,		/* 0130 */
84	0055, 0057, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0140 */
85	0270, 0271, 0174, 0054, 0045, 0137, 0076, 0077,		/* 0150 */
86	0272, 0273, 0274, 0275, 0276, 0277, 0300, 0301,		/* 0160 */
87	0302, 0140, 0072, 0043, 0100, 0047, 0075, 0042,		/* 0170 */
88	0303, 0141, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0200 */
89	0150, 0151, 0304, 0305, 0306, 0307, 0310, 0311,		/* 0210 */
90	0312, 0152, 0153, 0154, 0155, 0156, 0157, 0160,		/* 0220 */
91	0161, 0162, 0313, 0314, 0315, 0316, 0317, 0320,		/* 0230 */
92	0321, 0176, 0163, 0164, 0165, 0166, 0167, 0170,		/* 0240 */
93	0171, 0172, 0322, 0323, 0324, 0325, 0326, 0327,		/* 0250 */
94	0330, 0331, 0332, 0333, 0334, 0335, 0336, 0337,		/* 0260 */
95	0340, 0341, 0342, 0343, 0344, 0345, 0346, 0347,		/* 0270 */
96	0173, 0101, 0102, 0103, 0104, 0105, 0106, 0107,		/* 0300 */
97	0110, 0111, 0350, 0351, 0352, 0353, 0354, 0355,		/* 0310 */
98	0175, 0112, 0113, 0114, 0115, 0116, 0117, 0120,		/* 0320 */
99	0121, 0122, 0356, 0357, 0360, 0361, 0362, 0363,		/* 0330 */
100	0134, 0237, 0123, 0124, 0125, 0126, 0127, 0130,		/* 0340 */
101	0131, 0132, 0364, 0365, 0366, 0367, 0370, 0371,		/* 0350 */
102	0060, 0061, 0062, 0063, 0064, 0065, 0066, 0067,		/* 0360 */
103	0070, 0071, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
104};
105
106/* ASCII to EBCDIC -- 32V compatible. */
107const u_char a2e_32V[] = {
108	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
109	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
110	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
111	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
112	0100, 0117, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
113	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
114	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
115	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
116	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
117	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
118	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
119	0347, 0350, 0351, 0112, 0340, 0132, 0137, 0155,		/* 0130 */
120	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
121	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
122	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
123	0247, 0250, 0251, 0300, 0152, 0320, 0241, 0007,		/* 0170 */
124	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
125	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
126	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
127	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
128	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
129	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
130	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
131	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
132	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
133	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
134	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
135	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
136	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
137	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
138	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
139	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
140};
141
142/* ASCII to IBM EBCDIC -- 32V compatible. */
143const u_char a2ibm_32V[] = {
144	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
145	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
146	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
147	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
148	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
149	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
150	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
151	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
152	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
153	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
154	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
155	0347, 0350, 0351, 0255, 0340, 0275, 0137, 0155,		/* 0130 */
156	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
157	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
158	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
159	0247, 0250, 0251, 0300, 0117, 0320, 0241, 0007,		/* 0170 */
160	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
161	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
162	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
163	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
164	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
165	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
166	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
167	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
168	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
169	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
170	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
171	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
172	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
173	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
174	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
175	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
176};
177
178/* EBCDIC to ASCII -- POSIX and System V compatible. */
179const u_char e2a_POSIX[] = {
180	0000, 0001, 0002, 0003, 0234, 0011, 0206, 0177,		/* 0000 */
181	0227, 0215, 0216, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
182	0020, 0021, 0022, 0023, 0235, 0205, 0010, 0207,		/* 0020 */
183	0030, 0031, 0222, 0217, 0034, 0035, 0036, 0037,		/* 0030 */
184	0200, 0201, 0202, 0203, 0204, 0012, 0027, 0033,		/* 0040 */
185	0210, 0211, 0212, 0213, 0214, 0005, 0006, 0007,		/* 0050 */
186	0220, 0221, 0026, 0223, 0224, 0225, 0226, 0004,		/* 0060 */
187	0230, 0231, 0232, 0233, 0024, 0025, 0236, 0032,		/* 0070 */
188	0040, 0240, 0241, 0242, 0243, 0244, 0245, 0246,		/* 0100 */
189	0247, 0250, 0325, 0056, 0074, 0050, 0053, 0174,		/* 0110 */
190	0046, 0251, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0120 */
191	0260, 0261, 0041, 0044, 0052, 0051, 0073, 0176,		/* 0130 */
192	0055, 0057, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0140 */
193	0270, 0271, 0313, 0054, 0045, 0137, 0076, 0077,		/* 0150 */
194	0272, 0273, 0274, 0275, 0276, 0277, 0300, 0301,		/* 0160 */
195	0302, 0140, 0072, 0043, 0100, 0047, 0075, 0042,		/* 0170 */
196	0303, 0141, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0200 */
197	0150, 0151, 0304, 0305, 0306, 0307, 0310, 0311,		/* 0210 */
198	0312, 0152, 0153, 0154, 0155, 0156, 0157, 0160,		/* 0220 */
199	0161, 0162, 0136, 0314, 0315, 0316, 0317, 0320,		/* 0230 */
200	0321, 0345, 0163, 0164, 0165, 0166, 0167, 0170,		/* 0240 */
201	0171, 0172, 0322, 0323, 0324, 0133, 0326, 0327,		/* 0250 */
202	0330, 0331, 0332, 0333, 0334, 0335, 0336, 0337,		/* 0260 */
203	0340, 0341, 0342, 0343, 0344, 0135, 0346, 0347,		/* 0270 */
204	0173, 0101, 0102, 0103, 0104, 0105, 0106, 0107,		/* 0300 */
205	0110, 0111, 0350, 0351, 0352, 0353, 0354, 0355,		/* 0310 */
206	0175, 0112, 0113, 0114, 0115, 0116, 0117, 0120,		/* 0320 */
207	0121, 0122, 0356, 0357, 0360, 0361, 0362, 0363,		/* 0330 */
208	0134, 0237, 0123, 0124, 0125, 0126, 0127, 0130,		/* 0340 */
209	0131, 0132, 0364, 0365, 0366, 0367, 0370, 0371,		/* 0350 */
210	0060, 0061, 0062, 0063, 0064, 0065, 0066, 0067,		/* 0360 */
211	0070, 0071, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
212};
213
214/* ASCII to EBCDIC -- POSIX and System V compatible. */
215const u_char a2e_POSIX[] = {
216	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
217	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
218	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
219	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
220	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
221	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
222	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
223	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
224	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
225	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
226	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
227	0347, 0350, 0351, 0255, 0340, 0275, 0232, 0155,		/* 0130 */
228	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
229	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
230	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
231	0247, 0250, 0251, 0300, 0117, 0320, 0137, 0007,		/* 0170 */
232	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
233	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
234	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
235	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
236	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
237	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
238	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
239	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
240	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
241	0216, 0217, 0220, 0152, 0233, 0234, 0235, 0236,		/* 0310 */
242	0237, 0240, 0252, 0253, 0254, 0112, 0256, 0257,		/* 0320 */
243	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
244	0270, 0271, 0272, 0273, 0274, 0241, 0276, 0277,		/* 0340 */
245	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
246	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
247	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
248};
249
250/* ASCII to IBM EBCDIC -- POSIX and System V compatible. */
251const u_char a2ibm_POSIX[] = {
252	0000, 0001, 0002, 0003, 0067, 0055, 0056, 0057,		/* 0000 */
253	0026, 0005, 0045, 0013, 0014, 0015, 0016, 0017,		/* 0010 */
254	0020, 0021, 0022, 0023, 0074, 0075, 0062, 0046,		/* 0020 */
255	0030, 0031, 0077, 0047, 0034, 0035, 0036, 0037,		/* 0030 */
256	0100, 0132, 0177, 0173, 0133, 0154, 0120, 0175,		/* 0040 */
257	0115, 0135, 0134, 0116, 0153, 0140, 0113, 0141,		/* 0050 */
258	0360, 0361, 0362, 0363, 0364, 0365, 0366, 0367,		/* 0060 */
259	0370, 0371, 0172, 0136, 0114, 0176, 0156, 0157,		/* 0070 */
260	0174, 0301, 0302, 0303, 0304, 0305, 0306, 0307,		/* 0100 */
261	0310, 0311, 0321, 0322, 0323, 0324, 0325, 0326,		/* 0110 */
262	0327, 0330, 0331, 0342, 0343, 0344, 0345, 0346,		/* 0120 */
263	0347, 0350, 0351, 0255, 0340, 0275, 0137, 0155,		/* 0130 */
264	0171, 0201, 0202, 0203, 0204, 0205, 0206, 0207,		/* 0140 */
265	0210, 0211, 0221, 0222, 0223, 0224, 0225, 0226,		/* 0150 */
266	0227, 0230, 0231, 0242, 0243, 0244, 0245, 0246,		/* 0160 */
267	0247, 0250, 0251, 0300, 0117, 0320, 0241, 0007,		/* 0170 */
268	0040, 0041, 0042, 0043, 0044, 0025, 0006, 0027,		/* 0200 */
269	0050, 0051, 0052, 0053, 0054, 0011, 0012, 0033,		/* 0210 */
270	0060, 0061, 0032, 0063, 0064, 0065, 0066, 0010,		/* 0220 */
271	0070, 0071, 0072, 0073, 0004, 0024, 0076, 0341,		/* 0230 */
272	0101, 0102, 0103, 0104, 0105, 0106, 0107, 0110,		/* 0240 */
273	0111, 0121, 0122, 0123, 0124, 0125, 0126, 0127,		/* 0250 */
274	0130, 0131, 0142, 0143, 0144, 0145, 0146, 0147,		/* 0260 */
275	0150, 0151, 0160, 0161, 0162, 0163, 0164, 0165,		/* 0270 */
276	0166, 0167, 0170, 0200, 0212, 0213, 0214, 0215,		/* 0300 */
277	0216, 0217, 0220, 0232, 0233, 0234, 0235, 0236,		/* 0310 */
278	0237, 0240, 0252, 0253, 0254, 0255, 0256, 0257,		/* 0320 */
279	0260, 0261, 0262, 0263, 0264, 0265, 0266, 0267,		/* 0330 */
280	0270, 0271, 0272, 0273, 0274, 0275, 0276, 0277,		/* 0340 */
281	0312, 0313, 0314, 0315, 0316, 0317, 0332, 0333,		/* 0350 */
282	0334, 0335, 0336, 0337, 0352, 0353, 0354, 0355,		/* 0360 */
283	0356, 0357, 0372, 0373, 0374, 0375, 0376, 0377,		/* 0370 */
284};
285