xref: /freebsd/stand/common/interp_backslash.c (revision 3e15b01d6914c927e37d1699645783acf286655c)
1ca987d46SWarner Losh /*-
2ca987d46SWarner Losh  * Redistribution and use in source and binary forms, with or without
3ca987d46SWarner Losh  * modification, are permitted provided that the following conditions
4ca987d46SWarner Losh  * are met:
5ca987d46SWarner Losh  * 1. Redistributions of source code must retain the above copyright
6ca987d46SWarner Losh  *    notice, this list of conditions and the following disclaimer.
7ca987d46SWarner Losh  * 2. Redistributions in binary form must reproduce the above copyright
8ca987d46SWarner Losh  *    notice, this list of conditions and the following disclaimer in the
9ca987d46SWarner Losh  *    documentation and/or other materials provided with the distribution.
10ca987d46SWarner Losh  *
11ca987d46SWarner Losh  * Jordan K. Hubbard
12ca987d46SWarner Losh  * 29 August 1998
13ca987d46SWarner Losh  *
14ca987d46SWarner Losh  * Routine for doing backslash elimination.
15ca987d46SWarner Losh  */
16ca987d46SWarner Losh 
17ca987d46SWarner Losh #include <stand.h>
18ca987d46SWarner Losh #include <string.h>
19ca987d46SWarner Losh #include "bootstrap.h"
20ca987d46SWarner Losh 
21ca987d46SWarner Losh #define	DIGIT(x) (isdigit(x) ? (x) - '0' : islower(x) ? (x) + 10 - 'a' : (x) + 10 - 'A')
22ca987d46SWarner Losh 
23ca987d46SWarner Losh /*
24ca987d46SWarner Losh  * backslash: Return malloc'd copy of str with all standard "backslash
25ca987d46SWarner Losh  * processing" done on it.  Original can be free'd if desired.
26ca987d46SWarner Losh  */
27ca987d46SWarner Losh char *
backslash(const char * str)28*bd04a914SWarner Losh backslash(const char *str)
29ca987d46SWarner Losh {
30ca987d46SWarner Losh 	/*
31ca987d46SWarner Losh 	 * Remove backslashes from the strings. Turn \040 etc. into a single
32ca987d46SWarner Losh 	 * character (we allow eight bit values). Currently NUL is not
33ca987d46SWarner Losh 	 * allowed.
34ca987d46SWarner Losh 	 *
35ca987d46SWarner Losh 	 * Turn "\n" and "\t" into '\n' and '\t' characters. Etc.
36ca987d46SWarner Losh 	 *
37ca987d46SWarner Losh 	 */
38ca987d46SWarner Losh 	char *new_str;
39ca987d46SWarner Losh 	int seenbs = 0;
40ca987d46SWarner Losh 	int i = 0;
41ca987d46SWarner Losh 
42ca987d46SWarner Losh 	if ((new_str = strdup(str)) == NULL)
43ca987d46SWarner Losh 		return NULL;
44ca987d46SWarner Losh 
45ca987d46SWarner Losh 	while (*str) {
46ca987d46SWarner Losh 		if (seenbs) {
47ca987d46SWarner Losh 			seenbs = 0;
48ca987d46SWarner Losh 			switch (*str) {
49ca987d46SWarner Losh 			case '\\':
50ca987d46SWarner Losh 				new_str[i++] = '\\';
51ca987d46SWarner Losh 				str++;
52ca987d46SWarner Losh 				break;
53ca987d46SWarner Losh 
54ca987d46SWarner Losh 				/* preserve backslashed quotes, dollar signs */
55ca987d46SWarner Losh 			case '\'':
56ca987d46SWarner Losh 			case '"':
57ca987d46SWarner Losh 			case '$':
58ca987d46SWarner Losh 				new_str[i++] = '\\';
59ca987d46SWarner Losh 				new_str[i++] = *str++;
60ca987d46SWarner Losh 				break;
61ca987d46SWarner Losh 
62ca987d46SWarner Losh 			case 'b':
63ca987d46SWarner Losh 				new_str[i++] = '\b';
64ca987d46SWarner Losh 				str++;
65ca987d46SWarner Losh 				break;
66ca987d46SWarner Losh 
67ca987d46SWarner Losh 			case 'f':
68ca987d46SWarner Losh 				new_str[i++] = '\f';
69ca987d46SWarner Losh 				str++;
70ca987d46SWarner Losh 				break;
71ca987d46SWarner Losh 
72ca987d46SWarner Losh 			case 'r':
73ca987d46SWarner Losh 				new_str[i++] = '\r';
74ca987d46SWarner Losh 				str++;
75ca987d46SWarner Losh 				break;
76ca987d46SWarner Losh 
77ca987d46SWarner Losh 			case 'n':
78ca987d46SWarner Losh 				new_str[i++] = '\n';
79ca987d46SWarner Losh 				str++;
80ca987d46SWarner Losh 				break;
81ca987d46SWarner Losh 
82ca987d46SWarner Losh 			case 's':
83ca987d46SWarner Losh 				new_str[i++] = ' ';
84ca987d46SWarner Losh 				str++;
85ca987d46SWarner Losh 				break;
86ca987d46SWarner Losh 
87ca987d46SWarner Losh 			case 't':
88ca987d46SWarner Losh 				new_str[i++] = '\t';
89ca987d46SWarner Losh 				str++;
90ca987d46SWarner Losh 				break;
91ca987d46SWarner Losh 
92ca987d46SWarner Losh 			case 'v':
93ca987d46SWarner Losh 				new_str[i++] = '\13';
94ca987d46SWarner Losh 				str++;
95ca987d46SWarner Losh 				break;
96ca987d46SWarner Losh 
97ca987d46SWarner Losh 			case 'z':
98ca987d46SWarner Losh 				str++;
99ca987d46SWarner Losh 				break;
100ca987d46SWarner Losh 
101ca987d46SWarner Losh 			case '0': case '1': case '2': case '3': case '4':
102ca987d46SWarner Losh 			case '5': case '6': case '7': case '8': case '9': {
103ca987d46SWarner Losh 				char val;
104ca987d46SWarner Losh 
105ca987d46SWarner Losh 				/* Three digit octal constant? */
106ca987d46SWarner Losh 				if (*str >= '0' && *str <= '3' &&
107ca987d46SWarner Losh 				    *(str + 1) >= '0' && *(str + 1) <= '7' &&
108ca987d46SWarner Losh 				    *(str + 2) >= '0' && *(str + 2) <= '7') {
109ca987d46SWarner Losh 
110ca987d46SWarner Losh 					val = (DIGIT(*str) << 6) + (DIGIT(*(str + 1)) << 3) +
111ca987d46SWarner Losh 					    DIGIT(*(str + 2));
112ca987d46SWarner Losh 
113ca987d46SWarner Losh 					/* Allow null value if user really wants to shoot
114ca987d46SWarner Losh 					   at feet, but beware! */
115ca987d46SWarner Losh 					new_str[i++] = val;
116ca987d46SWarner Losh 					str += 3;
117ca987d46SWarner Losh 					break;
118ca987d46SWarner Losh 				}
119ca987d46SWarner Losh 
120ca987d46SWarner Losh 				/* One or two digit hex constant?
121ca987d46SWarner Losh 				 * If two are there they will both be taken.
122ca987d46SWarner Losh 				 * Use \z to split them up if this is not wanted.
123ca987d46SWarner Losh 				 */
124ca987d46SWarner Losh 				if (*str == '0' &&
125ca987d46SWarner Losh 				    (*(str + 1) == 'x' || *(str + 1) == 'X') &&
126ca987d46SWarner Losh 				    isxdigit(*(str + 2))) {
127ca987d46SWarner Losh 					val = DIGIT(*(str + 2));
128ca987d46SWarner Losh 					if (isxdigit(*(str + 3))) {
129ca987d46SWarner Losh 						val = (val << 4) + DIGIT(*(str + 3));
130ca987d46SWarner Losh 						str += 4;
131ca987d46SWarner Losh 					}
132ca987d46SWarner Losh 					else
133ca987d46SWarner Losh 						str += 3;
134ca987d46SWarner Losh 					/* Yep, allow null value here too */
135ca987d46SWarner Losh 					new_str[i++] = val;
136ca987d46SWarner Losh 					break;
137ca987d46SWarner Losh 				}
138ca987d46SWarner Losh 			}
139ca987d46SWarner Losh 				break;
140ca987d46SWarner Losh 
141ca987d46SWarner Losh 			default:
142ca987d46SWarner Losh 				new_str[i++] = *str++;
143ca987d46SWarner Losh 				break;
144ca987d46SWarner Losh 			}
145ca987d46SWarner Losh 		}
146ca987d46SWarner Losh 		else {
147ca987d46SWarner Losh 			if (*str == '\\') {
148ca987d46SWarner Losh 				seenbs = 1;
149ca987d46SWarner Losh 				str++;
150ca987d46SWarner Losh 			}
151ca987d46SWarner Losh 			else
152ca987d46SWarner Losh 				new_str[i++] = *str++;
153ca987d46SWarner Losh 		}
154ca987d46SWarner Losh 	}
155ca987d46SWarner Losh 
156ca987d46SWarner Losh 	if (seenbs) {
157ca987d46SWarner Losh 		/*
158ca987d46SWarner Losh 		 * The final character was a '\'. Put it in as a single backslash.
159ca987d46SWarner Losh 		 */
160ca987d46SWarner Losh 		new_str[i++] = '\\';
161ca987d46SWarner Losh 	}
162ca987d46SWarner Losh 	new_str[i] = '\0';
163ca987d46SWarner Losh 	return new_str;
164ca987d46SWarner Losh }
165