xref: /freebsd/usr.bin/unexpand/unexpand.c (revision 0b8224d1cc9dc6c9778ba04a75b2c8d47e5d7481)
/*-
 * SPDX-License-Identifier: BSD-3-Clause
 *
 * Copyright (c) 1980, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

/*
 * unexpand - put tabs into a file replacing blanks
 */
#include <ctype.h>
#include <err.h>
#include <limits.h>
#include <locale.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <wchar.h>
#include <wctype.h>

/* Nonzero to convert blanks anywhere in a line, not just leading ones. */
static int	all;
/* Number of valid entries in tabstops[]. */
static int	nstops;
/*
 * Tab stop columns in ascending order.  When nstops is 1 the single
 * entry is treated as a repeating interval rather than one fixed stop.
 */
static int	tabstops[100];

50aca29625STim J. Robbins static void getstops(const char *);
51*cccdaf50SAlfonso Gregory static void usage(void) __dead2;
52a2641fe8STim J. Robbins static int tabify(const char *);
5356d8f922SPhilippe Charnier 
5401492790SPhilippe Charnier int
main(int argc,char * argv[])55f4ac32deSDavid Malone main(int argc, char *argv[])
569b50d902SRodney W. Grimes {
574596ce3dSTim J. Robbins 	int ch, failed;
584596ce3dSTim J. Robbins 	char *filename;
599b50d902SRodney W. Grimes 
60ec85e6a0STim J. Robbins 	setlocale(LC_CTYPE, "");
61ec85e6a0STim J. Robbins 
62aca29625STim J. Robbins 	nstops = 1;
63aca29625STim J. Robbins 	tabstops[0] = 8;
64aca29625STim J. Robbins 	while ((ch = getopt(argc, argv, "at:")) != -1) {
65aca29625STim J. Robbins 		switch (ch) {
66aca29625STim J. Robbins 		case 'a':	/* Un-expand all spaces, not just leading. */
67aca29625STim J. Robbins 			all = 1;
68aca29625STim J. Robbins 			break;
69aca29625STim J. Robbins 		case 't':	/* Specify tab list, implies -a. */
70aca29625STim J. Robbins 			getstops(optarg);
71aca29625STim J. Robbins 			all = 1;
72aca29625STim J. Robbins 			break;
73aca29625STim J. Robbins 		default:
7456d8f922SPhilippe Charnier 			usage();
75aca29625STim J. Robbins 			/*NOTREACHED*/
769b50d902SRodney W. Grimes 		}
77aca29625STim J. Robbins 	}
78aca29625STim J. Robbins 	argc -= optind;
79aca29625STim J. Robbins 	argv += optind;
80aca29625STim J. Robbins 
814596ce3dSTim J. Robbins 	failed = 0;
824596ce3dSTim J. Robbins 	if (argc == 0)
83a2641fe8STim J. Robbins 		failed |= tabify("stdin");
844596ce3dSTim J. Robbins 	else {
854596ce3dSTim J. Robbins 		while ((filename = *argv++) != NULL) {
864596ce3dSTim J. Robbins 			if (freopen(filename, "r", stdin) == NULL) {
874596ce3dSTim J. Robbins 				warn("%s", filename);
88a2641fe8STim J. Robbins 				failed = 1;
894596ce3dSTim J. Robbins 			} else
90a2641fe8STim J. Robbins 				failed |= tabify(filename);
914596ce3dSTim J. Robbins 		}
924596ce3dSTim J. Robbins 	}
934596ce3dSTim J. Robbins 	exit(failed != 0);
949b50d902SRodney W. Grimes }
959b50d902SRodney W. Grimes 
/*
 * Print the command synopsis on stderr and exit with status 1.
 * Never returns.
 */
static void
usage(void)
{
	fprintf(stderr, "usage: unexpand [-a | -t tablist] [file ...]\n");
	exit(1);
}

103a2641fe8STim J. Robbins static int
tabify(const char * curfile)104a2641fe8STim J. Robbins tabify(const char *curfile)
1059b50d902SRodney W. Grimes {
106a2641fe8STim J. Robbins 	int dcol, doneline, limit, n, ocol, width;
107a2641fe8STim J. Robbins 	wint_t ch;
1089b50d902SRodney W. Grimes 
109aca29625STim J. Robbins 	limit = nstops == 1 ? INT_MAX : tabstops[nstops - 1] - 1;
1109b50d902SRodney W. Grimes 
111aca29625STim J. Robbins 	doneline = ocol = dcol = 0;
112a2641fe8STim J. Robbins 	while ((ch = getwchar()) != WEOF) {
1134596ce3dSTim J. Robbins 		if (ch == ' ' && !doneline) {
114aca29625STim J. Robbins 			if (++dcol >= limit)
115aca29625STim J. Robbins 				doneline = 1;
116aca29625STim J. Robbins 			continue;
117aca29625STim J. Robbins 		} else if (ch == '\t') {
118aca29625STim J. Robbins 			if (nstops == 1) {
119aca29625STim J. Robbins 				dcol = (1 + dcol / tabstops[0]) *
120aca29625STim J. Robbins 				    tabstops[0];
121aca29625STim J. Robbins 				continue;
122aca29625STim J. Robbins 			} else {
123336c5fb5SPedro F. Giffuni 				for (n = 0; n < nstops &&
124336c5fb5SPedro F. Giffuni 				    tabstops[n] - 1 < dcol; n++)
125aca29625STim J. Robbins 					;
126aca29625STim J. Robbins 				if (n < nstops - 1 && tabstops[n] - 1 < limit) {
127aca29625STim J. Robbins 					dcol = tabstops[n];
128aca29625STim J. Robbins 					continue;
1299b50d902SRodney W. Grimes 				}
130aca29625STim J. Robbins 				doneline = 1;
131aca29625STim J. Robbins 			}
132aca29625STim J. Robbins 		}
133aca29625STim J. Robbins 
134aca29625STim J. Robbins 		/* Output maximal number of tabs. */
135aca29625STim J. Robbins 		if (nstops == 1) {
136aca29625STim J. Robbins 			while (((ocol + tabstops[0]) / tabstops[0])
137aca29625STim J. Robbins 			    <= (dcol / tabstops[0])) {
138aca29625STim J. Robbins 				if (dcol - ocol < 2)
139aca29625STim J. Robbins 					break;
140a2641fe8STim J. Robbins 				putwchar('\t');
141aca29625STim J. Robbins 				ocol = (1 + ocol / tabstops[0]) *
142aca29625STim J. Robbins 				    tabstops[0];
143aca29625STim J. Robbins 			}
144aca29625STim J. Robbins 		} else {
145336c5fb5SPedro F. Giffuni 			for (n = 0; n < nstops && tabstops[n] - 1 < ocol; n++)
146aca29625STim J. Robbins 				;
147aca29625STim J. Robbins 			while (ocol < dcol && n < nstops && ocol < limit) {
148a2641fe8STim J. Robbins 				putwchar('\t');
149aca29625STim J. Robbins 				ocol = tabstops[n++];
150aca29625STim J. Robbins 			}
151aca29625STim J. Robbins 		}
152aca29625STim J. Robbins 
153aca29625STim J. Robbins 		/* Then spaces. */
154aca29625STim J. Robbins 		while (ocol < dcol && ocol < limit) {
155a2641fe8STim J. Robbins 			putwchar(' ');
1569b50d902SRodney W. Grimes 			ocol++;
1579b50d902SRodney W. Grimes 		}
158aca29625STim J. Robbins 
1594596ce3dSTim J. Robbins 		if (ch == '\b') {
160a2641fe8STim J. Robbins 			putwchar('\b');
1614596ce3dSTim J. Robbins 			if (ocol > 0)
1624596ce3dSTim J. Robbins 				ocol--, dcol--;
1634596ce3dSTim J. Robbins 		} else if (ch == '\n') {
164a2641fe8STim J. Robbins 			putwchar('\n');
1654596ce3dSTim J. Robbins 			doneline = ocol = dcol = 0;
16626cabd19STim J. Robbins 			continue;
1674596ce3dSTim J. Robbins 		} else if (ch != ' ' || dcol > limit) {
168a2641fe8STim J. Robbins 			putwchar(ch);
169a2641fe8STim J. Robbins 			if ((width = wcwidth(ch)) > 0)
170a2641fe8STim J. Robbins 				ocol += width, dcol += width;
1719b50d902SRodney W. Grimes 		}
172aca29625STim J. Robbins 
173aca29625STim J. Robbins 		/*
174aca29625STim J. Robbins 		 * Only processing leading blanks or we've gone past the
175aca29625STim J. Robbins 		 * last tab stop. Emit remainder of this line unchanged.
176aca29625STim J. Robbins 		 */
177aca29625STim J. Robbins 		if (!all || dcol >= limit) {
178a2641fe8STim J. Robbins 			while ((ch = getwchar()) != '\n' && ch != WEOF)
179a2641fe8STim J. Robbins 				putwchar(ch);
180aca29625STim J. Robbins 			if (ch == '\n')
181a2641fe8STim J. Robbins 				putwchar('\n');
1824596ce3dSTim J. Robbins 			doneline = ocol = dcol = 0;
183aca29625STim J. Robbins 		}
184aca29625STim J. Robbins 	}
185a2641fe8STim J. Robbins 	if (ferror(stdin)) {
186a2641fe8STim J. Robbins 		warn("%s", curfile);
187a2641fe8STim J. Robbins 		return (1);
188a2641fe8STim J. Robbins 	}
189a2641fe8STim J. Robbins 	return (0);
190aca29625STim J. Robbins }
191aca29625STim J. Robbins 
192aca29625STim J. Robbins static void
getstops(const char * cp)193f4ac32deSDavid Malone getstops(const char *cp)
194aca29625STim J. Robbins {
195aca29625STim J. Robbins 	int i;
196aca29625STim J. Robbins 
197aca29625STim J. Robbins 	nstops = 0;
198aca29625STim J. Robbins 	for (;;) {
199aca29625STim J. Robbins 		i = 0;
200aca29625STim J. Robbins 		while (*cp >= '0' && *cp <= '9')
201aca29625STim J. Robbins 			i = i * 10 + *cp++ - '0';
202aca29625STim J. Robbins 		if (i <= 0)
203aca29625STim J. Robbins 			errx(1, "bad tab stop spec");
204aca29625STim J. Robbins 		if (nstops > 0 && i <= tabstops[nstops-1])
205aca29625STim J. Robbins 			errx(1, "bad tab stop spec");
206aca29625STim J. Robbins 		if (nstops == sizeof(tabstops) / sizeof(*tabstops))
207aca29625STim J. Robbins 			errx(1, "too many tab stops");
208aca29625STim J. Robbins 		tabstops[nstops++] = i;
209aca29625STim J. Robbins 		if (*cp == 0)
210aca29625STim J. Robbins 			break;
211ec85e6a0STim J. Robbins 		if (*cp != ',' && !isblank((unsigned char)*cp))
212aca29625STim J. Robbins 			errx(1, "bad tab stop spec");
2139b50d902SRodney W. Grimes 		cp++;
2149b50d902SRodney W. Grimes 	}
2159b50d902SRodney W. Grimes }
216