xref: /freebsd/usr.bin/fold/fold.c (revision a3cf0ef5a295c885c895fabfd56470c0d1db322d)
1 /*-
2  * Copyright (c) 1990, 1993
3  *	The Regents of the University of California.  All rights reserved.
4  *
5  * This code is derived from software contributed to Berkeley by
6  * Kevin Ruddy.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  * 3. All advertising materials mentioning features or use of this software
17  *    must display the following acknowledgement:
18  *	This product includes software developed by the University of
19  *	California, Berkeley and its contributors.
20  * 4. Neither the name of the University nor the names of its contributors
21  *    may be used to endorse or promote products derived from this software
22  *    without specific prior written permission.
23  *
24  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
25  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
26  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
27  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
28  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
29  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
30  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
31  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
32  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
33  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
34  * SUCH DAMAGE.
35  */
36 
37 #ifndef lint
38 static const char copyright[] =
39 "@(#) Copyright (c) 1990, 1993\n\
40 	The Regents of the University of California.  All rights reserved.\n";
41 #endif /* not lint */
42 
43 #ifndef lint
44 #if 0
45 static char sccsid[] = "@(#)fold.c	8.1 (Berkeley) 6/6/93";
46 #endif
47 #endif /* not lint */
48 
49 #include <sys/cdefs.h>
50 __FBSDID("$FreeBSD$");
51 
#include <err.h>
#include <errno.h>
#include <limits.h>
#include <locale.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <wchar.h>
#include <wctype.h>
61 
/* Line width applied when the command line does not specify one. */
#define	DEFLINEWIDTH	80

void fold(int width);
static int newpos(int col, wint_t ch);
static void usage(void);

/* Option state shared by main(), fold() and newpos(). */
int bflag;			/* -b: measure width in bytes, not columns */
int sflag;			/* -s: break lines after the last blank */
70 
71 int
72 main(int argc, char **argv)
73 {
74 	int ch, previous_ch;
75 	int rval, width;
76 
77 	(void) setlocale(LC_CTYPE, "");
78 
79 	width = -1;
80 	previous_ch = 0;
81 	while ((ch = getopt(argc, argv, "0123456789bsw:")) != -1) {
82 		switch (ch) {
83 		case 'b':
84 			bflag = 1;
85 			break;
86 		case 's':
87 			sflag = 1;
88 			break;
89 		case 'w':
90 			if ((width = atoi(optarg)) <= 0) {
91 				errx(1, "illegal width value");
92 			}
93 			break;
94 		case '0': case '1': case '2': case '3': case '4':
95 		case '5': case '6': case '7': case '8': case '9':
96 			/* Accept a width as eg. -30. Note that a width
97 			 * specified using the -w option is always used prior
98 			 * to this undocumented option. */
99 			switch (previous_ch) {
100 			case '0': case '1': case '2': case '3': case '4':
101 			case '5': case '6': case '7': case '8': case '9':
102 				/* The width is a number with multiple digits:
103 				 * add the last one. */
104 				width = width * 10 + (ch - '0');
105 				break;
106 			default:
107 				/* Set the width, unless it was previously
108 				 * set. For instance, the following options
109 				 * would all give a width of 5 and not 10:
110 				 *   -10 -w5
111 				 *   -5b10
112 				 *   -5 -10b */
113 				if (width == -1)
114 					width = ch - '0';
115 				break;
116 			}
117 			break;
118 		default:
119 			usage();
120 		}
121 		previous_ch = ch;
122 	}
123 	argv += optind;
124 	argc -= optind;
125 
126 	if (width == -1)
127 		width = DEFLINEWIDTH;
128 	rval = 0;
129 	if (!*argv)
130 		fold(width);
131 	else for (; *argv; ++argv)
132 		if (!freopen(*argv, "r", stdin)) {
133 			warn("%s", *argv);
134 			rval = 1;
135 		} else
136 			fold(width);
137 	exit(rval);
138 }
139 
/*
 * Print the command synopsis on standard error and terminate with exit
 * status 1.  Does not return.
 */
static void
usage(void)
{
	static const char synopsis[] =
	    "usage: fold [-bs] [-w width] [file ...]\n";

	(void)fputs(synopsis, stderr);
	exit(1);
}
146 
147 /*
148  * Fold the contents of standard input to fit within WIDTH columns (or bytes)
149  * and write to standard output.
150  *
151  * If sflag is set, split the line at the last space character on the line.
152  * This flag necessitates storing the line in a buffer until the current
153  * column > width, or a newline or EOF is read.
154  *
155  * The buffer can grow larger than WIDTH due to backspaces and carriage
156  * returns embedded in the input stream.
157  */
158 void
159 fold(int width)
160 {
161 	static wchar_t *buf;
162 	static int buf_max;
163 	int col, i, indx, space;
164 	wint_t ch;
165 
166 	col = indx = 0;
167 	while ((ch = getwchar()) != WEOF) {
168 		if (ch == '\n') {
169 			wprintf(L"%.*ls\n", indx, buf);
170 			col = indx = 0;
171 			continue;
172 		}
173 		if ((col = newpos(col, ch)) > width) {
174 			if (sflag) {
175 				i = indx;
176 				while (--i >= 0 && !iswblank(buf[i]))
177 					;
178 				space = i;
179 			}
180 			if (sflag && space != -1) {
181 				space++;
182 				wprintf(L"%.*ls\n", space, buf);
183 				wmemmove(buf, buf + space, indx - space);
184 				indx -= space;
185 				col = 0;
186 				for (i = 0; i < indx; i++)
187 					col = newpos(col, buf[i]);
188 			} else {
189 				wprintf(L"%.*ls\n", indx, buf);
190 				col = indx = 0;
191 			}
192 			col = newpos(col, ch);
193 		}
194 		if (indx + 1 > buf_max) {
195 			buf_max += LINE_MAX;
196 			buf = realloc(buf, sizeof(*buf) * buf_max);
197 			if (buf == NULL)
198 				err(1, "realloc()");
199 		}
200 		buf[indx++] = ch;
201 	}
202 
203 	if (indx != 0)
204 		wprintf(L"%.*ls", indx, buf);
205 }
206 
207 /*
208  * Update the current column position for a character.
209  */
210 static int
211 newpos(int col, wint_t ch)
212 {
213 	char buf[MB_LEN_MAX];
214 	size_t len;
215 	int w;
216 
217 	if (bflag) {
218 		len = wcrtomb(buf, ch, NULL);
219 		col += len;
220 	} else
221 		switch (ch) {
222 		case '\b':
223 			if (col > 0)
224 				--col;
225 			break;
226 		case '\r':
227 			col = 0;
228 			break;
229 		case '\t':
230 			col = (col + 8) & ~7;
231 			break;
232 		default:
233 			if ((w = wcwidth(ch)) > 0)
234 				col += w;
235 			break;
236 		}
237 
238 	return (col);
239 }
240