xref: /freebsd/usr.bin/wc/wc.c (revision ebb42aee311aba4f36f4bf0fa5f80f358beed2c1)
/*
 * Copyright (c) 1980, 1987, 1991, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. All advertising materials mentioning features or use of this software
 *    must display the following acknowledgement:
 *	This product includes software developed by the University of
 *	California, Berkeley and its contributors.
 * 4. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
339b50d902SRodney W. Grimes 
/*
 * Identification strings embedded in the object file.  They are hidden
 * from lint, and the historical SCCS id is compiled out entirely.
 */
#ifndef lint
static const char copyright[] =
	"@(#) Copyright (c) 1980, 1987, 1991, 1993\n"
	"\tThe Regents of the University of California.  All rights reserved.\n";
#endif /* not lint */

#if 0
#ifndef lint
static char sccsid[] = "@(#)wc.c	8.1 (Berkeley) 6/6/93";
#endif /* not lint */
#endif
459b50d902SRodney W. Grimes 
#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");

#include <sys/param.h>
#include <sys/stat.h>

#include <ctype.h>
#include <err.h>
#include <errno.h>
#include <fcntl.h>
#include <locale.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <wctype.h>
629b50d902SRodney W. Grimes 
/*
 * Running totals of lines, words and characters over all inputs; cnt()
 * adds to them and main() prints them on the final "total" line.
 */
uintmax_t tlinect;
uintmax_t twordct;
uintmax_t tcharct;

/*
 * Output selectors set from the command line: -l, -w, -c and -m
 * respectively.
 */
int doline;
int doword;
int dochar;
int domulti;

static int	cnt(const char *);
static void	usage(void);
689b50d902SRodney W. Grimes 
699b50d902SRodney W. Grimes int
709b50d902SRodney W. Grimes main(argc, argv)
719b50d902SRodney W. Grimes 	int argc;
729b50d902SRodney W. Grimes 	char *argv[];
739b50d902SRodney W. Grimes {
74a0cf59e6SSheldon Hearn 	int ch, errors, total;
759b50d902SRodney W. Grimes 
76ae6fa8aeSAndrey A. Chernov 	(void) setlocale(LC_CTYPE, "");
77ae6fa8aeSAndrey A. Chernov 
78ebb42aeeSTim J. Robbins 	while ((ch = getopt(argc, argv, "clmw")) != -1)
799b50d902SRodney W. Grimes 		switch((char)ch) {
809b50d902SRodney W. Grimes 		case 'l':
819b50d902SRodney W. Grimes 			doline = 1;
829b50d902SRodney W. Grimes 			break;
839b50d902SRodney W. Grimes 		case 'w':
849b50d902SRodney W. Grimes 			doword = 1;
859b50d902SRodney W. Grimes 			break;
869b50d902SRodney W. Grimes 		case 'c':
879b50d902SRodney W. Grimes 			dochar = 1;
88ebb42aeeSTim J. Robbins 			domulti = 0;
89ebb42aeeSTim J. Robbins 			break;
90ebb42aeeSTim J. Robbins 		case 'm':
91ebb42aeeSTim J. Robbins 			domulti = 1;
92ebb42aeeSTim J. Robbins 			dochar = 0;
939b50d902SRodney W. Grimes 			break;
949b50d902SRodney W. Grimes 		case '?':
959b50d902SRodney W. Grimes 		default:
969b50d902SRodney W. Grimes 			usage();
979b50d902SRodney W. Grimes 		}
989b50d902SRodney W. Grimes 	argv += optind;
999b50d902SRodney W. Grimes 	argc -= optind;
1009b50d902SRodney W. Grimes 
1019b50d902SRodney W. Grimes 	/* Wc's flags are on by default. */
102ebb42aeeSTim J. Robbins 	if (doline + doword + dochar + domulti == 0)
1039b50d902SRodney W. Grimes 		doline = doword = dochar = 1;
1049b50d902SRodney W. Grimes 
1052c51e5edSBruce Evans 	errors = 0;
1069b50d902SRodney W. Grimes 	total = 0;
1079b50d902SRodney W. Grimes 	if (!*argv) {
1082c51e5edSBruce Evans 		if (cnt((char *)NULL) != 0)
1092c51e5edSBruce Evans 			++errors;
1102c51e5edSBruce Evans 		else
1119b50d902SRodney W. Grimes 			(void)printf("\n");
1129b50d902SRodney W. Grimes 	}
1139b50d902SRodney W. Grimes 	else do {
1142c51e5edSBruce Evans 		if (cnt(*argv) != 0)
1152c51e5edSBruce Evans 			++errors;
1162c51e5edSBruce Evans 		else
1179b50d902SRodney W. Grimes 			(void)printf(" %s\n", *argv);
1189b50d902SRodney W. Grimes 		++total;
1199b50d902SRodney W. Grimes 	} while(*++argv);
1209b50d902SRodney W. Grimes 
1219b50d902SRodney W. Grimes 	if (total > 1) {
1229b50d902SRodney W. Grimes 		if (doline)
123a821e36eSMike Barcroft 			(void)printf(" %7ju", tlinect);
1249b50d902SRodney W. Grimes 		if (doword)
125a821e36eSMike Barcroft 			(void)printf(" %7ju", twordct);
126ebb42aeeSTim J. Robbins 		if (dochar || domulti)
127a821e36eSMike Barcroft 			(void)printf(" %7ju", tcharct);
1289b50d902SRodney W. Grimes 		(void)printf(" total\n");
1299b50d902SRodney W. Grimes 	}
1302c51e5edSBruce Evans 	exit(errors == 0 ? 0 : 1);
1319b50d902SRodney W. Grimes }
1329b50d902SRodney W. Grimes 
133a821e36eSMike Barcroft static int
1349b50d902SRodney W. Grimes cnt(file)
1357a8fb588SMark Murray 	const char *file;
1369b50d902SRodney W. Grimes {
1379b50d902SRodney W. Grimes 	struct stat sb;
138a821e36eSMike Barcroft 	uintmax_t linect, wordct, charct;
139ebb42aeeSTim J. Robbins 	ssize_t nread;
140ebb42aeeSTim J. Robbins 	int clen, fd, len, warned;
141a0cf59e6SSheldon Hearn 	short gotsp;
142a0cf59e6SSheldon Hearn 	u_char *p;
143a0cf59e6SSheldon Hearn 	u_char buf[MAXBSIZE], ch;
144ebb42aeeSTim J. Robbins 	wchar_t wch;
1459b50d902SRodney W. Grimes 
1469b50d902SRodney W. Grimes 	linect = wordct = charct = 0;
1472c51e5edSBruce Evans 	if (file == NULL) {
1482c51e5edSBruce Evans 		file = "stdin";
1492c51e5edSBruce Evans 		fd = STDIN_FILENO;
1502c51e5edSBruce Evans 	} else {
151a0d038a4SWolfram Schneider 		if ((fd = open(file, O_RDONLY, 0)) < 0) {
1522c51e5edSBruce Evans 			warn("%s: open", file);
1532c51e5edSBruce Evans 			return (1);
154a0d038a4SWolfram Schneider 		}
155ebb42aeeSTim J. Robbins 		if (doword || (domulti && MB_CUR_MAX != 1))
1569b50d902SRodney W. Grimes 			goto word;
1579b50d902SRodney W. Grimes 		/*
1589b50d902SRodney W. Grimes 		 * Line counting is split out because it's a lot faster to get
1599b50d902SRodney W. Grimes 		 * lines than to get words, since the word count requires some
1609b50d902SRodney W. Grimes 		 * logic.
1619b50d902SRodney W. Grimes 		 */
1629b50d902SRodney W. Grimes 		if (doline) {
1638c85cce7SPhilippe Charnier 			while ((len = read(fd, buf, MAXBSIZE))) {
1642c51e5edSBruce Evans 				if (len == -1) {
1652c51e5edSBruce Evans 					warn("%s: read", file);
1662c51e5edSBruce Evans 					(void)close(fd);
1672c51e5edSBruce Evans 					return (1);
1682c51e5edSBruce Evans 				}
1699b50d902SRodney W. Grimes 				charct += len;
1709b50d902SRodney W. Grimes 				for (p = buf; len--; ++p)
1719b50d902SRodney W. Grimes 					if (*p == '\n')
1729b50d902SRodney W. Grimes 						++linect;
1739b50d902SRodney W. Grimes 			}
1749b50d902SRodney W. Grimes 			tlinect += linect;
175a821e36eSMike Barcroft 			(void)printf(" %7ju", linect);
1769b50d902SRodney W. Grimes 			if (dochar) {
1779b50d902SRodney W. Grimes 				tcharct += charct;
178a821e36eSMike Barcroft 				(void)printf(" %7ju", charct);
1799b50d902SRodney W. Grimes 			}
1809b50d902SRodney W. Grimes 			(void)close(fd);
1812c51e5edSBruce Evans 			return (0);
1829b50d902SRodney W. Grimes 		}
1839b50d902SRodney W. Grimes 		/*
1849b50d902SRodney W. Grimes 		 * If all we need is the number of characters and it's a
1859b50d902SRodney W. Grimes 		 * regular or linked file, just stat the puppy.
1869b50d902SRodney W. Grimes 		 */
187ebb42aeeSTim J. Robbins 		if (dochar || domulti) {
1882c51e5edSBruce Evans 			if (fstat(fd, &sb)) {
1892c51e5edSBruce Evans 				warn("%s: fstat", file);
1902c51e5edSBruce Evans 				(void)close(fd);
1912c51e5edSBruce Evans 				return (1);
1922c51e5edSBruce Evans 			}
1939b50d902SRodney W. Grimes 			if (S_ISREG(sb.st_mode) || S_ISLNK(sb.st_mode)) {
194a0cf59e6SSheldon Hearn 				(void)printf(" %7lld", (long long)sb.st_size);
1959b50d902SRodney W. Grimes 				tcharct += sb.st_size;
1969b50d902SRodney W. Grimes 				(void)close(fd);
1972c51e5edSBruce Evans 				return (0);
1989b50d902SRodney W. Grimes 			}
1999b50d902SRodney W. Grimes 		}
2009b50d902SRodney W. Grimes 	}
2019b50d902SRodney W. Grimes 
2029b50d902SRodney W. Grimes 	/* Do it the hard way... */
203ebb42aeeSTim J. Robbins word:	gotsp = 1;
204ebb42aeeSTim J. Robbins 	len = 0;
205ebb42aeeSTim J. Robbins 	warned = 0;
206ebb42aeeSTim J. Robbins 	while ((nread = read(fd, buf + len, MAXBSIZE - len)) != 0) {
207ebb42aeeSTim J. Robbins 		if (nread == -1) {
2082c51e5edSBruce Evans 			warn("%s: read", file);
2092c51e5edSBruce Evans 			(void)close(fd);
2102c51e5edSBruce Evans 			return (1);
2112c51e5edSBruce Evans 		}
212ebb42aeeSTim J. Robbins 		len += nread;
213ebb42aeeSTim J. Robbins 		p = buf;
214ebb42aeeSTim J. Robbins 		while (len > 0) {
215ebb42aeeSTim J. Robbins 			if (!domulti || MB_CUR_MAX == 1) {
216ebb42aeeSTim J. Robbins 				clen = 1;
217ebb42aeeSTim J. Robbins 				wch = (unsigned char)*p;
218ebb42aeeSTim J. Robbins 			} else if ((clen = mbtowc(&wch, p, len)) <= 0) {
219ebb42aeeSTim J. Robbins 				if (len > MB_CUR_MAX) {
220ebb42aeeSTim J. Robbins 					clen = 1;
221ebb42aeeSTim J. Robbins 					wch = (unsigned char)*p;
222ebb42aeeSTim J. Robbins 					if (!warned) {
223ebb42aeeSTim J. Robbins 						errno = EILSEQ;
224ebb42aeeSTim J. Robbins 						warn("%s", file);
225ebb42aeeSTim J. Robbins 						warned = 1;
226ebb42aeeSTim J. Robbins 					}
227ebb42aeeSTim J. Robbins 				} else {
228ebb42aeeSTim J. Robbins 					memmove(buf, p, len);
229ebb42aeeSTim J. Robbins 					break;
230ebb42aeeSTim J. Robbins 				}
231ebb42aeeSTim J. Robbins 			}
232ebb42aeeSTim J. Robbins 			charct++;
233ebb42aeeSTim J. Robbins 			len -= clen;
234ebb42aeeSTim J. Robbins 			p += clen;
235ebb42aeeSTim J. Robbins 			if (wch == L'\n')
2369b50d902SRodney W. Grimes 				++linect;
237ebb42aeeSTim J. Robbins 			/* XXX Non-portable; should use iswspace() */
2389b50d902SRodney W. Grimes 			if (isspace(ch))
2399b50d902SRodney W. Grimes 				gotsp = 1;
2409b50d902SRodney W. Grimes 			else if (gotsp) {
2419b50d902SRodney W. Grimes 				gotsp = 0;
2429b50d902SRodney W. Grimes 				++wordct;
2439b50d902SRodney W. Grimes 			}
2449b50d902SRodney W. Grimes 		}
2459b50d902SRodney W. Grimes 	}
2469b50d902SRodney W. Grimes 	if (doline) {
2479b50d902SRodney W. Grimes 		tlinect += linect;
248a821e36eSMike Barcroft 		(void)printf(" %7ju", linect);
2499b50d902SRodney W. Grimes 	}
2509b50d902SRodney W. Grimes 	if (doword) {
2519b50d902SRodney W. Grimes 		twordct += wordct;
252a821e36eSMike Barcroft 		(void)printf(" %7ju", wordct);
2539b50d902SRodney W. Grimes 	}
254ebb42aeeSTim J. Robbins 	if (dochar || domulti) {
2559b50d902SRodney W. Grimes 		tcharct += charct;
256a821e36eSMike Barcroft 		(void)printf(" %7ju", charct);
2579b50d902SRodney W. Grimes 	}
2589b50d902SRodney W. Grimes 	(void)close(fd);
2592c51e5edSBruce Evans 	return (0);
2609b50d902SRodney W. Grimes }
2619b50d902SRodney W. Grimes 
/*
 * usage --
 *	Write the command synopsis to standard error and exit with status 1.
 */
static void
usage(void)
{
	(void)fputs("usage: wc [-clmw] [file ...]\n", stderr);
	exit(1);
}
268