xref: /freebsd/usr.bin/wc/wc.c (revision 3f330d7d1a3fe98c53faf01d0f30c0a9fbb37c41)
19b50d902SRodney W. Grimes /*
29b50d902SRodney W. Grimes  * Copyright (c) 1980, 1987, 1991, 1993
39b50d902SRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
49b50d902SRodney W. Grimes  *
59b50d902SRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
69b50d902SRodney W. Grimes  * modification, are permitted provided that the following conditions
79b50d902SRodney W. Grimes  * are met:
89b50d902SRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
99b50d902SRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
109b50d902SRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
119b50d902SRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
129b50d902SRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
139b50d902SRodney W. Grimes  * 3. All advertising materials mentioning features or use of this software
149b50d902SRodney W. Grimes  *    must display the following acknowledgement:
159b50d902SRodney W. Grimes  *	This product includes software developed by the University of
169b50d902SRodney W. Grimes  *	California, Berkeley and its contributors.
179b50d902SRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
189b50d902SRodney W. Grimes  *    may be used to endorse or promote products derived from this software
199b50d902SRodney W. Grimes  *    without specific prior written permission.
209b50d902SRodney W. Grimes  *
219b50d902SRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
229b50d902SRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
239b50d902SRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
249b50d902SRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
259b50d902SRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
269b50d902SRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
279b50d902SRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
289b50d902SRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
299b50d902SRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
309b50d902SRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
319b50d902SRodney W. Grimes  * SUCH DAMAGE.
329b50d902SRodney W. Grimes  */
339b50d902SRodney W. Grimes 
#ifndef lint
/* Copyright notice string; compiled only when lint is not defined. */
static const char copyright[] =
    "@(#) Copyright (c) 1980, 1987, 1991, 1993\n"
    "\tThe Regents of the University of California.  All rights reserved.\n";
#endif /* not lint */

/* Historical SCCS identification string, compiled out by the #if 0. */
#if 0
#ifndef lint
static char sccsid[] = "@(#)wc.c	8.1 (Berkeley) 6/6/93";
#endif /* not lint */
#endif
459b50d902SRodney W. Grimes 
46a821e36eSMike Barcroft #include <sys/cdefs.h>
47a821e36eSMike Barcroft __FBSDID("$FreeBSD$");
48a821e36eSMike Barcroft 
499b50d902SRodney W. Grimes #include <sys/param.h>
509b50d902SRodney W. Grimes #include <sys/stat.h>
512c51e5edSBruce Evans 
522c51e5edSBruce Evans #include <ctype.h>
532c51e5edSBruce Evans #include <err.h>
549b50d902SRodney W. Grimes #include <fcntl.h>
55ae6fa8aeSAndrey A. Chernov #include <locale.h>
56a821e36eSMike Barcroft #include <stdint.h>
579b50d902SRodney W. Grimes #include <stdio.h>
589b50d902SRodney W. Grimes #include <stdlib.h>
599b50d902SRodney W. Grimes #include <string.h>
602c51e5edSBruce Evans #include <unistd.h>
619b50d902SRodney W. Grimes 
/*
 * Running totals over all operands; main() prints them on the "total"
 * line when more than one operand was given.
 */
static uintmax_t tlinect, twordct, tcharct;
/*
 * Nonzero when the line (-l), word (-w) and byte (-c) counts are
 * selected.  main() turns all three on when no option is given.
 */
static int doline, doword, dochar;

static int	cnt(const char *);
static void	usage(void);
679b50d902SRodney W. Grimes 
689b50d902SRodney W. Grimes int
699b50d902SRodney W. Grimes main(argc, argv)
709b50d902SRodney W. Grimes 	int argc;
719b50d902SRodney W. Grimes 	char *argv[];
729b50d902SRodney W. Grimes {
73a0cf59e6SSheldon Hearn 	int ch, errors, total;
749b50d902SRodney W. Grimes 
75ae6fa8aeSAndrey A. Chernov 	(void) setlocale(LC_CTYPE, "");
76ae6fa8aeSAndrey A. Chernov 
771c8af878SWarner Losh 	while ((ch = getopt(argc, argv, "lwc")) != -1)
789b50d902SRodney W. Grimes 		switch((char)ch) {
799b50d902SRodney W. Grimes 		case 'l':
809b50d902SRodney W. Grimes 			doline = 1;
819b50d902SRodney W. Grimes 			break;
829b50d902SRodney W. Grimes 		case 'w':
839b50d902SRodney W. Grimes 			doword = 1;
849b50d902SRodney W. Grimes 			break;
859b50d902SRodney W. Grimes 		case 'c':
869b50d902SRodney W. Grimes 			dochar = 1;
879b50d902SRodney W. Grimes 			break;
889b50d902SRodney W. Grimes 		case '?':
899b50d902SRodney W. Grimes 		default:
909b50d902SRodney W. Grimes 			usage();
919b50d902SRodney W. Grimes 		}
929b50d902SRodney W. Grimes 	argv += optind;
939b50d902SRodney W. Grimes 	argc -= optind;
949b50d902SRodney W. Grimes 
959b50d902SRodney W. Grimes 	/* Wc's flags are on by default. */
969b50d902SRodney W. Grimes 	if (doline + doword + dochar == 0)
979b50d902SRodney W. Grimes 		doline = doword = dochar = 1;
989b50d902SRodney W. Grimes 
992c51e5edSBruce Evans 	errors = 0;
1009b50d902SRodney W. Grimes 	total = 0;
1019b50d902SRodney W. Grimes 	if (!*argv) {
1022c51e5edSBruce Evans 		if (cnt((char *)NULL) != 0)
1032c51e5edSBruce Evans 			++errors;
1042c51e5edSBruce Evans 		else
1059b50d902SRodney W. Grimes 			(void)printf("\n");
1069b50d902SRodney W. Grimes 	}
1079b50d902SRodney W. Grimes 	else do {
1082c51e5edSBruce Evans 		if (cnt(*argv) != 0)
1092c51e5edSBruce Evans 			++errors;
1102c51e5edSBruce Evans 		else
1119b50d902SRodney W. Grimes 			(void)printf(" %s\n", *argv);
1129b50d902SRodney W. Grimes 		++total;
1139b50d902SRodney W. Grimes 	} while(*++argv);
1149b50d902SRodney W. Grimes 
1159b50d902SRodney W. Grimes 	if (total > 1) {
1169b50d902SRodney W. Grimes 		if (doline)
117a821e36eSMike Barcroft 			(void)printf(" %7ju", tlinect);
1189b50d902SRodney W. Grimes 		if (doword)
119a821e36eSMike Barcroft 			(void)printf(" %7ju", twordct);
1209b50d902SRodney W. Grimes 		if (dochar)
121a821e36eSMike Barcroft 			(void)printf(" %7ju", tcharct);
1229b50d902SRodney W. Grimes 		(void)printf(" total\n");
1239b50d902SRodney W. Grimes 	}
1242c51e5edSBruce Evans 	exit(errors == 0 ? 0 : 1);
1259b50d902SRodney W. Grimes }
1269b50d902SRodney W. Grimes 
127a821e36eSMike Barcroft static int
1289b50d902SRodney W. Grimes cnt(file)
1297a8fb588SMark Murray 	const char *file;
1309b50d902SRodney W. Grimes {
1319b50d902SRodney W. Grimes 	struct stat sb;
132a821e36eSMike Barcroft 	uintmax_t linect, wordct, charct;
133a0cf59e6SSheldon Hearn 	int fd, len;
134a0cf59e6SSheldon Hearn 	short gotsp;
135a0cf59e6SSheldon Hearn 	u_char *p;
136a0cf59e6SSheldon Hearn 	u_char buf[MAXBSIZE], ch;
1379b50d902SRodney W. Grimes 
1389b50d902SRodney W. Grimes 	linect = wordct = charct = 0;
1392c51e5edSBruce Evans 	if (file == NULL) {
1402c51e5edSBruce Evans 		file = "stdin";
1412c51e5edSBruce Evans 		fd = STDIN_FILENO;
1422c51e5edSBruce Evans 	} else {
143a0d038a4SWolfram Schneider 		if ((fd = open(file, O_RDONLY, 0)) < 0) {
1442c51e5edSBruce Evans 			warn("%s: open", file);
1452c51e5edSBruce Evans 			return (1);
146a0d038a4SWolfram Schneider 		}
1479b50d902SRodney W. Grimes 		if (doword)
1489b50d902SRodney W. Grimes 			goto word;
1499b50d902SRodney W. Grimes 		/*
1509b50d902SRodney W. Grimes 		 * Line counting is split out because it's a lot faster to get
1519b50d902SRodney W. Grimes 		 * lines than to get words, since the word count requires some
1529b50d902SRodney W. Grimes 		 * logic.
1539b50d902SRodney W. Grimes 		 */
1549b50d902SRodney W. Grimes 		if (doline) {
1558c85cce7SPhilippe Charnier 			while ((len = read(fd, buf, MAXBSIZE))) {
1562c51e5edSBruce Evans 				if (len == -1) {
1572c51e5edSBruce Evans 					warn("%s: read", file);
1582c51e5edSBruce Evans 					(void)close(fd);
1592c51e5edSBruce Evans 					return (1);
1602c51e5edSBruce Evans 				}
1619b50d902SRodney W. Grimes 				charct += len;
1629b50d902SRodney W. Grimes 				for (p = buf; len--; ++p)
1639b50d902SRodney W. Grimes 					if (*p == '\n')
1649b50d902SRodney W. Grimes 						++linect;
1659b50d902SRodney W. Grimes 			}
1669b50d902SRodney W. Grimes 			tlinect += linect;
167a821e36eSMike Barcroft 			(void)printf(" %7ju", linect);
1689b50d902SRodney W. Grimes 			if (dochar) {
1699b50d902SRodney W. Grimes 				tcharct += charct;
170a821e36eSMike Barcroft 				(void)printf(" %7ju", charct);
1719b50d902SRodney W. Grimes 			}
1729b50d902SRodney W. Grimes 			(void)close(fd);
1732c51e5edSBruce Evans 			return (0);
1749b50d902SRodney W. Grimes 		}
1759b50d902SRodney W. Grimes 		/*
1769b50d902SRodney W. Grimes 		 * If all we need is the number of characters and it's a
1779b50d902SRodney W. Grimes 		 * regular or linked file, just stat the puppy.
1789b50d902SRodney W. Grimes 		 */
1799b50d902SRodney W. Grimes 		if (dochar) {
1802c51e5edSBruce Evans 			if (fstat(fd, &sb)) {
1812c51e5edSBruce Evans 				warn("%s: fstat", file);
1822c51e5edSBruce Evans 				(void)close(fd);
1832c51e5edSBruce Evans 				return (1);
1842c51e5edSBruce Evans 			}
1859b50d902SRodney W. Grimes 			if (S_ISREG(sb.st_mode) || S_ISLNK(sb.st_mode)) {
186a0cf59e6SSheldon Hearn 				(void)printf(" %7lld", (long long)sb.st_size);
1879b50d902SRodney W. Grimes 				tcharct += sb.st_size;
1889b50d902SRodney W. Grimes 				(void)close(fd);
1892c51e5edSBruce Evans 				return (0);
1909b50d902SRodney W. Grimes 			}
1919b50d902SRodney W. Grimes 		}
1929b50d902SRodney W. Grimes 	}
1939b50d902SRodney W. Grimes 
1949b50d902SRodney W. Grimes 	/* Do it the hard way... */
1958c85cce7SPhilippe Charnier word:	for (gotsp = 1; (len = read(fd, buf, MAXBSIZE));) {
1962c51e5edSBruce Evans 		if (len == -1) {
1972c51e5edSBruce Evans 			warn("%s: read", file);
1982c51e5edSBruce Evans 			(void)close(fd);
1992c51e5edSBruce Evans 			return (1);
2002c51e5edSBruce Evans 		}
2019b50d902SRodney W. Grimes 		/*
2029b50d902SRodney W. Grimes 		 * This loses in the presence of multi-byte characters.
2039b50d902SRodney W. Grimes 		 * To do it right would require a function to return a
2049b50d902SRodney W. Grimes 		 * character while knowing how many bytes it consumed.
2059b50d902SRodney W. Grimes 		 */
2069b50d902SRodney W. Grimes 		charct += len;
2079b50d902SRodney W. Grimes 		for (p = buf; len--;) {
2089b50d902SRodney W. Grimes 			ch = *p++;
2099b50d902SRodney W. Grimes 			if (ch == '\n')
2109b50d902SRodney W. Grimes 				++linect;
2119b50d902SRodney W. Grimes 			if (isspace(ch))
2129b50d902SRodney W. Grimes 				gotsp = 1;
2139b50d902SRodney W. Grimes 			else if (gotsp) {
2149b50d902SRodney W. Grimes 				gotsp = 0;
2159b50d902SRodney W. Grimes 				++wordct;
2169b50d902SRodney W. Grimes 			}
2179b50d902SRodney W. Grimes 		}
2189b50d902SRodney W. Grimes 	}
2199b50d902SRodney W. Grimes 	if (doline) {
2209b50d902SRodney W. Grimes 		tlinect += linect;
221a821e36eSMike Barcroft 		(void)printf(" %7ju", linect);
2229b50d902SRodney W. Grimes 	}
2239b50d902SRodney W. Grimes 	if (doword) {
2249b50d902SRodney W. Grimes 		twordct += wordct;
225a821e36eSMike Barcroft 		(void)printf(" %7ju", wordct);
2269b50d902SRodney W. Grimes 	}
2279b50d902SRodney W. Grimes 	if (dochar) {
2289b50d902SRodney W. Grimes 		tcharct += charct;
229a821e36eSMike Barcroft 		(void)printf(" %7ju", charct);
2309b50d902SRodney W. Grimes 	}
2319b50d902SRodney W. Grimes 	(void)close(fd);
2322c51e5edSBruce Evans 	return (0);
2339b50d902SRodney W. Grimes }
2349b50d902SRodney W. Grimes 
/*
 * Print the usage synopsis on standard error and exit with status 1.
 * Does not return.
 */
static void
usage(void)
{
	(void)fprintf(stderr, "usage: wc [-clw] [file ...]\n");
	exit(1);
}
241