1 /* 2 * Copyright (c) 1980, 1987, 1991, 1993 3 * The Regents of the University of California. All rights reserved. 4 * 5 * Redistribution and use in source and binary forms, with or without 6 * modification, are permitted provided that the following conditions 7 * are met: 8 * 1. Redistributions of source code must retain the above copyright 9 * notice, this list of conditions and the following disclaimer. 10 * 2. Redistributions in binary form must reproduce the above copyright 11 * notice, this list of conditions and the following disclaimer in the 12 * documentation and/or other materials provided with the distribution. 13 * 3. All advertising materials mentioning features or use of this software 14 * must display the following acknowledgement: 15 * This product includes software developed by the University of 16 * California, Berkeley and its contributors. 17 * 4. Neither the name of the University nor the names of its contributors 18 * may be used to endorse or promote products derived from this software 19 * without specific prior written permission. 20 * 21 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 22 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 24 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 25 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 26 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 27 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 28 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 29 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 30 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 31 * SUCH DAMAGE. 32 */ 33 34 #ifndef lint 35 static const char copyright[] = 36 "@(#) Copyright (c) 1980, 1987, 1991, 1993\n\ 37 The Regents of the University of California. All rights reserved.\n"; 38 #endif /* not lint */ 39 40 #if 0 41 #ifndef lint 42 static char sccsid[] = "@(#)wc.c 8.1 (Berkeley) 6/6/93"; 43 #endif /* not lint */ 44 #endif 45 46 #include <sys/cdefs.h> 47 __FBSDID("$FreeBSD$"); 48 49 #include <sys/param.h> 50 #include <sys/stat.h> 51 52 #include <ctype.h> 53 #include <err.h> 54 #include <errno.h> 55 #include <fcntl.h> 56 #include <locale.h> 57 #include <stdint.h> 58 #include <stdio.h> 59 #include <stdlib.h> 60 #include <string.h> 61 #include <unistd.h> 62 #include <wctype.h> 63 64 uintmax_t tlinect, twordct, tcharct; 65 int doline, doword, dochar, domulti; 66 67 static int cnt(const char *); 68 static void usage(void); 69 70 int 71 main(argc, argv) 72 int argc; 73 char *argv[]; 74 { 75 int ch, errors, total; 76 77 (void) setlocale(LC_CTYPE, ""); 78 79 while ((ch = getopt(argc, argv, "clmw")) != -1) 80 switch((char)ch) { 81 case 'l': 82 doline = 1; 83 break; 84 case 'w': 85 doword = 1; 86 break; 87 case 'c': 88 dochar = 1; 89 domulti = 0; 90 break; 91 case 'm': 92 domulti = 1; 93 dochar = 0; 94 break; 95 case '?': 96 default: 97 usage(); 98 } 99 argv += optind; 100 argc -= optind; 101 102 /* Wc's flags are on by default. */ 103 if (doline + doword + dochar + domulti == 0) 104 doline = doword = dochar = 1; 105 106 errors = 0; 107 total = 0; 108 if (!*argv) { 109 if (cnt((char *)NULL) != 0) 110 ++errors; 111 else 112 (void)printf("\n"); 113 } 114 else do { 115 if (cnt(*argv) != 0) 116 ++errors; 117 else 118 (void)printf(" %s\n", *argv); 119 ++total; 120 } while(*++argv); 121 122 if (total > 1) { 123 if (doline) 124 (void)printf(" %7ju", tlinect); 125 if (doword) 126 (void)printf(" %7ju", twordct); 127 if (dochar || domulti) 128 (void)printf(" %7ju", tcharct); 129 (void)printf(" total\n"); 130 } 131 exit(errors == 0 ? 0 : 1); 132 } 133 134 static int 135 cnt(file) 136 const char *file; 137 { 138 struct stat sb; 139 uintmax_t linect, wordct, charct; 140 ssize_t nread; 141 int clen, fd, len, warned; 142 short gotsp; 143 u_char *p; 144 u_char buf[MAXBSIZE]; 145 wchar_t wch; 146 147 linect = wordct = charct = 0; 148 if (file == NULL) { 149 file = "stdin"; 150 fd = STDIN_FILENO; 151 } else { 152 if ((fd = open(file, O_RDONLY, 0)) < 0) { 153 warn("%s: open", file); 154 return (1); 155 } 156 if (doword || (domulti && MB_CUR_MAX != 1)) 157 goto word; 158 /* 159 * Line counting is split out because it's a lot faster to get 160 * lines than to get words, since the word count requires some 161 * logic. 162 */ 163 if (doline) { 164 while ((len = read(fd, buf, MAXBSIZE))) { 165 if (len == -1) { 166 warn("%s: read", file); 167 (void)close(fd); 168 return (1); 169 } 170 charct += len; 171 for (p = buf; len--; ++p) 172 if (*p == '\n') 173 ++linect; 174 } 175 tlinect += linect; 176 (void)printf(" %7ju", linect); 177 if (dochar) { 178 tcharct += charct; 179 (void)printf(" %7ju", charct); 180 } 181 (void)close(fd); 182 return (0); 183 } 184 /* 185 * If all we need is the number of characters and it's a 186 * regular file, just stat the puppy. 187 */ 188 if (dochar || domulti) { 189 if (fstat(fd, &sb)) { 190 warn("%s: fstat", file); 191 (void)close(fd); 192 return (1); 193 } 194 if (S_ISREG(sb.st_mode)) { 195 (void)printf(" %7lld", (long long)sb.st_size); 196 tcharct += sb.st_size; 197 (void)close(fd); 198 return (0); 199 } 200 } 201 } 202 203 /* Do it the hard way... */ 204 word: gotsp = 1; 205 len = 0; 206 warned = 0; 207 while ((nread = read(fd, buf + len, MAXBSIZE - len)) != 0) { 208 if (nread == -1) { 209 warn("%s: read", file); 210 (void)close(fd); 211 return (1); 212 } 213 len += nread; 214 p = buf; 215 while (len > 0) { 216 if (!domulti || MB_CUR_MAX == 1) { 217 clen = 1; 218 wch = (unsigned char)*p; 219 } else if ((clen = mbtowc(&wch, p, len)) <= 0) { 220 if (len > MB_CUR_MAX) { 221 clen = 1; 222 wch = (unsigned char)*p; 223 if (!warned) { 224 errno = EILSEQ; 225 warn("%s", file); 226 warned = 1; 227 } 228 } else { 229 memmove(buf, p, len); 230 break; 231 } 232 } 233 charct++; 234 len -= clen; 235 p += clen; 236 if (wch == L'\n') 237 ++linect; 238 if (iswspace(wch)) 239 gotsp = 1; 240 else if (gotsp) { 241 gotsp = 0; 242 ++wordct; 243 } 244 } 245 } 246 if (doline) { 247 tlinect += linect; 248 (void)printf(" %7ju", linect); 249 } 250 if (doword) { 251 twordct += wordct; 252 (void)printf(" %7ju", wordct); 253 } 254 if (dochar || domulti) { 255 tcharct += charct; 256 (void)printf(" %7ju", charct); 257 } 258 (void)close(fd); 259 return (0); 260 } 261 262 static void 263 usage() 264 { 265 (void)fprintf(stderr, "usage: wc [-clmw] [file ...]\n"); 266 exit(1); 267 } 268