1f2155981SBrian Somers /*- 2f2155981SBrian Somers * Copyright (c) 1999 The NetBSD Foundation, Inc. 3f2155981SBrian Somers * All rights reserved. 4f2155981SBrian Somers * 5f2155981SBrian Somers * This code is derived from software contributed to The NetBSD Foundation 6f2155981SBrian Somers * by Klaus Klein. 7f2155981SBrian Somers * 8f2155981SBrian Somers * Redistribution and use in source and binary forms, with or without 9f2155981SBrian Somers * modification, are permitted provided that the following conditions 10f2155981SBrian Somers * are met: 11f2155981SBrian Somers * 1. Redistributions of source code must retain the above copyright 12f2155981SBrian Somers * notice, this list of conditions and the following disclaimer. 13f2155981SBrian Somers * 2. Redistributions in binary form must reproduce the above copyright 14f2155981SBrian Somers * notice, this list of conditions and the following disclaimer in the 15f2155981SBrian Somers * documentation and/or other materials provided with the distribution. 16f2155981SBrian Somers * 3. All advertising materials mentioning features or use of this software 17f2155981SBrian Somers * must display the following acknowledgement: 18f2155981SBrian Somers * This product includes software developed by the NetBSD 19f2155981SBrian Somers * Foundation, Inc. and its contributors. 20f2155981SBrian Somers * 4. Neither the name of The NetBSD Foundation nor the names of its 21f2155981SBrian Somers * contributors may be used to endorse or promote products derived 22f2155981SBrian Somers * from this software without specific prior written permission. 23f2155981SBrian Somers * 24f2155981SBrian Somers * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS 25f2155981SBrian Somers * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED 26f2155981SBrian Somers * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 27f2155981SBrian Somers * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS 28f2155981SBrian Somers * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 29f2155981SBrian Somers * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 30f2155981SBrian Somers * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 31f2155981SBrian Somers * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 32f2155981SBrian Somers * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 33f2155981SBrian Somers * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 34f2155981SBrian Somers * POSSIBILITY OF SUCH DAMAGE. 35f2155981SBrian Somers */ 36f2155981SBrian Somers 37f2155981SBrian Somers #include <sys/cdefs.h> 38f2155981SBrian Somers #ifndef lint 39f2155981SBrian Somers __COPYRIGHT( 40f2155981SBrian Somers "@(#) Copyright (c) 1999\ 41f2155981SBrian Somers The NetBSD Foundation, Inc. All rights reserved."); 42f2155981SBrian Somers __RCSID("$FreeBSD$"); 43f2155981SBrian Somers #endif 44f2155981SBrian Somers 45f2155981SBrian Somers #include <sys/types.h> 46f2155981SBrian Somers 47f1e20ff7STim J. Robbins #include <err.h> 48f2155981SBrian Somers #include <errno.h> 49f2155981SBrian Somers #include <limits.h> 50f2155981SBrian Somers #include <locale.h> 51f2155981SBrian Somers #include <regex.h> 52f2155981SBrian Somers #include <stdio.h> 53f2155981SBrian Somers #include <stdlib.h> 54f2155981SBrian Somers #include <string.h> 55f2155981SBrian Somers #include <unistd.h> 56f2155981SBrian Somers 57f2155981SBrian Somers typedef enum { 58f2155981SBrian Somers number_all, /* number all lines */ 59f2155981SBrian Somers number_nonempty, /* number non-empty lines */ 60f2155981SBrian Somers number_none, /* no line numbering */ 61f2155981SBrian Somers number_regex /* number lines matching regular expression */ 62f2155981SBrian Somers } numbering_type; 63f2155981SBrian Somers 64f2155981SBrian Somers struct numbering_property { 65f2155981SBrian Somers const char * const name; /* for diagnostics */ 66f2155981SBrian Somers numbering_type type; /* numbering type */ 67f2155981SBrian Somers regex_t expr; /* for type == number_regex */ 68f2155981SBrian Somers }; 69f2155981SBrian Somers 70f2155981SBrian Somers /* line numbering formats */ 71f2155981SBrian Somers #define FORMAT_LN "%-*d" /* left justified, leading zeros suppressed */ 72f2155981SBrian Somers #define FORMAT_RN "%*d" /* right justified, leading zeros suppressed */ 73f2155981SBrian Somers #define FORMAT_RZ "%0*d" /* right justified, leading zeros kept */ 74f2155981SBrian Somers 75f2155981SBrian Somers #define FOOTER 0 76f2155981SBrian Somers #define BODY 1 77f2155981SBrian Somers #define HEADER 2 78f2155981SBrian Somers #define NP_LAST HEADER 79f2155981SBrian Somers 80f2155981SBrian Somers static struct numbering_property numbering_properties[NP_LAST + 1] = { 81f2155981SBrian Somers { "footer", number_none }, 82f2155981SBrian Somers { "body", number_nonempty }, 83f2155981SBrian Somers { "header", number_none } 84f2155981SBrian Somers }; 85f2155981SBrian Somers 86f2155981SBrian Somers #define max(a, b) ((a) > (b) ? (a) : (b)) 87f2155981SBrian Somers 88f2155981SBrian Somers /* 89f2155981SBrian Somers * Maximum number of characters required for a decimal representation of a 90f2155981SBrian Somers * (signed) int; courtesy of tzcode. 91f2155981SBrian Somers */ 92f2155981SBrian Somers #define INT_STRLEN_MAXIMUM \ 93f2155981SBrian Somers ((sizeof (int) * CHAR_BIT - 1) * 302 / 1000 + 2) 94f2155981SBrian Somers 95d3cb5dedSWarner Losh static void filter(void); 96d3cb5dedSWarner Losh static void parse_numbering(const char *, int); 97d3cb5dedSWarner Losh static void usage(void); 98f2155981SBrian Somers 99f2155981SBrian Somers /* 100f2155981SBrian Somers * Pointer to dynamically allocated input line buffer, and its size. 101f2155981SBrian Somers */ 102f2155981SBrian Somers static char *buffer; 103f2155981SBrian Somers static size_t buffersize; 104f2155981SBrian Somers 105f2155981SBrian Somers /* 106f2155981SBrian Somers * Dynamically allocated buffer suitable for string representation of ints. 107f2155981SBrian Somers */ 108f2155981SBrian Somers static char *intbuffer; 109f2155981SBrian Somers 110f2155981SBrian Somers /* 111f2155981SBrian Somers * Configurable parameters. 112f2155981SBrian Somers */ 113f2155981SBrian Somers /* delimiter characters that indicate the start of a logical page section */ 114f2155981SBrian Somers static char delim[2] = { '\\', ':' }; 115f2155981SBrian Somers 116f2155981SBrian Somers /* line numbering format */ 117f2155981SBrian Somers static const char *format = FORMAT_RN; 118f2155981SBrian Somers 119f2155981SBrian Somers /* increment value used to number logical page lines */ 120f2155981SBrian Somers static int incr = 1; 121f2155981SBrian Somers 122f2155981SBrian Somers /* number of adjacent blank lines to be considered (and numbered) as one */ 123f2155981SBrian Somers static unsigned int nblank = 1; 124f2155981SBrian Somers 125f2155981SBrian Somers /* whether to restart numbering at logical page delimiters */ 126f2155981SBrian Somers static int restart = 1; 127f2155981SBrian Somers 128f2155981SBrian Somers /* characters used in separating the line number and the corrsp. text line */ 129f2155981SBrian Somers static const char *sep = "\t"; 130f2155981SBrian Somers 131f2155981SBrian Somers /* initial value used to number logical page lines */ 132f2155981SBrian Somers static int startnum = 1; 133f2155981SBrian Somers 134f2155981SBrian Somers /* number of characters to be used for the line number */ 135f2155981SBrian Somers /* should be unsigned but required signed by `*' precision conversion */ 136f2155981SBrian Somers static int width = 6; 137f2155981SBrian Somers 138f2155981SBrian Somers 139f2155981SBrian Somers int 140f2155981SBrian Somers main(argc, argv) 141f2155981SBrian Somers int argc; 142f2155981SBrian Somers char *argv[]; 143f2155981SBrian Somers { 144f2155981SBrian Somers int c; 145f2155981SBrian Somers long val; 146f2155981SBrian Somers unsigned long uval; 147f2155981SBrian Somers char *ep; 148f2155981SBrian Somers size_t intbuffersize; 149f2155981SBrian Somers 150f2155981SBrian Somers (void)setlocale(LC_ALL, ""); 151f2155981SBrian Somers 152f2155981SBrian Somers while ((c = getopt(argc, argv, "pb:d:f:h:i:l:n:s:v:w:")) != -1) { 153f2155981SBrian Somers switch (c) { 154f2155981SBrian Somers case 'p': 155f2155981SBrian Somers restart = 0; 156f2155981SBrian Somers break; 157f2155981SBrian Somers case 'b': 158f2155981SBrian Somers parse_numbering(optarg, BODY); 159f2155981SBrian Somers break; 160f2155981SBrian Somers case 'd': 161f2155981SBrian Somers if (optarg[0] != '\0') 162f2155981SBrian Somers delim[0] = optarg[0]; 163f2155981SBrian Somers if (optarg[1] != '\0') 164f2155981SBrian Somers delim[1] = optarg[1]; 165f2155981SBrian Somers /* at most two delimiter characters */ 166f2155981SBrian Somers if (optarg[2] != '\0') { 16753e29ec5STim J. Robbins errx(EXIT_FAILURE, 16853e29ec5STim J. Robbins "invalid delim argument -- %s", 169f2155981SBrian Somers optarg); 170f2155981SBrian Somers /* NOTREACHED */ 171f2155981SBrian Somers } 172f2155981SBrian Somers break; 173f2155981SBrian Somers case 'f': 174f2155981SBrian Somers parse_numbering(optarg, FOOTER); 175f2155981SBrian Somers break; 176f2155981SBrian Somers case 'h': 177f2155981SBrian Somers parse_numbering(optarg, HEADER); 178f2155981SBrian Somers break; 179f2155981SBrian Somers case 'i': 180f2155981SBrian Somers errno = 0; 181f2155981SBrian Somers val = strtol(optarg, &ep, 10); 182f2155981SBrian Somers if ((ep != NULL && *ep != '\0') || 18353e29ec5STim J. Robbins ((val == LONG_MIN || val == LONG_MAX) && errno != 0)) 18453e29ec5STim J. Robbins errx(EXIT_FAILURE, 18553e29ec5STim J. Robbins "invalid incr argument -- %s", optarg); 186f2155981SBrian Somers incr = (int)val; 187f2155981SBrian Somers break; 188f2155981SBrian Somers case 'l': 189f2155981SBrian Somers errno = 0; 190f2155981SBrian Somers uval = strtoul(optarg, &ep, 10); 191f2155981SBrian Somers if ((ep != NULL && *ep != '\0') || 19253e29ec5STim J. Robbins (uval == ULONG_MAX && errno != 0)) 19353e29ec5STim J. Robbins errx(EXIT_FAILURE, 19453e29ec5STim J. Robbins "invalid num argument -- %s", optarg); 195f2155981SBrian Somers nblank = (unsigned int)uval; 196f2155981SBrian Somers break; 197f2155981SBrian Somers case 'n': 198f2155981SBrian Somers if (strcmp(optarg, "ln") == 0) { 199f2155981SBrian Somers format = FORMAT_LN; 200f2155981SBrian Somers } else if (strcmp(optarg, "rn") == 0) { 201f2155981SBrian Somers format = FORMAT_RN; 202f2155981SBrian Somers } else if (strcmp(optarg, "rz") == 0) { 203f2155981SBrian Somers format = FORMAT_RZ; 20453e29ec5STim J. Robbins } else 20553e29ec5STim J. Robbins errx(EXIT_FAILURE, 20653e29ec5STim J. Robbins "illegal format -- %s", optarg); 207f2155981SBrian Somers break; 208f2155981SBrian Somers case 's': 209f2155981SBrian Somers sep = optarg; 210f2155981SBrian Somers break; 211f2155981SBrian Somers case 'v': 212f2155981SBrian Somers errno = 0; 213f2155981SBrian Somers val = strtol(optarg, &ep, 10); 214f2155981SBrian Somers if ((ep != NULL && *ep != '\0') || 21553e29ec5STim J. Robbins ((val == LONG_MIN || val == LONG_MAX) && errno != 0)) 21653e29ec5STim J. Robbins errx(EXIT_FAILURE, 21753e29ec5STim J. Robbins "invalid startnum value -- %s", optarg); 218f2155981SBrian Somers startnum = (int)val; 219f2155981SBrian Somers break; 220f2155981SBrian Somers case 'w': 221f2155981SBrian Somers errno = 0; 222f2155981SBrian Somers val = strtol(optarg, &ep, 10); 223f2155981SBrian Somers if ((ep != NULL && *ep != '\0') || 22453e29ec5STim J. Robbins ((val == LONG_MIN || val == LONG_MAX) && errno != 0)) 22553e29ec5STim J. Robbins errx(EXIT_FAILURE, 22653e29ec5STim J. Robbins "invalid width value -- %s", optarg); 227f2155981SBrian Somers width = (int)val; 22853e29ec5STim J. Robbins if (!(width > 0)) 22953e29ec5STim J. Robbins errx(EXIT_FAILURE, 23053e29ec5STim J. Robbins "width argument must be > 0 -- %d", 231f2155981SBrian Somers width); 232f2155981SBrian Somers break; 233f2155981SBrian Somers case '?': 234f2155981SBrian Somers default: 235f2155981SBrian Somers usage(); 236f2155981SBrian Somers /* NOTREACHED */ 237f2155981SBrian Somers } 238f2155981SBrian Somers } 239f2155981SBrian Somers argc -= optind; 240f2155981SBrian Somers argv += optind; 241f2155981SBrian Somers 242f2155981SBrian Somers switch (argc) { 243f2155981SBrian Somers case 0: 244f2155981SBrian Somers break; 245f2155981SBrian Somers case 1: 246f1e20ff7STim J. Robbins if (freopen(argv[0], "r", stdin) == NULL) 247f1e20ff7STim J. Robbins err(EXIT_FAILURE, "%s", argv[0]); 248f2155981SBrian Somers break; 249f2155981SBrian Somers default: 250f2155981SBrian Somers usage(); 251f2155981SBrian Somers /* NOTREACHED */ 252f2155981SBrian Somers } 253f2155981SBrian Somers 254f2155981SBrian Somers /* Determine the maximum input line length to operate on. */ 255f2155981SBrian Somers if ((val = sysconf(_SC_LINE_MAX)) == -1) /* ignore errno */ 256f2155981SBrian Somers val = LINE_MAX; 257f2155981SBrian Somers /* Allocate sufficient buffer space (including the terminating NUL). */ 258f2155981SBrian Somers buffersize = (size_t)val + 1; 259f1e20ff7STim J. Robbins if ((buffer = malloc(buffersize)) == NULL) 260f1e20ff7STim J. Robbins err(EXIT_FAILURE, "cannot allocate input line buffer"); 261f2155981SBrian Somers 262f2155981SBrian Somers /* Allocate a buffer suitable for preformatting line number. */ 263f2155981SBrian Somers intbuffersize = max(INT_STRLEN_MAXIMUM, width) + 1; /* NUL */ 264f1e20ff7STim J. Robbins if ((intbuffer = malloc(intbuffersize)) == NULL) 265f1e20ff7STim J. Robbins err(EXIT_FAILURE, "cannot allocate preformatting buffer"); 266f2155981SBrian Somers 267f2155981SBrian Somers /* Do the work. */ 268f2155981SBrian Somers filter(); 269f2155981SBrian Somers 270f2155981SBrian Somers exit(EXIT_SUCCESS); 271f2155981SBrian Somers /* NOTREACHED */ 272f2155981SBrian Somers } 273f2155981SBrian Somers 274f2155981SBrian Somers static void 275f2155981SBrian Somers filter() 276f2155981SBrian Somers { 277f2155981SBrian Somers int line; /* logical line number */ 278f2155981SBrian Somers int section; /* logical page section */ 279f2155981SBrian Somers unsigned int adjblank; /* adjacent blank lines */ 280f2155981SBrian Somers int consumed; /* intbuffer measurement */ 281f2155981SBrian Somers int donumber, idx; 282f2155981SBrian Somers 283f2155981SBrian Somers adjblank = 0; 284f2155981SBrian Somers line = startnum; 285f2155981SBrian Somers section = BODY; 286f2155981SBrian Somers #ifdef __GNUC__ 287f2155981SBrian Somers (void)&donumber; /* avoid bogus `uninitialized' warning */ 288f2155981SBrian Somers #endif 289f2155981SBrian Somers 290f2155981SBrian Somers while (fgets(buffer, (int)buffersize, stdin) != NULL) { 291f2155981SBrian Somers for (idx = FOOTER; idx <= NP_LAST; idx++) { 292f2155981SBrian Somers /* Does it look like a delimiter? */ 293f2155981SBrian Somers if (buffer[2 * idx + 0] == delim[0] && 294f2155981SBrian Somers buffer[2 * idx + 1] == delim[1]) { 295f2155981SBrian Somers /* Was this the whole line? */ 296f2155981SBrian Somers if (buffer[2 * idx + 2] == '\n') { 297f2155981SBrian Somers section = idx; 298f2155981SBrian Somers adjblank = 0; 299f2155981SBrian Somers if (restart) 300f2155981SBrian Somers line = startnum; 301f2155981SBrian Somers goto nextline; 302f2155981SBrian Somers } 303f2155981SBrian Somers } else { 304f2155981SBrian Somers break; 305f2155981SBrian Somers } 306f2155981SBrian Somers } 307f2155981SBrian Somers 308f2155981SBrian Somers switch (numbering_properties[section].type) { 309f2155981SBrian Somers case number_all: 310f2155981SBrian Somers /* 311f2155981SBrian Somers * Doing this for number_all only is disputable, but 312f2155981SBrian Somers * the standard expresses an explicit dependency on 313f2155981SBrian Somers * `-b a' etc. 314f2155981SBrian Somers */ 315f2155981SBrian Somers if (buffer[0] == '\n' && ++adjblank < nblank) 316f2155981SBrian Somers donumber = 0; 317f2155981SBrian Somers else 318f2155981SBrian Somers donumber = 1, adjblank = 0; 319f2155981SBrian Somers break; 320f2155981SBrian Somers case number_nonempty: 321f2155981SBrian Somers donumber = (buffer[0] != '\n'); 322f2155981SBrian Somers break; 323f2155981SBrian Somers case number_none: 324f2155981SBrian Somers donumber = 0; 325f2155981SBrian Somers break; 326f2155981SBrian Somers case number_regex: 327f2155981SBrian Somers donumber = 328f2155981SBrian Somers (regexec(&numbering_properties[section].expr, 329f2155981SBrian Somers buffer, 0, NULL, 0) == 0); 330f2155981SBrian Somers break; 331f2155981SBrian Somers } 332f2155981SBrian Somers 333f2155981SBrian Somers if (donumber) { 334f2155981SBrian Somers /* Note: sprintf() is safe here. */ 335f2155981SBrian Somers consumed = sprintf(intbuffer, format, width, line); 336f2155981SBrian Somers (void)printf("%s", 337f2155981SBrian Somers intbuffer + max(0, consumed - width)); 338f2155981SBrian Somers line += incr; 339f2155981SBrian Somers } else { 340f2155981SBrian Somers (void)printf("%*s", width, ""); 341f2155981SBrian Somers } 342f2155981SBrian Somers (void)printf("%s%s", sep, buffer); 343f2155981SBrian Somers 344f1e20ff7STim J. Robbins if (ferror(stdout)) 345f1e20ff7STim J. Robbins err(EXIT_FAILURE, "output error"); 346f2155981SBrian Somers nextline: 347f2155981SBrian Somers ; 348f2155981SBrian Somers } 349f2155981SBrian Somers 350f1e20ff7STim J. Robbins if (ferror(stdin)) 351f1e20ff7STim J. Robbins err(EXIT_FAILURE, "input error"); 352f2155981SBrian Somers } 353f2155981SBrian Somers 354f2155981SBrian Somers /* 355f2155981SBrian Somers * Various support functions. 356f2155981SBrian Somers */ 357f2155981SBrian Somers 358f2155981SBrian Somers static void 359f2155981SBrian Somers parse_numbering(argstr, section) 360f2155981SBrian Somers const char *argstr; 361f2155981SBrian Somers int section; 362f2155981SBrian Somers { 363f2155981SBrian Somers int error; 364f2155981SBrian Somers char errorbuf[NL_TEXTMAX]; 365f2155981SBrian Somers 366f2155981SBrian Somers switch (argstr[0]) { 367f2155981SBrian Somers case 'a': 368f2155981SBrian Somers numbering_properties[section].type = number_all; 369f2155981SBrian Somers break; 370f2155981SBrian Somers case 'n': 371f2155981SBrian Somers numbering_properties[section].type = number_none; 372f2155981SBrian Somers break; 373f2155981SBrian Somers case 't': 374f2155981SBrian Somers numbering_properties[section].type = number_nonempty; 375f2155981SBrian Somers break; 376f2155981SBrian Somers case 'p': 377f2155981SBrian Somers /* If there was a previous expression, throw it away. */ 378f2155981SBrian Somers if (numbering_properties[section].type == number_regex) 379f2155981SBrian Somers regfree(&numbering_properties[section].expr); 380f2155981SBrian Somers else 381f2155981SBrian Somers numbering_properties[section].type = number_regex; 382f2155981SBrian Somers 383f2155981SBrian Somers /* Compile/validate the supplied regular expression. */ 384f2155981SBrian Somers if ((error = regcomp(&numbering_properties[section].expr, 385f2155981SBrian Somers &argstr[1], REG_NEWLINE|REG_NOSUB)) != 0) { 386f2155981SBrian Somers (void)regerror(error, 387f2155981SBrian Somers &numbering_properties[section].expr, 388f2155981SBrian Somers errorbuf, sizeof (errorbuf)); 38953e29ec5STim J. Robbins errx(EXIT_FAILURE, 39053e29ec5STim J. Robbins "%s expr: %s -- %s", 391f2155981SBrian Somers numbering_properties[section].name, errorbuf, 392f2155981SBrian Somers &argstr[1]); 393f2155981SBrian Somers } 394f2155981SBrian Somers break; 395f2155981SBrian Somers default: 39653e29ec5STim J. Robbins errx(EXIT_FAILURE, 39753e29ec5STim J. Robbins "illegal %s line numbering type -- %s", 398f2155981SBrian Somers numbering_properties[section].name, argstr); 399f2155981SBrian Somers } 400f2155981SBrian Somers } 401f2155981SBrian Somers 402f2155981SBrian Somers static void 403f2155981SBrian Somers usage() 404f2155981SBrian Somers { 405f2155981SBrian Somers 4067007f3d6STim J. Robbins (void)fprintf(stderr, 4077007f3d6STim J. Robbins "usage: nl [-p] [-b type] [-d delim] [-f type] [-h type] [-i incr] [-l num]\n" 4087007f3d6STim J. Robbins " [-n format] [-s sep] [-v startnum] [-w width] [file]\n"); 409f2155981SBrian Somers exit(EXIT_FAILURE); 410f2155981SBrian Somers } 411