1 /* 2 * Copyright (c) 2013 Johann 'Myrkraverk' Oskarsson <johann@myrkraverk.com> 3 * Copyright (c) 2011 Gary Mills 4 * Copyright 2011 Nexenta Systems, Inc. All rights reserved. 5 * Copyright (c) 1992 Diomidis Spinellis. 6 * Copyright (c) 1992, 1993 7 * The Regents of the University of California. All rights reserved. 8 * 9 * This code is derived from software contributed to Berkeley by 10 * Diomidis Spinellis of Imperial College, University of London. 11 * 12 * Redistribution and use in source and binary forms, with or without 13 * modification, are permitted provided that the following conditions 14 * are met: 15 * 1. Redistributions of source code must retain the above copyright 16 * notice, this list of conditions and the following disclaimer. 17 * 2. Redistributions in binary form must reproduce the above copyright 18 * notice, this list of conditions and the following disclaimer in the 19 * documentation and/or other materials provided with the distribution. 20 * 4. Neither the name of the University nor the names of its contributors 21 * may be used to endorse or promote products derived from this software 22 * without specific prior written permission. 23 * 24 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 25 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 26 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 27 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 28 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 29 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 30 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 31 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 32 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 33 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 34 * SUCH DAMAGE. 35 */ 36 37 #include <sys/types.h> 38 #include <sys/mman.h> 39 #include <sys/param.h> 40 #include <sys/stat.h> 41 42 #include <err.h> 43 #include <errno.h> 44 #include <fcntl.h> 45 #include <getopt.h> 46 #include <libgen.h> 47 #include <libintl.h> 48 #include <limits.h> 49 #include <locale.h> 50 #include <regex.h> 51 #include <stddef.h> 52 #include <stdio.h> 53 #include <stdlib.h> 54 #include <string.h> 55 #include <unistd.h> 56 57 #include "defs.h" 58 #include "extern.h" 59 60 /* 61 * Linked list of units (strings and files) to be compiled 62 */ 63 struct s_compunit { 64 struct s_compunit *next; 65 enum e_cut {CU_FILE, CU_STRING} type; 66 char *s; /* Pointer to string or fname */ 67 }; 68 69 /* 70 * Linked list pointer to compilation units and pointer to current 71 * next pointer. 72 */ 73 static struct s_compunit *script, **cu_nextp = &script; 74 75 /* 76 * Linked list of files to be processed 77 */ 78 struct s_flist { 79 char *fname; 80 struct s_flist *next; 81 }; 82 83 /* 84 * Linked list pointer to files and pointer to current 85 * next pointer. 86 */ 87 static struct s_flist *files, **fl_nextp = &files; 88 89 FILE *infile; /* Current input file */ 90 FILE *outfile; /* Current output file */ 91 92 int aflag, eflag, nflag; 93 int rflags = 0; 94 static int rval; /* Exit status */ 95 96 static int ispan; /* Whether inplace editing spans across files */ 97 98 /* 99 * Current file and line number; line numbers restart across compilation 100 * units, but span across input files. The latter is optional if editing 101 * in place. 102 */ 103 const char *fname; /* File name. */ 104 const char *outfname; /* Output file name */ 105 static char oldfname[PATH_MAX]; /* Old file name (for in-place editing) */ 106 static char tmpfname[PATH_MAX]; /* Temporary file name (for in-place editing) */ 107 static const char *inplace; /* Inplace edit file extension. */ 108 ulong_t linenum; 109 110 static const struct option lopts[] = { 111 {"in-place", optional_argument, NULL, 'i'}, 112 {NULL, 0, NULL, 0} 113 }; 114 115 static void add_compunit(enum e_cut, char *); 116 static void add_file(char *); 117 static void usage(void); 118 119 120 int 121 main(int argc, char *argv[]) 122 { 123 int c, fflag; 124 char *temp_arg; 125 126 (void) setlocale(LC_ALL, ""); 127 128 #ifndef TEXT_DOMAIN 129 #define TEXT_DOMAIN "SYS_TEST" 130 #endif 131 (void) textdomain(TEXT_DOMAIN); 132 133 fflag = 0; 134 inplace = NULL; 135 136 while ((c = getopt_long(argc, argv, "EI::ae:f:i::lnr", lopts, NULL)) != 137 -1) 138 switch (c) { 139 case 'r': /* Gnu sed compat */ 140 case 'E': 141 rflags = REG_EXTENDED; 142 break; 143 case 'I': 144 if (optarg != NULL) 145 inplace = optarg; 146 else 147 inplace = ""; 148 ispan = 1; /* span across input files */ 149 break; 150 case 'a': 151 aflag = 1; 152 break; 153 case 'e': 154 eflag = 1; 155 if (asprintf(&temp_arg, "%s\n", optarg) < 1) 156 err(1, "asprintf"); 157 add_compunit(CU_STRING, temp_arg); 158 break; 159 case 'f': 160 fflag = 1; 161 add_compunit(CU_FILE, optarg); 162 break; 163 case 'i': 164 if (optarg != NULL) 165 inplace = optarg; 166 else 167 inplace = ""; 168 ispan = 0; /* don't span across input files */ 169 break; 170 case 'l': 171 /* On SunOS, setlinebuf "returns no useful value */ 172 (void) setlinebuf(stdout); 173 break; 174 case 'n': 175 nflag = 1; 176 break; 177 default: 178 case '?': 179 usage(); 180 } 181 argc -= optind; 182 argv += optind; 183 184 /* First usage case; script is the first arg */ 185 if (!eflag && !fflag && *argv) { 186 add_compunit(CU_STRING, *argv); 187 argv++; 188 } 189 190 compile(); 191 192 /* Continue with first and start second usage */ 193 if (*argv) 194 for (; *argv; argv++) 195 add_file(*argv); 196 else 197 add_file(NULL); 198 process(); 199 cfclose(prog, NULL); 200 if (fclose(stdout)) 201 err(1, "stdout"); 202 return (rval); 203 } 204 205 static void 206 usage(void) 207 { 208 (void) fputs(_("usage: sed script [-Ealn] [-i[extension]] [file...]\n" 209 " sed [-Ealn] [-i[extension]] [-e script]... " 210 "[-f script_file]... [file...]\n"), 211 stderr); 212 exit(1); 213 } 214 215 /* 216 * Like fgets, but go through the chain of compilation units chaining them 217 * together. Empty strings and files are ignored. 218 */ 219 char * 220 cu_fgets(char *buf, int n, int *more) 221 { 222 static enum {ST_EOF, ST_FILE, ST_STRING} state = ST_EOF; 223 static FILE *f; /* Current open file */ 224 static char *s; /* Current pointer inside string */ 225 static char string_ident[30]; 226 char *p; 227 228 again: 229 switch (state) { 230 case ST_EOF: 231 if (script == NULL) { 232 if (more != NULL) 233 *more = 0; 234 return (NULL); 235 } 236 linenum = 0; 237 switch (script->type) { 238 case CU_FILE: 239 if ((f = fopen(script->s, "r")) == NULL) 240 err(1, "%s", script->s); 241 fname = script->s; 242 state = ST_FILE; 243 goto again; 244 case CU_STRING: 245 if (((size_t)snprintf(string_ident, 246 sizeof (string_ident), "\"%s\"", script->s)) >= 247 sizeof (string_ident) - 1) 248 (void) strcpy(string_ident + 249 sizeof (string_ident) - 6, " ...\""); 250 fname = string_ident; 251 s = script->s; 252 state = ST_STRING; 253 goto again; 254 } 255 /*NOTREACHED*/ 256 257 case ST_FILE: 258 if ((p = fgets(buf, n, f)) != NULL) { 259 linenum++; 260 if (linenum == 1 && buf[0] == '#' && buf[1] == 'n') 261 nflag = 1; 262 if (more != NULL) 263 *more = !feof(f); 264 return (p); 265 } 266 script = script->next; 267 (void) fclose(f); 268 state = ST_EOF; 269 goto again; 270 case ST_STRING: 271 if (linenum == 0 && s[0] == '#' && s[1] == 'n') 272 nflag = 1; 273 p = buf; 274 for (;;) { 275 if (n-- <= 1) { 276 *p = '\0'; 277 linenum++; 278 if (more != NULL) 279 *more = 1; 280 return (buf); 281 } 282 switch (*s) { 283 case '\0': 284 state = ST_EOF; 285 if (s == script->s) { 286 script = script->next; 287 goto again; 288 } else { 289 script = script->next; 290 *p = '\0'; 291 linenum++; 292 if (more != NULL) 293 *more = 0; 294 return (buf); 295 } 296 case '\n': 297 *p++ = '\n'; 298 *p = '\0'; 299 s++; 300 linenum++; 301 if (more != NULL) 302 *more = 0; 303 return (buf); 304 default: 305 *p++ = *s++; 306 } 307 } 308 } 309 /* NOTREACHED */ 310 return (NULL); 311 } 312 313 /* 314 * Like fgets, but go through the list of files chaining them together. 315 * Set len to the length of the line. 316 */ 317 int 318 mf_fgets(SPACE *sp, enum e_spflag spflag) 319 { 320 struct stat sb, nsb; 321 ssize_t len; 322 static char *p = NULL; 323 static size_t plen = 0; 324 int c; 325 static int firstfile; 326 327 if (infile == NULL) { 328 /* stdin? */ 329 if (files->fname == NULL) { 330 if (inplace != NULL) 331 errx(1, 332 _("-I or -i may not be used with stdin")); 333 infile = stdin; 334 fname = "stdin"; 335 outfile = stdout; 336 outfname = "stdout"; 337 } 338 firstfile = 1; 339 } 340 341 for (;;) { 342 if (infile != NULL && (c = getc(infile)) != EOF) { 343 (void) ungetc(c, infile); 344 break; 345 } 346 /* If we are here then either eof or no files are open yet */ 347 if (infile == stdin) { 348 sp->len = 0; 349 return (0); 350 } 351 if (infile != NULL) { 352 (void) fclose(infile); 353 if (*oldfname != '\0') { 354 /* if there was a backup file, remove it */ 355 (void) unlink(oldfname); 356 /* 357 * Backup the original. Note that hard links 358 * are not supported on all filesystems. 359 */ 360 if ((link(fname, oldfname) != 0) && 361 (rename(fname, oldfname) != 0)) { 362 warn("rename()"); 363 if (*tmpfname) 364 (void) unlink(tmpfname); 365 exit(1); 366 } 367 *oldfname = '\0'; 368 } 369 if (*tmpfname != '\0') { 370 if (outfile != NULL && outfile != stdout) 371 if (fclose(outfile) != 0) { 372 warn("fclose()"); 373 (void) unlink(tmpfname); 374 exit(1); 375 } 376 outfile = NULL; 377 if (rename(tmpfname, fname) != 0) { 378 /* this should not happen really! */ 379 warn("rename()"); 380 (void) unlink(tmpfname); 381 exit(1); 382 } 383 *tmpfname = '\0'; 384 } 385 outfname = NULL; 386 } 387 if (firstfile == 0) 388 files = files->next; 389 else 390 firstfile = 0; 391 if (files == NULL) { 392 sp->len = 0; 393 return (0); 394 } 395 fname = files->fname; 396 if (inplace != NULL) { 397 char bn[PATH_MAX]; 398 char dn[PATH_MAX]; 399 (void) strlcpy(bn, fname, sizeof (bn)); 400 (void) strlcpy(dn, fname, sizeof (dn)); 401 if (lstat(fname, &sb) != 0) 402 err(1, "%s", fname); 403 if (!(sb.st_mode & S_IFREG)) 404 fatal(_("in-place editing only " 405 "works for regular files")); 406 if (*inplace != '\0') { 407 (void) strlcpy(oldfname, fname, 408 sizeof (oldfname)); 409 len = strlcat(oldfname, inplace, 410 sizeof (oldfname)); 411 if (len > sizeof (oldfname)) 412 fatal(_("name too long")); 413 } 414 len = snprintf(tmpfname, sizeof (tmpfname), 415 "%s/.!%ld!%s", dirname(dn), (long)getpid(), 416 basename(bn)); 417 if (len >= sizeof (tmpfname)) 418 fatal(_("name too long")); 419 (void) unlink(tmpfname); 420 if ((outfile = fopen(tmpfname, "w")) == NULL) 421 err(1, "%s", fname); 422 /* 423 * Some file systems don't support chown or 424 * chmod fully. On those, the owner/group and 425 * permissions will already be set to what 426 * they need to be. 427 */ 428 if (fstat(fileno(outfile), &nsb) != 0) { 429 warn("fstat()"); 430 } 431 if (((sb.st_uid != nsb.st_uid) || 432 (sb.st_gid != nsb.st_gid)) && 433 (fchown(fileno(outfile), sb.st_uid, sb.st_gid) 434 != 0)) 435 warn("fchown()"); 436 if ((sb.st_mode != nsb.st_mode) && 437 (fchmod(fileno(outfile), sb.st_mode & 07777) != 0)) 438 warn("fchmod()"); 439 outfname = tmpfname; 440 if (!ispan) { 441 linenum = 0; 442 resetstate(); 443 } 444 } else { 445 outfile = stdout; 446 outfname = "stdout"; 447 } 448 if ((infile = fopen(fname, "r")) == NULL) { 449 warn("%s", fname); 450 rval = 1; 451 continue; 452 } 453 } 454 /* 455 * We are here only when infile is open and we still have something 456 * to read from it. 457 * 458 * Use getline() so that we can handle essentially infinite 459 * input data. The p and plen are static so each invocation gives 460 * getline() the same buffer which is expanded as needed. 461 */ 462 len = getline(&p, &plen, infile); 463 if (len == -1) 464 err(1, "%s", fname); 465 if (len != 0 && p[len - 1] == '\n') 466 len--; 467 cspace(sp, p, len, spflag); 468 469 linenum++; 470 471 return (1); 472 } 473 474 /* 475 * Add a compilation unit to the linked list 476 */ 477 static void 478 add_compunit(enum e_cut type, char *s) 479 { 480 struct s_compunit *cu; 481 482 if ((cu = malloc(sizeof (struct s_compunit))) == NULL) 483 err(1, "malloc"); 484 cu->type = type; 485 cu->s = s; 486 cu->next = NULL; 487 *cu_nextp = cu; 488 cu_nextp = &cu->next; 489 } 490 491 /* 492 * Add a file to the linked list 493 */ 494 static void 495 add_file(char *s) 496 { 497 struct s_flist *fp; 498 499 if ((fp = malloc(sizeof (struct s_flist))) == NULL) 500 err(1, "malloc"); 501 fp->next = NULL; 502 *fl_nextp = fp; 503 fp->fname = s; 504 fl_nextp = &fp->next; 505 } 506 507 int 508 lastline(void) 509 { 510 int ch; 511 512 if (files->next != NULL && (inplace == NULL || ispan)) 513 return (0); 514 if ((ch = getc(infile)) == EOF) 515 return (1); 516 (void) ungetc(ch, infile); 517 return (0); 518 } 519