1 /*
2 * Copyright (c) 2013 Johann 'Myrkraverk' Oskarsson <johann@myrkraverk.com>
3 * Copyright (c) 2011 Gary Mills
4 * Copyright 2011 Nexenta Systems, Inc. All rights reserved.
5 * Copyright (c) 1992 Diomidis Spinellis.
6 * Copyright (c) 1992, 1993
7 * The Regents of the University of California. All rights reserved.
8 *
9 * This code is derived from software contributed to Berkeley by
10 * Diomidis Spinellis of Imperial College, University of London.
11 *
12 * Redistribution and use in source and binary forms, with or without
13 * modification, are permitted provided that the following conditions
14 * are met:
15 * 1. Redistributions of source code must retain the above copyright
16 * notice, this list of conditions and the following disclaimer.
17 * 2. Redistributions in binary form must reproduce the above copyright
18 * notice, this list of conditions and the following disclaimer in the
19 * documentation and/or other materials provided with the distribution.
20 * 4. Neither the name of the University nor the names of its contributors
21 * may be used to endorse or promote products derived from this software
22 * without specific prior written permission.
23 *
24 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
25 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
26 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
27 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
28 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
29 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
30 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
31 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
32 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
33 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
34 * SUCH DAMAGE.
35 */
36
37 #include <sys/types.h>
38 #include <sys/mman.h>
39 #include <sys/param.h>
40 #include <sys/stat.h>
41
42 #include <err.h>
43 #include <errno.h>
44 #include <fcntl.h>
45 #include <getopt.h>
46 #include <libgen.h>
47 #include <libintl.h>
48 #include <limits.h>
49 #include <locale.h>
50 #include <regex.h>
51 #include <stddef.h>
52 #include <stdio.h>
53 #include <stdlib.h>
54 #include <string.h>
55 #include <unistd.h>
56
57 #include "defs.h"
58 #include "extern.h"
59
/*
 * Kind of compilation unit: the name of a script file, or script text
 * supplied directly as a string.
 */
enum e_cut {
	CU_FILE,
	CU_STRING
};

/*
 * One node in the singly linked list of units (strings and files) that
 * make up the script to be compiled.
 */
struct s_compunit {
	struct s_compunit *next;	/* Following unit, NULL at the tail */
	enum e_cut type;		/* How to interpret s */
	char *s;			/* Pointer to string or fname */
};

/*
 * Head of the compilation-unit list, and the address of the link through
 * which the next unit will be appended (initially the head itself).
 */
static struct s_compunit *script;
static struct s_compunit **cu_nextp = &script;
74
/*
 * One node in the singly linked list of input files to be processed.
 */
struct s_flist {
	char *fname;			/* File name */
	struct s_flist *next;		/* Following file, NULL at the tail */
};

/*
 * Head of the input-file list, and the address of the link through which
 * the next file will be appended (initially the head itself).
 */
static struct s_flist *files;
static struct s_flist **fl_nextp = &files;
88
89 FILE *infile; /* Current input file */
90 FILE *outfile; /* Current output file */
91
92 int aflag, eflag, nflag;
93 int rflags = 0;
94 static int rval; /* Exit status */
95
96 static int ispan; /* Whether inplace editing spans across files */
97
98 /*
99 * Current file and line number; line numbers restart across compilation
100 * units, but span across input files. The latter is optional if editing
101 * in place.
102 */
103 const char *fname; /* File name. */
104 const char *outfname; /* Output file name */
105 static char oldfname[PATH_MAX]; /* Old file name (for in-place editing) */
106 static char tmpfname[PATH_MAX]; /* Temporary file name (for in-place editing) */
107 static const char *inplace; /* Inplace edit file extension. */
108 ulong_t linenum;
109
/*
 * Long options handed to getopt_long(): --in-place takes an optional
 * argument and is reported as the short option 'i'.
 */
static const struct option lopts[] = {
	{ "in-place", optional_argument, NULL, 'i' },
	{ NULL, 0, NULL, 0 }
};
114
/* Helpers private to this file; defined after their first use. */
static void add_compunit(enum e_cut type, char *s);
static void add_file(char *s);
static void usage(void);
118
119
120 int
main(int argc,char * argv[])121 main(int argc, char *argv[])
122 {
123 int c, fflag;
124 char *temp_arg;
125
126 (void) setlocale(LC_ALL, "");
127
128 #ifndef TEXT_DOMAIN
129 #define TEXT_DOMAIN "SYS_TEST"
130 #endif
131 (void) textdomain(TEXT_DOMAIN);
132
133 fflag = 0;
134 inplace = NULL;
135
136 while ((c = getopt_long(argc, argv, "EI::ae:f:i::lnr", lopts, NULL)) !=
137 -1)
138 switch (c) {
139 case 'r': /* Gnu sed compat */
140 case 'E':
141 rflags = REG_EXTENDED;
142 break;
143 case 'I':
144 if (optarg != NULL)
145 inplace = optarg;
146 else
147 inplace = "";
148 ispan = 1; /* span across input files */
149 break;
150 case 'a':
151 aflag = 1;
152 break;
153 case 'e':
154 eflag = 1;
155 if (asprintf(&temp_arg, "%s\n", optarg) < 1)
156 err(1, "asprintf");
157 add_compunit(CU_STRING, temp_arg);
158 break;
159 case 'f':
160 fflag = 1;
161 add_compunit(CU_FILE, optarg);
162 break;
163 case 'i':
164 if (optarg != NULL)
165 inplace = optarg;
166 else
167 inplace = "";
168 ispan = 0; /* don't span across input files */
169 break;
170 case 'l':
171 /* On SunOS, setlinebuf "returns no useful value */
172 (void) setlinebuf(stdout);
173 break;
174 case 'n':
175 nflag = 1;
176 break;
177 default:
178 case '?':
179 usage();
180 }
181 argc -= optind;
182 argv += optind;
183
184 /* First usage case; script is the first arg */
185 if (!eflag && !fflag && *argv) {
186 add_compunit(CU_STRING, *argv);
187 argv++;
188 }
189
190 compile();
191
192 /* Continue with first and start second usage */
193 if (*argv)
194 for (; *argv; argv++)
195 add_file(*argv);
196 else
197 add_file(NULL);
198 process();
199 cfclose(prog, NULL);
200 if (fclose(stdout))
201 err(1, "stdout");
202 return (rval);
203 }
204
/*
 * Write the (translated) command synopsis to stderr and exit with
 * status 1.  Does not return.
 */
static void
usage(void)
{
	const char *synopsis;

	synopsis = _("usage: sed script [-Ealn] [-i[extension]] [file...]\n"
	    " sed [-Ealn] [-i[extension]] [-e script]... "
	    "[-f script_file]... [file...]\n");
	(void) fputs(synopsis, stderr);
	exit(1);
}
214
215 /*
216 * Like fgets, but go through the chain of compilation units chaining them
217 * together. Empty strings and files are ignored.
218 */
219 char *
cu_fgets(char * buf,int n,int * more)220 cu_fgets(char *buf, int n, int *more)
221 {
222 static enum {ST_EOF, ST_FILE, ST_STRING} state = ST_EOF;
223 static FILE *f; /* Current open file */
224 static char *s; /* Current pointer inside string */
225 static char string_ident[30];
226 char *p;
227
228 again:
229 switch (state) {
230 case ST_EOF:
231 if (script == NULL) {
232 if (more != NULL)
233 *more = 0;
234 return (NULL);
235 }
236 linenum = 0;
237 switch (script->type) {
238 case CU_FILE:
239 if ((f = fopen(script->s, "r")) == NULL)
240 err(1, "%s", script->s);
241 fname = script->s;
242 state = ST_FILE;
243 goto again;
244 case CU_STRING:
245 if (((size_t)snprintf(string_ident,
246 sizeof (string_ident), "\"%s\"", script->s)) >=
247 sizeof (string_ident) - 1)
248 (void) strcpy(string_ident +
249 sizeof (string_ident) - 6, " ...\"");
250 fname = string_ident;
251 s = script->s;
252 state = ST_STRING;
253 goto again;
254 }
255 /*NOTREACHED*/
256
257 case ST_FILE:
258 if ((p = fgets(buf, n, f)) != NULL) {
259 linenum++;
260 if (linenum == 1 && buf[0] == '#' && buf[1] == 'n')
261 nflag = 1;
262 if (more != NULL)
263 *more = !feof(f);
264 return (p);
265 }
266 script = script->next;
267 (void) fclose(f);
268 state = ST_EOF;
269 goto again;
270 case ST_STRING:
271 if (linenum == 0 && s[0] == '#' && s[1] == 'n')
272 nflag = 1;
273 p = buf;
274 for (;;) {
275 if (n-- <= 1) {
276 *p = '\0';
277 linenum++;
278 if (more != NULL)
279 *more = 1;
280 return (buf);
281 }
282 switch (*s) {
283 case '\0':
284 state = ST_EOF;
285 if (s == script->s) {
286 script = script->next;
287 goto again;
288 } else {
289 script = script->next;
290 *p = '\0';
291 linenum++;
292 if (more != NULL)
293 *more = 0;
294 return (buf);
295 }
296 case '\n':
297 *p++ = '\n';
298 *p = '\0';
299 s++;
300 linenum++;
301 if (more != NULL)
302 *more = 0;
303 return (buf);
304 default:
305 *p++ = *s++;
306 }
307 }
308 }
309 /* NOTREACHED */
310 return (NULL);
311 }
312
313 /*
314 * Like fgets, but go through the list of files chaining them together.
315 * Set len to the length of the line.
316 */
317 int
mf_fgets(SPACE * sp,enum e_spflag spflag)318 mf_fgets(SPACE *sp, enum e_spflag spflag)
319 {
320 struct stat sb, nsb;
321 ssize_t len;
322 static char *p = NULL;
323 static size_t plen = 0;
324 int c;
325 static int firstfile;
326
327 if (infile == NULL) {
328 /* stdin? */
329 if (files->fname == NULL) {
330 if (inplace != NULL)
331 errx(1,
332 _("-I or -i may not be used with stdin"));
333 infile = stdin;
334 fname = "stdin";
335 outfile = stdout;
336 outfname = "stdout";
337 }
338 firstfile = 1;
339 }
340
341 for (;;) {
342 if (infile != NULL && (c = getc(infile)) != EOF) {
343 (void) ungetc(c, infile);
344 break;
345 }
346 /* If we are here then either eof or no files are open yet */
347 if (infile == stdin) {
348 sp->len = 0;
349 return (0);
350 }
351 if (infile != NULL) {
352 (void) fclose(infile);
353 if (*oldfname != '\0') {
354 /* if there was a backup file, remove it */
355 (void) unlink(oldfname);
356 /*
357 * Backup the original. Note that hard links
358 * are not supported on all filesystems.
359 */
360 if ((link(fname, oldfname) != 0) &&
361 (rename(fname, oldfname) != 0)) {
362 warn("rename()");
363 if (*tmpfname)
364 (void) unlink(tmpfname);
365 exit(1);
366 }
367 *oldfname = '\0';
368 }
369 if (*tmpfname != '\0') {
370 if (outfile != NULL && outfile != stdout)
371 if (fclose(outfile) != 0) {
372 warn("fclose()");
373 (void) unlink(tmpfname);
374 exit(1);
375 }
376 outfile = NULL;
377 if (rename(tmpfname, fname) != 0) {
378 /* this should not happen really! */
379 warn("rename()");
380 (void) unlink(tmpfname);
381 exit(1);
382 }
383 *tmpfname = '\0';
384 }
385 outfname = NULL;
386 }
387 if (firstfile == 0)
388 files = files->next;
389 else
390 firstfile = 0;
391 if (files == NULL) {
392 sp->len = 0;
393 return (0);
394 }
395 fname = files->fname;
396 if (inplace != NULL) {
397 char bn[PATH_MAX];
398 char dn[PATH_MAX];
399 (void) strlcpy(bn, fname, sizeof (bn));
400 (void) strlcpy(dn, fname, sizeof (dn));
401 if (lstat(fname, &sb) != 0)
402 err(1, "%s", fname);
403 if (!(sb.st_mode & S_IFREG))
404 fatal(_("in-place editing only "
405 "works for regular files"));
406 if (*inplace != '\0') {
407 (void) strlcpy(oldfname, fname,
408 sizeof (oldfname));
409 len = strlcat(oldfname, inplace,
410 sizeof (oldfname));
411 if (len > sizeof (oldfname))
412 fatal(_("name too long"));
413 }
414 len = snprintf(tmpfname, sizeof (tmpfname),
415 "%s/.!%ld!%s", dirname(dn), (long)getpid(),
416 basename(bn));
417 if (len >= sizeof (tmpfname))
418 fatal(_("name too long"));
419 (void) unlink(tmpfname);
420 if ((outfile = fopen(tmpfname, "w")) == NULL)
421 err(1, "%s", fname);
422 /*
423 * Some file systems don't support chown or
424 * chmod fully. On those, the owner/group and
425 * permissions will already be set to what
426 * they need to be.
427 */
428 if (fstat(fileno(outfile), &nsb) != 0) {
429 warn("fstat()");
430 }
431 if (((sb.st_uid != nsb.st_uid) ||
432 (sb.st_gid != nsb.st_gid)) &&
433 (fchown(fileno(outfile), sb.st_uid, sb.st_gid)
434 != 0))
435 warn("fchown()");
436 if ((sb.st_mode != nsb.st_mode) &&
437 (fchmod(fileno(outfile), sb.st_mode & 07777) != 0))
438 warn("fchmod()");
439 outfname = tmpfname;
440 if (!ispan) {
441 linenum = 0;
442 resetstate();
443 }
444 } else {
445 outfile = stdout;
446 outfname = "stdout";
447 }
448 if ((infile = fopen(fname, "r")) == NULL) {
449 warn("%s", fname);
450 rval = 1;
451 continue;
452 }
453 }
454 /*
455 * We are here only when infile is open and we still have something
456 * to read from it.
457 *
458 * Use getline() so that we can handle essentially infinite
459 * input data. The p and plen are static so each invocation gives
460 * getline() the same buffer which is expanded as needed.
461 */
462 len = getline(&p, &plen, infile);
463 if (len == -1)
464 err(1, "%s", fname);
465 if (len != 0 && p[len - 1] == '\n')
466 len--;
467 cspace(sp, p, len, spflag);
468
469 linenum++;
470
471 return (1);
472 }
473
474 /*
475 * Add a compilation unit to the linked list
476 */
477 static void
add_compunit(enum e_cut type,char * s)478 add_compunit(enum e_cut type, char *s)
479 {
480 struct s_compunit *cu;
481
482 if ((cu = malloc(sizeof (struct s_compunit))) == NULL)
483 err(1, "malloc");
484 cu->type = type;
485 cu->s = s;
486 cu->next = NULL;
487 *cu_nextp = cu;
488 cu_nextp = &cu->next;
489 }
490
491 /*
492 * Add a file to the linked list
493 */
494 static void
add_file(char * s)495 add_file(char *s)
496 {
497 struct s_flist *fp;
498
499 if ((fp = malloc(sizeof (struct s_flist))) == NULL)
500 err(1, "malloc");
501 fp->next = NULL;
502 *fl_nextp = fp;
503 fp->fname = s;
504 fl_nextp = &fp->next;
505 }
506
507 int
lastline(void)508 lastline(void)
509 {
510 int ch;
511
512 if (files->next != NULL && (inplace == NULL || ispan))
513 return (0);
514 if ((ch = getc(infile)) == EOF)
515 return (1);
516 (void) ungetc(ch, infile);
517 return (0);
518 }
519