xref: /titanic_44/usr/src/tools/aw/aw.c (revision 6ed9368a130d7c9a82e574da808d34034da33748)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 
22 /*
23  * Copyright 2010 Sun Microsystems, Inc.  All rights reserved.
24  * Use is subject to license terms.
25  */
26 
27 /*
28  * Wrapper for the GNU assembler to make it accept the Sun assembler
29  * arguments where possible.
30  *
31  * There are several limitations; the Sun assembler takes multiple
32  * source files, we only take one.
33  *
34  * -b, -s, -xF, -T plain not supported.
35  * -S isn't supported either, because while GNU as does generate
36  * listings with -a, there's no obvious mapping between sub-options.
37  * -K pic, -K PIC not supported either, though it's not clear what
38  * these actually do ..
39  * -Qy (not supported) adds a string to the .comment section
40  * describing the assembler version, while
41  * -Qn (supported) suppresses the string (also the default).
42  *
43  * We also add '-#' support to see invocation lines..
44  * We also add '-xarch=amd64' in case we need to feed the assembler
45  * something different (or in case we need to invoke a different binary
46  * altogether!)
47  */
48 
49 #include <sys/types.h>
50 #include <sys/wait.h>
51 #include <stdio.h>
52 #include <unistd.h>
53 #include <string.h>
54 #include <stdlib.h>
55 #include <sys/param.h>
56 
/* Last path component of argv[0]; used as a prefix in diagnostics. */
static const char *progname = NULL;

/* Non-zero once '-#' has been seen: echo the commands that get run. */
static int verbose = 0;
59 
/*
 * One entry on an argument list.
 */
struct ae {
	struct ae *ae_next;	/* entry that follows this one, if any */
	char *ae_arg;		/* the argument string itself */
};

/*
 * A singly-linked list of arguments, kept in the order in which the
 * arguments were appended.
 */
struct aelist {
	int ael_argc;		/* number of entries on the list */
	struct ae *ael_head;	/* first entry */
	struct ae *ael_tail;	/* last entry, where new ones are added */
};
67 
68 static struct aelist *
69 newael(void)
70 {
71 	return (calloc(sizeof (struct aelist), 1));
72 }
73 
74 static void
75 newae(struct aelist *ael, const char *arg)
76 {
77 	struct ae *ae;
78 
79 	ae = calloc(sizeof (*ae), 1);
80 	ae->ae_arg = strdup(arg);
81 	if (ael->ael_tail == NULL)
82 		ael->ael_head = ae;
83 	else
84 		ael->ael_tail->ae_next = ae;
85 	ael->ael_tail = ae;
86 	ael->ael_argc++;
87 }
88 
89 static void
90 fixae_arg(struct ae *ae, const char *newarg)
91 {
92 	free(ae->ae_arg);
93 	ae->ae_arg = strdup(newarg);
94 }
95 
96 static char **
97 aeltoargv(struct aelist *ael)
98 {
99 	struct ae *ae;
100 	char **argv;
101 	int argc;
102 
103 	argv = calloc(sizeof (*argv), ael->ael_argc + 1);
104 
105 	for (argc = 0, ae = ael->ael_head; ae; ae = ae->ae_next, argc++) {
106 		argv[argc] = ae->ae_arg;
107 		if (ae == ael->ael_tail)
108 			break;
109 	}
110 
111 	return (argv);
112 }
113 
114 static int
115 error(const char *arg)
116 {
117 	(void) fprintf(stderr,
118 	    "%s: as->gas mapping failed at or near arg '%s'\n", progname, arg);
119 	return (2);
120 }
121 
122 static int
123 usage(const char *arg)
124 {
125 	if (arg != NULL)
126 		(void) fprintf(stderr, "error: %s\n", arg);
127 	(void) fprintf(stderr, "Usage: %s [-V] [-#]\n"
128 	    "\t[-xarch=architecture]\n"
129 	    "\t[-o objfile] [-L]\n"
130 	    "\t[-P [[-Ipath] [-Dname] [-Dname=def] [-Uname]]...]\n"
131 	    "\t[-m] [-n] file.s ...\n", progname);
132 	return (3);
133 }
134 
/*
 * Consume characters from 'in' up to and including the first 'termchar',
 * or up to end of input, whichever comes first.  Each character consumed
 * (the terminator included) is written to 'out'; pass a NULL 'out' to
 * discard them instead.  A failed write terminates the process with
 * exit status 1.
 */
static void
copyuntil(FILE *in, FILE *out, int termchar)
{
	for (;;) {
		int ch = fgetc(in);

		if (ch == EOF)
			return;
		if (out != NULL && fputc(ch, out) == EOF)
			exit(1);
		if (ch == termchar)
			return;
	}
}
147 
/*
 * Path-aware flavour of copyuntil(), used for the path that ends up in
 * a .file directive.
 *
 * gas records every .file directive as an STT_FILE symbol in the object
 * it produces.  If those symbols carry workspace paths, wsdiff sees the
 * objects as changed whenever the workspace location changes.  To avoid
 * such false positives the path is trimmed before it is written:
 *
 *   - if it begins with the workspace path 'wspace' (of length
 *     'wspace_len'), that prefix is dropped, and if what remains begins
 *     with the proto area's usr/include prefix, that is dropped too;
 *   - otherwise, if it begins with /usr/include/, that prefix is dropped.
 *
 * As with copyuntil(), input is consumed up to and including 'termchar'
 * (or to end of input), the terminator is part of what gets written, and
 * a NULL 'out' discards the result.  Allocation and write failures are
 * reported with perror() and terminate the process with exit status 1.
 */
static void
copyuntil_path(FILE *in, FILE *out, int termchar,
    const char *wspace, size_t wspace_len)
{
	static const char proto_inc[] = "/proto/root_i386/usr/include/";
	static const char sys_inc[] = "/usr/include/";
	const size_t proto_len = sizeof (proto_inc) - 1;
	const size_t sys_len = sizeof (sys_inc) - 1;

	/* Growable path buffer, kept across calls so it can be reused. */
	static char	*pathbuf = NULL;
	static size_t	pathcap = 0;

	const char	*start;
	size_t		len = 0;
	int		ch;

	/* Collect the path, terminator included. */
	for (;;) {
		if ((ch = fgetc(in)) == EOF)
			break;

		if (len >= pathcap) {
			/* First use, or full: (re)size the buffer. */
			pathcap = (pathcap == 0) ? MAXPATHLEN : (pathcap * 2);
			/* One byte beyond pathcap holds the final NUL. */
			pathbuf = realloc(pathbuf, pathcap + 1);
			if (pathbuf == NULL) {
				perror("realloc");
				exit(1);
			}
		}

		pathbuf[len++] = ch;
		if (ch == termchar)
			break;
	}

	/* Nothing was read, so there is nothing to trim or write. */
	if (len == 0)
		return;

	pathbuf[len] = '\0';
	start = pathbuf;

	/*
	 * A prefix is only removed when something would be left over
	 * afterwards, hence the strict length comparisons.
	 */
	if ((wspace_len > 0) && (wspace_len < len) &&
	    (strncmp(start, wspace, wspace_len) == 0)) {
		start += wspace_len;
		len -= wspace_len;

		/* Inside the workspace: also trim the proto include dir. */
		if ((proto_len < len) &&
		    (strncmp(start, proto_inc, proto_len) == 0)) {
			start += proto_len;
			len -= proto_len;
		}
	} else if ((sys_len < len) &&
	    (strncmp(start, sys_inc, sys_len) == 0)) {
		/* Not in the workspace: trim the system include dir. */
		start += sys_len;
		len -= sys_len;
	}

	/* Emit what survived the trimming. */
	if (out != NULL && fwrite(start, 1, len, out) != len) {
		perror("fwrite");
		exit(1);
	}
}
242 
243 /*
244  * The idea here is to take directives like this emitted
245  * by cpp:
246  *
247  *	# num
248  *
249  * and convert them to directives like this that are
250  * understood by the GNU assembler:
251  *
252  *	.line num
253  *
254  * and similarly:
255  *
256  *	# num "string" optional stuff
257  *
258  * is converted to
259  *
260  *	.line num
261  *	.file "string"
262  *
263  * While this could be done with a sequence of sed
264  * commands, this is simpler and faster..
265  */
266 static pid_t
267 filter(int pipein, int pipeout)
268 {
269 	pid_t pid;
270 	FILE *in, *out;
271 	char *wspace;
272 	size_t wspace_len;
273 
274 	if (verbose)
275 		(void) fprintf(stderr, "{#line filter} ");
276 
277 	switch (pid = fork()) {
278 	case 0:
279 		if (dup2(pipein, 0) == -1 ||
280 		    dup2(pipeout, 1) == -1) {
281 			perror("dup2");
282 			exit(1);
283 		}
284 		closefrom(3);
285 		break;
286 	case -1:
287 		perror("fork");
288 	default:
289 		return (pid);
290 	}
291 
292 	in = fdopen(0, "r");
293 	out = fdopen(1, "w");
294 
295 	/*
296 	 * Key off the CODEMGR_WS environment variable to detect
297 	 * if we're in an activated workspace, and to get the
298 	 * path to the workspace.
299 	 */
300 	wspace = getenv("CODEMGR_WS");
301 	if (wspace != NULL)
302 		wspace_len = strlen(wspace);
303 
304 	while (!feof(in)) {
305 		int c, num;
306 
307 		switch (c = fgetc(in)) {
308 		case '#':
309 			switch (fscanf(in, " %d", &num)) {
310 			case 0:
311 				/*
312 				 * discard comment lines completely
313 				 * discard ident strings completely too.
314 				 * (GNU as politely ignores them..)
315 				 */
316 				copyuntil(in, NULL, '\n');
317 				break;
318 			default:
319 				(void) fprintf(stderr, "fscanf botch?");
320 				/*FALLTHROUGH*/
321 			case EOF:
322 				exit(1);
323 				/*NOTREACHED*/
324 			case 1:
325 				/*
326 				 * This line has a number at the beginning;
327 				 * if it has a string after the number, then
328 				 * it's a filename.
329 				 *
330 				 * If this is an activated workspace, use
331 				 * copyuntil_path() to do path rewriting
332 				 * that will prevent workspace paths from
333 				 * being burned into the resulting object.
334 				 * If not in an activated workspace, then
335 				 * copy the existing path straight through
336 				 * without interpretation.
337 				 */
338 				if (fgetc(in) == ' ' && fgetc(in) == '"') {
339 					(void) fprintf(out, "\t.file \"");
340 					if (wspace != NULL)
341 						copyuntil_path(in, out, '"',
342 						    wspace, wspace_len);
343 					else
344 						copyuntil(in, out, '"');
345 					(void) fputc('\n', out);
346 				}
347 				(void) fprintf(out, "\t.line %d\n", num - 1);
348 				/*
349 				 * discard the rest of the line
350 				 */
351 				copyuntil(in, NULL, '\n');
352 				break;
353 			}
354 			break;
355 		case '\n':
356 			/*
357 			 * preserve newlines
358 			 */
359 			(void) fputc(c, out);
360 			break;
361 		case EOF:
362 			/*
363 			 * don't write EOF!
364 			 */
365 			break;
366 		default:
367 			/*
368 			 * lines that don't begin with '#' are copied
369 			 */
370 			(void) fputc(c, out);
371 			copyuntil(in, out, '\n');
372 			break;
373 		}
374 
375 		if (ferror(out))
376 			exit(1);
377 	}
378 
379 	exit(0);
380 	/*NOTREACHED*/
381 }
382 
383 static pid_t
384 invoke(char **argv, int pipein, int pipeout)
385 {
386 	pid_t pid;
387 
388 	if (verbose) {
389 		char **dargv = argv;
390 
391 		while (*dargv)
392 			(void) fprintf(stderr, "%s ", *dargv++);
393 	}
394 
395 	switch (pid = fork()) {
396 	case 0:
397 		if (pipein >= 0 && dup2(pipein, 0) == -1) {
398 			perror("dup2");
399 			exit(1);
400 		}
401 		if (pipeout >= 0 && dup2(pipeout, 1) == -1) {
402 			perror("dup2");
403 			exit(1);
404 		}
405 		closefrom(3);
406 		(void) execvp(argv[0], argv);
407 		perror("execvp");
408 		(void) fprintf(stderr, "%s: couldn't run %s\n",
409 		    progname, argv[0]);
410 		break;
411 	case -1:
412 		perror("fork");
413 	default:
414 		return (pid);
415 	}
416 	exit(2);
417 	/*NOTREACHED*/
418 }
419 
420 static int
421 pipeline(char **ppargv, char **asargv)
422 {
423 	int pipedes[4];
424 	int active = 0;
425 	int rval = 0;
426 	pid_t pid_pp, pid_f, pid_as;
427 
428 	if (pipe(pipedes) == -1 || pipe(pipedes + 2) == -1) {
429 		perror("pipe");
430 		return (4);
431 	}
432 
433 	if ((pid_pp = invoke(ppargv, -1, pipedes[0])) > 0)
434 		active++;
435 
436 	if (verbose)
437 		(void) fprintf(stderr, "| ");
438 
439 	if ((pid_f = filter(pipedes[1], pipedes[2])) > 0)
440 		active++;
441 
442 	if (verbose)
443 		(void) fprintf(stderr, "| ");
444 
445 	if ((pid_as = invoke(asargv, pipedes[3], -1)) > 0)
446 		active++;
447 
448 	if (verbose) {
449 		(void) fprintf(stderr, "\n");
450 		(void) fflush(stderr);
451 	}
452 
453 	closefrom(3);
454 
455 	if (active != 3)
456 		return (5);
457 
458 	while (active != 0) {
459 		pid_t pid;
460 		int stat;
461 
462 		if ((pid = wait(&stat)) == -1) {
463 			rval++;
464 			break;
465 		}
466 
467 		if (!WIFEXITED(stat))
468 			continue;
469 
470 		if (pid == pid_pp || pid == pid_f || pid == pid_as) {
471 			active--;
472 			if (WEXITSTATUS(stat) != 0)
473 				rval++;
474 		}
475 	}
476 
477 	return (rval);
478 }
479 
480 int
481 main(int argc, char *argv[])
482 {
483 	struct aelist *cpp = NULL;
484 	struct aelist *m4 = NULL;
485 	struct aelist *as = newael();
486 	char **asargv;
487 	char *outfile = NULL;
488 	char *srcfile = NULL;
489 	const char *dir, *cmd;
490 	static char as_pgm[MAXPATHLEN];
491 	static char as64_pgm[MAXPATHLEN];
492 	static char m4_pgm[MAXPATHLEN];
493 	static char m4_cmdefs[MAXPATHLEN];
494 	static char cpp_pgm[MAXPATHLEN];
495 	int as64 = 0;
496 	int code;
497 
498 	if ((progname = strrchr(argv[0], '/')) == NULL)
499 		progname = argv[0];
500 	else
501 		progname++;
502 
503 	/*
504 	 * Helpful when debugging, or when changing tool versions..
505 	 */
506 	if ((cmd = getenv("AW_AS")) != NULL)
507 		strlcpy(as_pgm, cmd, sizeof (as_pgm));
508 	else {
509 		if ((dir = getenv("AW_AS_DIR")) == NULL)
510 			dir = DEFAULT_AS_DIR;	/* /usr/sfw/bin */
511 		(void) snprintf(as_pgm, sizeof (as_pgm), "%s/gas", dir);
512 	}
513 
514 	if ((cmd = getenv("AW_AS64")) != NULL)
515 		strlcpy(as64_pgm, cmd, sizeof (as64_pgm));
516 	else {
517 		if ((dir = getenv("AW_AS64_DIR")) == NULL)
518 			dir = DEFAULT_AS64_DIR;	/* /usr/sfw/bin */
519 		(void) snprintf(as64_pgm, sizeof (as_pgm), "%s/gas", dir);
520 	}
521 
522 	if ((cmd = getenv("AW_M4")) != NULL)
523 		strlcpy(m4_pgm, cmd, sizeof (m4_pgm));
524 	else {
525 		if ((dir = getenv("AW_M4_DIR")) == NULL)
526 			dir = DEFAULT_M4_DIR;	/* /usr/ccs/bin */
527 		(void) snprintf(m4_pgm, sizeof (m4_pgm), "%s/m4", dir);
528 	}
529 
530 	if ((cmd = getenv("AW_M4LIB")) != NULL)
531 		strlcpy(m4_cmdefs, cmd, sizeof (m4_cmdefs));
532 	else {
533 		if ((dir = getenv("AW_M4LIB_DIR")) == NULL)
534 			dir = DEFAULT_M4LIB_DIR;	/* /usr/ccs/lib */
535 		(void) snprintf(m4_cmdefs, sizeof (m4_cmdefs),
536 		    "%s/cm4defs", dir);
537 	}
538 
539 	if ((cmd = getenv("AW_CPP")) != NULL)
540 		strlcpy(cpp_pgm, cmd, sizeof (cpp_pgm));
541 	else {
542 		if ((dir = getenv("AW_CPP_DIR")) == NULL)
543 			dir = DEFAULT_CPP_DIR;	/* /usr/ccs/lib */
544 		(void) snprintf(cpp_pgm, sizeof (cpp_pgm), "%s/cpp", dir);
545 	}
546 
547 	newae(as, as_pgm);
548 	newae(as, "--warn");
549 	newae(as, "--fatal-warnings");
550 	newae(as, "--traditional-format");
551 
552 	/*
553 	 * Walk the argument list, translating as we go ..
554 	 */
555 	while (--argc > 0) {
556 		char *arg;
557 		int arglen;
558 
559 		arg = *++argv;
560 		arglen = strlen(arg);
561 
562 		if (*arg != '-') {
563 			char *filename;
564 
565 			/*
566 			 * filenames ending in '.s' are taken to be
567 			 * assembler files, and provide the default
568 			 * basename of the output file.
569 			 *
570 			 * other files are passed through to the
571 			 * preprocessor, if present, or to gas if not.
572 			 */
573 			filename = arg;
574 			if (arglen > 2 &&
575 			    strcmp(arg + arglen - 2, ".s") == 0) {
576 				/*
577 				 * Though 'as' allows multiple assembler
578 				 * files to be processed in one invocation
579 				 * of the assembler, ON only processes one
580 				 * file at a time, which makes things a lot
581 				 * simpler!
582 				 */
583 				if (srcfile == NULL)
584 					srcfile = arg;
585 				else
586 					return (usage(
587 					    "one assembler file at a time"));
588 
589 				/*
590 				 * If we haven't seen a -o option yet,
591 				 * default the output to the basename
592 				 * of the input, substituting a .o on the end
593 				 */
594 				if (outfile == NULL) {
595 					char *argcopy;
596 
597 					argcopy = strdup(arg);
598 					argcopy[arglen - 1] = 'o';
599 
600 					if ((outfile = strrchr(
601 					    argcopy, '/')) == NULL)
602 						outfile = argcopy;
603 					else
604 						outfile++;
605 				}
606 			}
607 			if (cpp)
608 				newae(cpp, filename);
609 			else if (m4)
610 				newae(m4, filename);
611 			else
612 				newae(as, filename);
613 			continue;
614 		} else
615 			arglen--;
616 
617 		switch (arg[1]) {
618 		case 'K':
619 			/*
620 			 * -K pic
621 			 * -K PIC
622 			 */
623 			if (arglen == 1) {
624 				if ((arg = *++argv) == NULL || *arg == '\0')
625 					return (usage("malformed -K"));
626 				argc--;
627 			} else {
628 				arg += 2;
629 			}
630 			if (strcmp(arg, "PIC") != 0 && strcmp(arg, "pic") != 0)
631 				return (usage("malformed -K"));
632 			break;		/* just ignore -Kpic for gcc */
633 		case 'Q':
634 			if (strcmp(arg, "-Qn") == 0)
635 				break;
636 			/*FALLTHROUGH*/
637 		case 'b':
638 		case 's':
639 		case 'T':
640 			/*
641 			 * -b	Extra symbol table for source browser ..
642 			 *	not relevant to gas, thus should error.
643 			 * -s	Put stabs in .stabs section not stabs.excl
644 			 *	not clear if there's an equivalent
645 			 * -T	4.x migration option
646 			 */
647 		default:
648 			return (error(arg));
649 		case 'x':
650 			/*
651 			 * Accept -xarch special case to invoke alternate
652 			 * assemblers or assembler flags for different
653 			 * architectures.
654 			 */
655 			if (strcmp(arg, "-xarch=amd64") == 0 ||
656 			    strcmp(arg, "-xarch=generic64") == 0) {
657 				as64++;
658 				fixae_arg(as->ael_head, as64_pgm);
659 				break;
660 			}
661 			/*
662 			 * XX64: Is this useful to gas?
663 			 */
664 			if (strcmp(arg, "-xmodel=kernel") == 0)
665 				break;
666 
667 			/*
668 			 * -xF	Generates performance analysis data
669 			 *	no equivalent
670 			 */
671 			return (error(arg));
672 		case 'V':
673 			newae(as, arg);
674 			break;
675 		case '#':
676 			verbose++;
677 			break;
678 		case 'L':
679 			newae(as, "--keep-locals");
680 			break;
681 		case 'n':
682 			newae(as, "--no-warn");
683 			break;
684 		case 'o':
685 			if (arglen != 1)
686 				return (usage("bad -o flag"));
687 			if ((arg = *++argv) == NULL || *arg == '\0')
688 				return (usage("bad -o flag"));
689 			outfile = arg;
690 			argc--;
691 			arglen = strlen(arg + 1);
692 			break;
693 		case 'm':
694 			if (cpp)
695 				return (usage("-m conflicts with -P"));
696 			if (m4 == NULL) {
697 				m4 = newael();
698 				newae(m4, m4_pgm);
699 				newae(m4, m4_cmdefs);
700 			}
701 			break;
702 		case 'P':
703 			if (m4)
704 				return (usage("-P conflicts with -m"));
705 			if (cpp == NULL) {
706 				cpp = newael();
707 				newae(cpp, cpp_pgm);
708 				newae(cpp, "-D__GNUC_AS__");
709 			}
710 			break;
711 		case 'D':
712 		case 'U':
713 			if (cpp)
714 				newae(cpp, arg);
715 			else if (m4)
716 				newae(m4, arg);
717 			else
718 				newae(as, arg);
719 			break;
720 		case 'I':
721 			if (cpp)
722 				newae(cpp, arg);
723 			else
724 				newae(as, arg);
725 			break;
726 		case '-':	/* a gas-specific option */
727 			newae(as, arg);
728 			break;
729 		}
730 	}
731 
732 #if defined(__i386)
733 	if (as64)
734 		newae(as, "--64");
735 	else
736 		newae(as, "--32");
737 #endif
738 
739 	if (srcfile == NULL)
740 		return (usage("no source file(s) specified"));
741 	if (outfile == NULL)
742 		outfile = "a.out";
743 	newae(as, "-o");
744 	newae(as, outfile);
745 
746 	asargv = aeltoargv(as);
747 	if (cpp) {
748 #if defined(__sparc)
749 		newae(cpp, "-Dsparc");
750 		newae(cpp, "-D__sparc");
751 		if (as64)
752 			newae(cpp, "-D__sparcv9");
753 		else
754 			newae(cpp, "-D__sparcv8");
755 #elif defined(__i386) || defined(__x86)
756 		if (as64) {
757 			newae(cpp, "-D__x86_64");
758 			newae(cpp, "-D__amd64");
759 		} else {
760 			newae(cpp, "-Di386");
761 			newae(cpp, "-D__i386");
762 		}
763 #else
764 #error	"need isa-dependent defines"
765 #endif
766 		code = pipeline(aeltoargv(cpp), asargv);
767 	} else if (m4)
768 		code = pipeline(aeltoargv(m4), asargv);
769 	else {
770 		/*
771 		 * XXX	should arrange to fork/exec so that we
772 		 *	can unlink the output file if errors are
773 		 *	detected..
774 		 */
775 		(void) execvp(asargv[0], asargv);
776 		perror("execvp");
777 		(void) fprintf(stderr, "%s: couldn't run %s\n",
778 		    progname, asargv[0]);
779 		code = 7;
780 	}
781 	if (code != 0)
782 		(void) unlink(outfile);
783 	return (code);
784 }
785