xref: /illumos-gate/usr/src/cmd/sgs/libld/common/syms.c (revision 12042ab213b3af68474f48555504db816a449211)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 
22 /*
23  *	Copyright (c) 1988 AT&T
24  *	  All Rights Reserved
25  *
26  *
27  * Copyright (c) 1989, 2010, Oracle and/or its affiliates. All rights reserved.
28  */
29 
30 /*
31  * Symbol table management routines
32  */
33 
34 #define	ELF_TARGET_AMD64
35 
36 #include	<stdio.h>
37 #include	<string.h>
38 #include	<debug.h>
39 #include	"msg.h"
40 #include	"_libld.h"
41 
42 /*
43  * AVL tree comparator function:
44  *
45  * The primary key is the symbol name hash with a secondary key of the symbol
46  * name itself.
47  */
48 int
49 ld_sym_avl_comp(const void *elem1, const void *elem2)
50 {
51 	Sym_avlnode	*sav1 = (Sym_avlnode *)elem1;
52 	Sym_avlnode	*sav2 = (Sym_avlnode *)elem2;
53 	int		res;
54 
55 	res = sav1->sav_hash - sav2->sav_hash;
56 
57 	if (res < 0)
58 		return (-1);
59 	if (res > 0)
60 		return (1);
61 
62 	/*
63 	 * Hash is equal - now compare name
64 	 */
65 	res = strcmp(sav1->sav_name, sav2->sav_name);
66 	if (res == 0)
67 		return (0);
68 	if (res > 0)
69 		return (1);
70 	return (-1);
71 }
72 
73 /*
74  * Focal point for verifying symbol names.
75  */
76 inline static const char *
77 string(Ofl_desc *ofl, Ifl_desc *ifl, Sym *sym, const char *strs, size_t strsize,
78     int symndx, Word shndx, Word symsecndx, const char *symsecname,
79     const char *strsecname, sd_flag_t *flags)
80 {
81 	Word	name = sym->st_name;
82 
83 	if (name) {
84 		if ((ifl->ifl_flags & FLG_IF_HSTRTAB) == 0) {
85 			ld_eprintf(ofl, ERR_FATAL, MSG_INTL(MSG_FIL_NOSTRTABLE),
86 			    ifl->ifl_name, EC_WORD(symsecndx), symsecname,
87 			    symndx, EC_XWORD(name));
88 			return (NULL);
89 		}
90 		if (name >= (Word)strsize) {
91 			ld_eprintf(ofl, ERR_FATAL,
92 			    MSG_INTL(MSG_FIL_EXCSTRTABLE), ifl->ifl_name,
93 			    EC_WORD(symsecndx), symsecname, symndx,
94 			    EC_XWORD(name), strsecname, EC_XWORD(strsize));
95 			return (NULL);
96 		}
97 	}
98 
99 	/*
100 	 * Determine if we're dealing with a register and if so validate it.
101 	 * If it's a scratch register, a fabricated name will be returned.
102 	 */
103 	if (ld_targ.t_ms.ms_is_regsym != NULL) {
104 		const char *regname = (*ld_targ.t_ms.ms_is_regsym)(ofl, ifl,
105 		    sym, strs, symndx, shndx, symsecname, flags);
106 
107 		if (regname == (const char *)S_ERROR) {
108 			return (NULL);
109 		}
110 		if (regname)
111 			return (regname);
112 	}
113 
114 	/*
115 	 * If this isn't a register, but we have a global symbol with a null
116 	 * name, we're not going to be able to hash this, search for it, or
117 	 * do anything interesting.  However, we've been accepting a symbol of
118 	 * this kind for ages now, so give the user a warning (rather than a
119 	 * fatal error), just in case this instance exists somewhere in the
120 	 * world and hasn't, as yet, been a problem.
121 	 */
122 	if ((name == 0) && (ELF_ST_BIND(sym->st_info) != STB_LOCAL)) {
123 		ld_eprintf(ofl, ERR_WARNING, MSG_INTL(MSG_FIL_NONAMESYM),
124 		    ifl->ifl_name, EC_WORD(symsecndx), symsecname, symndx,
125 		    EC_XWORD(name));
126 	}
127 	return (strs + name);
128 }
129 
130 /*
131  * For producing symbol names strings to use in error messages.
132  * If the symbol has a non-null name, then the string returned by
133  * this function is the output from demangle(), surrounded by
134  * single quotes. For null names, a descriptive string giving
135  * the symbol section and index is generated.
136  *
137  * This function uses an internal static buffer to hold the resulting
138  * string. The value returned is usable by the caller until the next
139  * call, at which point it is overwritten.
140  */
141 static const char *
142 demangle_symname(const char *name, const char *symtab_name, Word symndx)
143 {
144 #define	INIT_BUFSIZE 256
145 
146 	static char	*buf;
147 	static size_t	bufsize = 0;
148 	size_t		len;
149 	int		use_name;
150 
151 	use_name = (name != NULL) && (*name != '\0');
152 
153 	if (use_name) {
154 		name = demangle(name);
155 		len = strlen(name) + 2;   /* Include room for quotes */
156 	} else {
157 		name = MSG_ORIG(MSG_STR_EMPTY);
158 		len = strlen(symtab_name) + 2 + CONV_INV_BUFSIZE;
159 	}
160 	len++;			/* Null termination */
161 
162 	/* If our buffer is too small, double it until it is big enough */
163 	if (len > bufsize) {
164 		size_t	new_bufsize = bufsize;
165 		char	*new_buf;
166 
167 		if (new_bufsize == 0)
168 			new_bufsize = INIT_BUFSIZE;
169 		while (len > new_bufsize)
170 			new_bufsize *= 2;
171 		if ((new_buf = libld_malloc(new_bufsize)) == NULL)
172 			return (name);
173 		buf = new_buf;
174 		bufsize = new_bufsize;
175 	}
176 
177 	if (use_name) {
178 		(void) snprintf(buf, bufsize, MSG_ORIG(MSG_FMT_SYMNAM), name);
179 	} else {
180 		(void) snprintf(buf, bufsize, MSG_ORIG(MSG_FMT_NULLSYMNAM),
181 		    symtab_name, EC_WORD(symndx));
182 	}
183 
184 	return (buf);
185 
186 #undef INIT_BUFSIZE
187 }
188 
189 /*
190  * Shared objects can be built that define specific symbols that can not be
191  * directly bound to.  These objects have a syminfo section (and an associated
192  * DF_1_NODIRECT dynamic flags entry).  Scan this table looking for symbols
193  * that can't be bound to directly, and if this files symbol is presently
194  * referenced, mark it so that we don't directly bind to it.
195  */
196 uintptr_t
197 ld_sym_nodirect(Is_desc *isp, Ifl_desc *ifl, Ofl_desc *ofl)
198 {
199 	Shdr		*sifshdr, *symshdr;
200 	Syminfo		*sifdata;
201 	Sym		*symdata;
202 	char		*strdata;
203 	ulong_t		cnt, _cnt;
204 
205 	/*
206 	 * Get the syminfo data, and determine the number of entries.
207 	 */
208 	sifshdr = isp->is_shdr;
209 	sifdata = (Syminfo *)isp->is_indata->d_buf;
210 	cnt =  sifshdr->sh_size / sifshdr->sh_entsize;
211 
212 	/*
213 	 * Get the associated symbol table.
214 	 */
215 	if ((sifshdr->sh_link == 0) || (sifshdr->sh_link >= ifl->ifl_shnum)) {
216 		/*
217 		 * Broken input file
218 		 */
219 		ld_eprintf(ofl, ERR_FATAL, MSG_INTL(MSG_FIL_INVSHINFO),
220 		    ifl->ifl_name, isp->is_name, EC_XWORD(sifshdr->sh_link));
221 		return (0);
222 	}
223 	symshdr = ifl->ifl_isdesc[sifshdr->sh_link]->is_shdr;
224 	symdata = ifl->ifl_isdesc[sifshdr->sh_link]->is_indata->d_buf;
225 
226 	/*
227 	 * Get the string table associated with the symbol table.
228 	 */
229 	strdata = ifl->ifl_isdesc[symshdr->sh_link]->is_indata->d_buf;
230 
231 	/*
232 	 * Traverse the syminfo data for symbols that can't be directly
233 	 * bound to.
234 	 */
235 	for (_cnt = 1, sifdata++; _cnt < cnt; _cnt++, sifdata++) {
236 		Sym		*sym;
237 		char		*str;
238 		Sym_desc	*sdp;
239 
240 		if ((sifdata->si_flags & SYMINFO_FLG_NOEXTDIRECT) == 0)
241 			continue;
242 
243 		sym = (Sym *)(symdata + _cnt);
244 		str = (char *)(strdata + sym->st_name);
245 
246 		if ((sdp = ld_sym_find(str, SYM_NOHASH, NULL, ofl)) != NULL) {
247 			if (ifl != sdp->sd_file)
248 				continue;
249 
250 			sdp->sd_flags &= ~FLG_SY_DIR;
251 			sdp->sd_flags |= FLG_SY_NDIR;
252 		}
253 	}
254 	return (0);
255 }
256 
257 /*
258  * If, during symbol processing, it is necessary to update a local symbols
259  * contents before we have generated the symbol tables in the output image,
260  * create a new symbol structure and copy the original symbol contents.  While
261  * we are processing the input files, their local symbols are part of the
262  * read-only mapped image.  Commonly, these symbols are copied to the new output
263  * file image and then updated to reflect their new address and any change in
264  * attributes.  However, sometimes during relocation counting, it is necessary
265  * to adjust the symbols information.  This routine provides for the generation
266  * of a new symbol image so that this update can be performed.
267  * All global symbols are copied to an internal symbol table to improve locality
268  * of reference and hence performance, and thus this copying is not necessary.
269  */
270 uintptr_t
271 ld_sym_copy(Sym_desc *sdp)
272 {
273 	Sym	*nsym;
274 
275 	if (sdp->sd_flags & FLG_SY_CLEAN) {
276 		if ((nsym = libld_malloc(sizeof (Sym))) == NULL)
277 			return (S_ERROR);
278 		*nsym = *(sdp->sd_sym);
279 		sdp->sd_sym = nsym;
280 		sdp->sd_flags &= ~FLG_SY_CLEAN;
281 	}
282 	return (1);
283 }
284 
285 /*
286  * Finds a given name in the link editors internal symbol table.  If no
287  * hash value is specified it is calculated.  A pointer to the located
288  * Sym_desc entry is returned, or NULL if the symbol is not found.
289  */
290 Sym_desc *
291 ld_sym_find(const char *name, Word hash, avl_index_t *where, Ofl_desc *ofl)
292 {
293 	Sym_avlnode	qsav, *sav;
294 
295 	if (hash == SYM_NOHASH)
296 		/* LINTED */
297 		hash = (Word)elf_hash((const char *)name);
298 	qsav.sav_hash = hash;
299 	qsav.sav_name = name;
300 
301 	/*
302 	 * Perform search for symbol in AVL tree.  Note that the 'where' field
303 	 * is passed in from the caller.  If a 'where' is present, it can be
304 	 * used in subsequent 'ld_sym_enter()' calls if required.
305 	 */
306 	sav = avl_find(&ofl->ofl_symavl, &qsav, where);
307 
308 	/*
309 	 * If symbol was not found in the avl tree, return null to show that.
310 	 */
311 	if (sav == NULL)
312 		return (NULL);
313 
314 	/*
315 	 * Return symbol found.
316 	 */
317 	return (sav->sav_sdp);
318 }
319 
320 /*
321  * Enter a new symbol into the link editors internal symbol table.
322  * If the symbol is from an input file, information regarding the input file
323  * and input section is also recorded.  Otherwise (file == NULL) the symbol
324  * has been internally generated (ie. _etext, _edata, etc.).
325  */
326 Sym_desc *
327 ld_sym_enter(const char *name, Sym *osym, Word hash, Ifl_desc *ifl,
328     Ofl_desc *ofl, Word ndx, Word shndx, sd_flag_t sdflags, avl_index_t *where)
329 {
330 	Sym_desc	*sdp;
331 	Sym_aux		*sap;
332 	Sym_avlnode	*savl;
333 	char		*_name;
334 	Sym		*nsym;
335 	Half		etype;
336 	uchar_t		vis;
337 	avl_index_t	_where;
338 
339 	/*
340 	 * Establish the file type.
341 	 */
342 	if (ifl)
343 		etype = ifl->ifl_ehdr->e_type;
344 	else
345 		etype = ET_NONE;
346 
347 	ofl->ofl_entercnt++;
348 
349 	/*
350 	 * Allocate a Sym Descriptor, Auxiliary Descriptor, and a Sym AVLNode -
351 	 * contiguously.
352 	 */
353 	if ((savl = libld_calloc(S_DROUND(sizeof (Sym_avlnode)) +
354 	    S_DROUND(sizeof (Sym_desc)) +
355 	    S_DROUND(sizeof (Sym_aux)), 1)) == NULL)
356 		return ((Sym_desc *)S_ERROR);
357 	sdp = (Sym_desc *)((uintptr_t)savl +
358 	    S_DROUND(sizeof (Sym_avlnode)));
359 	sap = (Sym_aux *)((uintptr_t)sdp +
360 	    S_DROUND(sizeof (Sym_desc)));
361 
362 	savl->sav_sdp = sdp;
363 	sdp->sd_file = ifl;
364 	sdp->sd_aux = sap;
365 	savl->sav_hash = sap->sa_hash = hash;
366 
367 	/*
368 	 * Copy the symbol table entry from the input file into the internal
369 	 * entry and have the symbol descriptor use it.
370 	 */
371 	sdp->sd_sym = nsym = &sap->sa_sym;
372 	*nsym = *osym;
373 	sdp->sd_shndx = shndx;
374 	sdp->sd_flags |= sdflags;
375 
376 	if ((_name = libld_malloc(strlen(name) + 1)) == NULL)
377 		return ((Sym_desc *)S_ERROR);
378 	savl->sav_name = sdp->sd_name = (const char *)strcpy(_name, name);
379 
380 	/*
381 	 * Enter Symbol in AVL tree.
382 	 */
383 	if (where == 0) {
384 		/* LINTED */
385 		Sym_avlnode	*_savl;
386 		/*
387 		 * If a previous ld_sym_find() hasn't initialized 'where' do it
388 		 * now.
389 		 */
390 		where = &_where;
391 		_savl = avl_find(&ofl->ofl_symavl, savl, where);
392 		assert(_savl == NULL);
393 	}
394 	avl_insert(&ofl->ofl_symavl, savl, *where);
395 
396 	/*
397 	 * Record the section index.  This is possible because the
398 	 * `ifl_isdesc' table is filled before we start symbol processing.
399 	 */
400 	if ((sdflags & FLG_SY_SPECSEC) || (nsym->st_shndx == SHN_UNDEF))
401 		sdp->sd_isc = NULL;
402 	else {
403 		sdp->sd_isc = ifl->ifl_isdesc[shndx];
404 
405 		/*
406 		 * If this symbol is from a relocatable object, make sure that
407 		 * it is still associated with a section.  For example, an
408 		 * unknown section type (SHT_NULL) would have been rejected on
409 		 * input with a warning.  Here, we make the use of the symbol
410 		 * fatal.  A symbol descriptor is still returned, so that the
411 		 * caller can continue processing all symbols, and hence flush
412 		 * out as many error conditions as possible.
413 		 */
414 		if ((etype == ET_REL) && (sdp->sd_isc == NULL)) {
415 			ld_eprintf(ofl, ERR_FATAL, MSG_INTL(MSG_SYM_INVSEC),
416 			    name, ifl->ifl_name, EC_XWORD(shndx));
417 			return (sdp);
418 		}
419 	}
420 
421 	/*
422 	 * Mark any COMMON symbols as 'tentative'.
423 	 */
424 	if (sdflags & FLG_SY_SPECSEC) {
425 		if (nsym->st_shndx == SHN_COMMON)
426 			sdp->sd_flags |= FLG_SY_TENTSYM;
427 #if	defined(_ELF64)
428 		else if ((ld_targ.t_m.m_mach == EM_AMD64) &&
429 		    (nsym->st_shndx == SHN_X86_64_LCOMMON))
430 			sdp->sd_flags |= FLG_SY_TENTSYM;
431 #endif
432 	}
433 
434 	/*
435 	 * Establish the symbols visibility and reference.
436 	 */
437 	vis = ELF_ST_VISIBILITY(nsym->st_other);
438 
439 	if ((etype == ET_NONE) || (etype == ET_REL)) {
440 		switch (vis) {
441 		case STV_DEFAULT:
442 			sdp->sd_flags |= FLG_SY_DEFAULT;
443 			break;
444 		case STV_INTERNAL:
445 		case STV_HIDDEN:
446 			sdp->sd_flags |= FLG_SY_HIDDEN;
447 			break;
448 		case STV_PROTECTED:
449 			sdp->sd_flags |= FLG_SY_PROTECT;
450 			break;
451 		case STV_EXPORTED:
452 			sdp->sd_flags |= FLG_SY_EXPORT;
453 			break;
454 		case STV_SINGLETON:
455 			sdp->sd_flags |= (FLG_SY_SINGLE | FLG_SY_NDIR);
456 			ofl->ofl_flags1 |= (FLG_OF1_NDIRECT | FLG_OF1_NGLBDIR);
457 			break;
458 		case STV_ELIMINATE:
459 			sdp->sd_flags |= (FLG_SY_HIDDEN | FLG_SY_ELIM);
460 			break;
461 		default:
462 			assert(vis <= STV_ELIMINATE);
463 		}
464 
465 		sdp->sd_ref = REF_REL_NEED;
466 
467 		/*
468 		 * Under -Bnodirect, all exported interfaces that have not
469 		 * explicitly been defined protected or directly bound to, are
470 		 * tagged to prevent direct binding.
471 		 */
472 		if ((ofl->ofl_flags1 & FLG_OF1_ALNODIR) &&
473 		    ((sdp->sd_flags & (FLG_SY_PROTECT | FLG_SY_DIR)) == 0) &&
474 		    (nsym->st_shndx != SHN_UNDEF)) {
475 			sdp->sd_flags |= FLG_SY_NDIR;
476 		}
477 	} else {
478 		sdp->sd_ref = REF_DYN_SEEN;
479 
480 		/*
481 		 * If this is a protected symbol, remember this.  Note, this
482 		 * state is different from the FLG_SY_PROTECT used to establish
483 		 * a symbol definitions visibility.  This state is used to warn
484 		 * against possible copy relocations against this referenced
485 		 * symbol.
486 		 */
487 		if (vis == STV_PROTECTED)
488 			sdp->sd_flags |= FLG_SY_PROT;
489 
490 		/*
491 		 * If this is a SINGLETON definition, then indicate the symbol
492 		 * can not be directly bound to, and retain the visibility.
493 		 * This visibility will be inherited by any references made to
494 		 * this symbol.
495 		 */
496 		if ((vis == STV_SINGLETON) && (nsym->st_shndx != SHN_UNDEF))
497 			sdp->sd_flags |= (FLG_SY_SINGLE | FLG_SY_NDIR);
498 
499 		/*
500 		 * If the new symbol is from a shared library and is associated
501 		 * with a SHT_NOBITS section then this symbol originated from a
502 		 * tentative symbol.
503 		 */
504 		if (sdp->sd_isc &&
505 		    (sdp->sd_isc->is_shdr->sh_type == SHT_NOBITS))
506 			sdp->sd_flags |= FLG_SY_TENTSYM;
507 	}
508 
509 	/*
510 	 * Reclassify any SHN_SUNW_IGNORE symbols to SHN_UNDEF so as to
511 	 * simplify future processing.
512 	 */
513 	if (nsym->st_shndx == SHN_SUNW_IGNORE) {
514 		sdp->sd_shndx = shndx = SHN_UNDEF;
515 		sdp->sd_flags |= (FLG_SY_REDUCED |
516 		    FLG_SY_HIDDEN | FLG_SY_IGNORE | FLG_SY_ELIM);
517 	}
518 
519 	/*
520 	 * If this is an undefined, or common symbol from a relocatable object
521 	 * determine whether it is a global or weak reference (see build_osym(),
522 	 * where REF_DYN_NEED definitions are returned back to undefines).
523 	 */
524 	if ((etype == ET_REL) &&
525 	    (ELF_ST_BIND(nsym->st_info) == STB_GLOBAL) &&
526 	    ((nsym->st_shndx == SHN_UNDEF) || ((sdflags & FLG_SY_SPECSEC) &&
527 #if	defined(_ELF64)
528 	    ((nsym->st_shndx == SHN_COMMON) ||
529 	    ((ld_targ.t_m.m_mach == EM_AMD64) &&
530 	    (nsym->st_shndx == SHN_X86_64_LCOMMON))))))
531 #else
532 	/* BEGIN CSTYLED */
533 	    (nsym->st_shndx == SHN_COMMON))))
534 	/* END CSTYLED */
535 #endif
536 		sdp->sd_flags |= FLG_SY_GLOBREF;
537 
538 	/*
539 	 * Record the input filename on the referenced or defined files list
540 	 * for possible later diagnostics.  The `sa_rfile' pointer contains the
541 	 * name of the file that first referenced this symbol and is used to
542 	 * generate undefined symbol diagnostics (refer to sym_undef_entry()).
543 	 * Note that this entry can be overridden if a reference from a
544 	 * relocatable object is found after a reference from a shared object
545 	 * (refer to sym_override()).
546 	 * The `sa_dfiles' list is used to maintain the list of files that
547 	 * define the same symbol.  This list can be used for two reasons:
548 	 *
549 	 *  -	To save the first definition of a symbol that is not available
550 	 *	for this link-edit.
551 	 *
552 	 *  -	To save all definitions of a symbol when the -m option is in
553 	 *	effect.  This is optional as it is used to list multiple
554 	 *	(interposed) definitions of a symbol (refer to ldmap_out()),
555 	 *	and can be quite expensive.
556 	 */
557 	if (nsym->st_shndx == SHN_UNDEF) {
558 		sap->sa_rfile = ifl->ifl_name;
559 	} else {
560 		if (sdp->sd_ref == REF_DYN_SEEN) {
561 			/*
562 			 * A symbol is determined to be unavailable if it
563 			 * belongs to a version of a shared object that this
564 			 * user does not wish to use, or if it belongs to an
565 			 * implicit shared object.
566 			 */
567 			if (ifl->ifl_vercnt) {
568 				Ver_index	*vip;
569 				Half		vndx = ifl->ifl_versym[ndx];
570 
571 				sap->sa_dverndx = vndx;
572 				vip = &ifl->ifl_verndx[vndx];
573 				if (!(vip->vi_flags & FLG_VER_AVAIL)) {
574 					sdp->sd_flags |= FLG_SY_NOTAVAIL;
575 					sap->sa_vfile = ifl->ifl_name;
576 				}
577 			}
578 			if (!(ifl->ifl_flags & FLG_IF_NEEDED))
579 				sdp->sd_flags |= FLG_SY_NOTAVAIL;
580 
581 		} else if (etype == ET_REL) {
582 			/*
583 			 * If this symbol has been obtained from a versioned
584 			 * input relocatable object then the new symbol must be
585 			 * promoted to the versioning of the output file.
586 			 */
587 			if (ifl->ifl_versym)
588 				ld_vers_promote(sdp, ndx, ifl, ofl);
589 		}
590 
591 		if ((ofl->ofl_flags & FLG_OF_GENMAP) &&
592 		    ((sdflags & FLG_SY_SPECSEC) == 0))
593 			if (aplist_append(&sap->sa_dfiles, ifl->ifl_name,
594 			    AL_CNT_SDP_DFILES) == NULL)
595 				return ((Sym_desc *)S_ERROR);
596 	}
597 
598 	/*
599 	 * Provided we're not processing a mapfile, diagnose the entered symbol.
600 	 * Mapfile processing requires the symbol to be updated with additional
601 	 * information, therefore the diagnosing of the symbol is deferred until
602 	 * later (see Dbg_map_symbol()).
603 	 */
604 	if ((ifl == NULL) || ((ifl->ifl_flags & FLG_IF_MAPFILE) == 0))
605 		DBG_CALL(Dbg_syms_entered(ofl, nsym, sdp));
606 
607 	return (sdp);
608 }
609 
610 /*
611  * Add a special symbol to the symbol table.  Takes special symbol name with
612  * and without underscores.  This routine is called, after all other symbol
613  * resolution has completed, to generate a reserved absolute symbol (the
614  * underscore version).  Special symbols are updated with the appropriate
615  * values in update_osym().  If the user has already defined this symbol
616  * issue a warning and leave the symbol as is.  If the non-underscore symbol
617  * is referenced then turn it into a weak alias of the underscored symbol.
618  *
619  * The bits in sdflags_u are OR'd into the flags field of the symbol for the
620  * underscored symbol.
621  *
622  * If this is a global symbol, and it hasn't explicitly been defined as being
623  * directly bound to, indicate that it can't be directly bound to.
624  * Historically, most special symbols only have meaning to the object in which
625  * they exist, however, they've always been global.  To ensure compatibility
626  * with any unexpected use presently in effect, ensure these symbols don't get
627  * directly bound to.  Note, that establishing this state here isn't sufficient
628  * to create a syminfo table, only if a syminfo table is being created by some
629  * other symbol directives will the nodirect binding be recorded.  This ensures
630  * we don't create syminfo sections for all objects we create, as this might add
631  * unnecessary bloat to users who haven't explicitly requested extra symbol
632  * information.
633  */
634 static uintptr_t
635 sym_add_spec(const char *name, const char *uname, Word sdaux_id,
636     sd_flag_t sdflags_u, sd_flag_t sdflags, Ofl_desc *ofl)
637 {
638 	Sym_desc	*sdp;
639 	Sym_desc	*usdp;
640 	Sym		*sym;
641 	Word		hash;
642 	avl_index_t	where;
643 
644 	/* LINTED */
645 	hash = (Word)elf_hash(uname);
646 	if (usdp = ld_sym_find(uname, hash, &where, ofl)) {
647 		/*
648 		 * If the underscore symbol exists and is undefined, or was
649 		 * defined in a shared library, convert it to a local symbol.
650 		 * Otherwise leave it as is and warn the user.
651 		 */
652 		if ((usdp->sd_shndx == SHN_UNDEF) ||
653 		    (usdp->sd_ref != REF_REL_NEED)) {
654 			usdp->sd_ref = REF_REL_NEED;
655 			usdp->sd_shndx = usdp->sd_sym->st_shndx = SHN_ABS;
656 			usdp->sd_flags |= FLG_SY_SPECSEC | sdflags_u;
657 			usdp->sd_sym->st_info =
658 			    ELF_ST_INFO(STB_GLOBAL, STT_OBJECT);
659 			usdp->sd_isc = NULL;
660 			usdp->sd_sym->st_size = 0;
661 			usdp->sd_sym->st_value = 0;
662 			/* LINTED */
663 			usdp->sd_aux->sa_symspec = (Half)sdaux_id;
664 
665 			/*
666 			 * If a user hasn't specifically indicated that the
667 			 * scope of this symbol be made local, then leave it
668 			 * as global (ie. prevent automatic scoping).  The GOT
669 			 * should be defined protected, whereas all other
670 			 * special symbols are tagged as no-direct.
671 			 */
672 			if (!SYM_IS_HIDDEN(usdp) &&
673 			    (sdflags & FLG_SY_DEFAULT)) {
674 				usdp->sd_aux->sa_overndx = VER_NDX_GLOBAL;
675 				if (sdaux_id == SDAUX_ID_GOT) {
676 					usdp->sd_flags &= ~FLG_SY_NDIR;
677 					usdp->sd_flags |= FLG_SY_PROTECT;
678 					usdp->sd_sym->st_other = STV_PROTECTED;
679 				} else if (
680 				    ((usdp->sd_flags & FLG_SY_DIR) == 0) &&
681 				    ((ofl->ofl_flags & FLG_OF_SYMBOLIC) == 0)) {
682 					usdp->sd_flags |= FLG_SY_NDIR;
683 				}
684 			}
685 			usdp->sd_flags |= sdflags;
686 
687 			/*
688 			 * If the reference originated from a mapfile ensure
689 			 * we mark the symbol as used.
690 			 */
691 			if (usdp->sd_flags & FLG_SY_MAPREF)
692 				usdp->sd_flags |= FLG_SY_MAPUSED;
693 
694 			DBG_CALL(Dbg_syms_updated(ofl, usdp, uname));
695 		} else {
696 			ld_eprintf(ofl, ERR_WARNING, MSG_INTL(MSG_SYM_RESERVE),
697 			    uname, usdp->sd_file->ifl_name);
698 		}
699 	} else {
700 		/*
701 		 * If the symbol does not exist create it.
702 		 */
703 		if ((sym = libld_calloc(sizeof (Sym), 1)) == NULL)
704 			return (S_ERROR);
705 		sym->st_shndx = SHN_ABS;
706 		sym->st_info = ELF_ST_INFO(STB_GLOBAL, STT_OBJECT);
707 		sym->st_size = 0;
708 		sym->st_value = 0;
709 		DBG_CALL(Dbg_syms_created(ofl->ofl_lml, uname));
710 		if ((usdp = ld_sym_enter(uname, sym, hash, (Ifl_desc *)NULL,
711 		    ofl, 0, SHN_ABS, (FLG_SY_SPECSEC | sdflags_u), &where)) ==
712 		    (Sym_desc *)S_ERROR)
713 			return (S_ERROR);
714 		usdp->sd_ref = REF_REL_NEED;
715 		/* LINTED */
716 		usdp->sd_aux->sa_symspec = (Half)sdaux_id;
717 
718 		usdp->sd_aux->sa_overndx = VER_NDX_GLOBAL;
719 
720 		if (sdaux_id == SDAUX_ID_GOT) {
721 			usdp->sd_flags |= FLG_SY_PROTECT;
722 			usdp->sd_sym->st_other = STV_PROTECTED;
723 		} else if ((sdflags & FLG_SY_DEFAULT) &&
724 		    ((ofl->ofl_flags & FLG_OF_SYMBOLIC) == 0)) {
725 			usdp->sd_flags |= FLG_SY_NDIR;
726 		}
727 		usdp->sd_flags |= sdflags;
728 	}
729 
730 	if (name && (sdp = ld_sym_find(name, SYM_NOHASH, NULL, ofl)) &&
731 	    (sdp->sd_sym->st_shndx == SHN_UNDEF)) {
732 		uchar_t	bind;
733 
734 		/*
735 		 * If the non-underscore symbol exists and is undefined
736 		 * convert it to be a local.  If the underscore has
737 		 * sa_symspec set (ie. it was created above) then simulate this
738 		 * as a weak alias.
739 		 */
740 		sdp->sd_ref = REF_REL_NEED;
741 		sdp->sd_shndx = sdp->sd_sym->st_shndx = SHN_ABS;
742 		sdp->sd_flags |= FLG_SY_SPECSEC;
743 		sdp->sd_isc = NULL;
744 		sdp->sd_sym->st_size = 0;
745 		sdp->sd_sym->st_value = 0;
746 		/* LINTED */
747 		sdp->sd_aux->sa_symspec = (Half)sdaux_id;
748 		if (usdp->sd_aux->sa_symspec) {
749 			usdp->sd_aux->sa_linkndx = 0;
750 			sdp->sd_aux->sa_linkndx = 0;
751 			bind = STB_WEAK;
752 		} else
753 			bind = STB_GLOBAL;
754 		sdp->sd_sym->st_info = ELF_ST_INFO(bind, STT_OBJECT);
755 
756 		/*
757 		 * If a user hasn't specifically indicated the scope of this
758 		 * symbol be made local then leave it as global (ie. prevent
759 		 * automatic scoping).  The GOT should be defined protected,
760 		 * whereas all other special symbols are tagged as no-direct.
761 		 */
762 		if (!SYM_IS_HIDDEN(sdp) &&
763 		    (sdflags & FLG_SY_DEFAULT)) {
764 			sdp->sd_aux->sa_overndx = VER_NDX_GLOBAL;
765 			if (sdaux_id == SDAUX_ID_GOT) {
766 				sdp->sd_flags &= ~FLG_SY_NDIR;
767 				sdp->sd_flags |= FLG_SY_PROTECT;
768 				sdp->sd_sym->st_other = STV_PROTECTED;
769 			} else if (((sdp->sd_flags & FLG_SY_DIR) == 0) &&
770 			    ((ofl->ofl_flags & FLG_OF_SYMBOLIC) == 0)) {
771 				sdp->sd_flags |= FLG_SY_NDIR;
772 			}
773 		}
774 		sdp->sd_flags |= sdflags;
775 
776 		/*
777 		 * If the reference originated from a mapfile ensure
778 		 * we mark the symbol as used.
779 		 */
780 		if (sdp->sd_flags & FLG_SY_MAPREF)
781 			sdp->sd_flags |= FLG_SY_MAPUSED;
782 
783 		DBG_CALL(Dbg_syms_updated(ofl, sdp, name));
784 	}
785 	return (1);
786 }
787 
788 
789 /*
790  * Undefined symbols can fall into one of four types:
791  *
792  *  -	the symbol is really undefined (SHN_UNDEF).
793  *
794  *  -	versioning has been enabled, however this symbol has not been assigned
795  *	to one of the defined versions.
796  *
797  *  -	the symbol has been defined by an implicitly supplied library, ie. one
798  *	which was encounted because it was NEEDED by another library, rather
799  *	than from a command line supplied library which would become the only
800  *	dependency of the output file being produced.
801  *
802  *  -	the symbol has been defined by a version of a shared object that is
803  *	not permitted for this link-edit.
804  *
805  * In all cases the file who made the first reference to this symbol will have
806  * been recorded via the `sa_rfile' pointer.
807  */
808 typedef enum {
809 	UNDEF,		NOVERSION,	IMPLICIT,	NOTAVAIL,
810 	BNDLOCAL
811 } Type;
812 
813 static const Msg format[] = {
814 	MSG_SYM_UND_UNDEF,		/* MSG_INTL(MSG_SYM_UND_UNDEF) */
815 	MSG_SYM_UND_NOVER,		/* MSG_INTL(MSG_SYM_UND_NOVER) */
816 	MSG_SYM_UND_IMPL,		/* MSG_INTL(MSG_SYM_UND_IMPL) */
817 	MSG_SYM_UND_NOTA,		/* MSG_INTL(MSG_SYM_UND_NOTA) */
818 	MSG_SYM_UND_BNDLOCAL		/* MSG_INTL(MSG_SYM_UND_BNDLOCAL) */
819 };
820 
821 /*
822  * Issue an undefined symbol message for the given symbol.
823  *
824  * entry:
825  *	ofl - Output descriptor
826  *	sdp - Undefined symbol to report
827  *	type - Type of undefined symbol
828  *	ofl_flag - One of 0, FLG_OF_FATAL, or FLG_OF_WARN.
829  *	undef_state - Address of variable to be initialized to 0
830  *		before the first call to sym_undef_entry, and passed
831  *		to each subsequent call. A non-zero value for *undef_state
832  *		indicates that this is not the first call in the series.
833  *
834  * exit:
835  *	If *undef_state is 0, a title is issued.
836  *
837  *	A message for the undefined symbol is issued.
838  *
839  *	If ofl_flag is non-zero, its value is OR'd into *undef_state. Otherwise,
840  *	all bits other than FLG_OF_FATAL and FLG_OF_WARN are set, in order to
841  *	provide *undef_state with a non-zero value. These other bits have
842  *	no meaning beyond that, and serve to ensure that *undef_state is
843  *	non-zero if sym_undef_entry() has been called.
844  */
845 static void
846 sym_undef_entry(Ofl_desc *ofl, Sym_desc *sdp, Type type, ofl_flag_t ofl_flag,
847     ofl_flag_t *undef_state)
848 {
849 	const char	*name1, *name2, *name3;
850 	Ifl_desc	*ifl = sdp->sd_file;
851 	Sym_aux		*sap = sdp->sd_aux;
852 
853 	if (*undef_state == 0)
854 		ld_eprintf(ofl, ERR_NONE, MSG_INTL(MSG_SYM_FMT_UNDEF),
855 		    MSG_INTL(MSG_SYM_UNDEF_ITM_11),
856 		    MSG_INTL(MSG_SYM_UNDEF_ITM_21),
857 		    MSG_INTL(MSG_SYM_UNDEF_ITM_12),
858 		    MSG_INTL(MSG_SYM_UNDEF_ITM_22));
859 
860 	ofl->ofl_flags |= ofl_flag;
861 	*undef_state |= ofl_flag ? ofl_flag : ~(FLG_OF_FATAL | FLG_OF_WARN);
862 
863 	switch (type) {
864 	case UNDEF:
865 	case BNDLOCAL:
866 		name1 = sap->sa_rfile;
867 		break;
868 	case NOVERSION:
869 		name1 = ifl->ifl_name;
870 		break;
871 	case IMPLICIT:
872 		name1 = sap->sa_rfile;
873 		name2 = ifl->ifl_name;
874 		break;
875 	case NOTAVAIL:
876 		name1 = sap->sa_rfile;
877 		name2 = sap->sa_vfile;
878 		name3 = ifl->ifl_verndx[sap->sa_dverndx].vi_name;
879 		break;
880 	default:
881 		return;
882 	}
883 
884 	ld_eprintf(ofl, ERR_NONE, MSG_INTL(format[type]),
885 	    demangle(sdp->sd_name), name1, name2, name3);
886 }
887 
888 /*
889  * If an undef symbol exists naming a bound for the output section,
890  * turn it into a defined symbol with the correct value.
891  *
892  * We set an arbitrary 1KB limit on the resulting symbol names.
893  */
894 static void
895 sym_add_bounds(Ofl_desc *ofl, Os_desc *osp, Word bound)
896 {
897 	Sym_desc *bsdp;
898 	char symn[1024];
899 	size_t nsz;
900 
901 	switch (bound) {
902 	case SDAUX_ID_SECBOUND_START:
903 		nsz = snprintf(symn, sizeof (symn), "%s%s",
904 		    MSG_ORIG(MSG_SYM_SECBOUND_START), osp->os_name);
905 		if (nsz >= sizeof (symn))
906 			return;
907 		break;
908 	case SDAUX_ID_SECBOUND_STOP:
909 		nsz = snprintf(symn, sizeof (symn), "%s%s",
910 		    MSG_ORIG(MSG_SYM_SECBOUND_STOP), osp->os_name);
911 		if (nsz >= sizeof (symn))
912 			return;
913 		break;
914 	default:
915 		assert(0);
916 	}
917 
918 	if ((bsdp = ld_sym_find(symn, SYM_NOHASH, NULL, ofl)) != NULL) {
919 		if ((bsdp->sd_shndx != SHN_UNDEF) &&
920 		    (bsdp->sd_ref == REF_REL_NEED)) {
921 			ld_eprintf(ofl, ERR_WARNING, MSG_INTL(MSG_SYM_RESERVE),
922 			    symn, bsdp->sd_file->ifl_name);
923 			return;
924 		}
925 
926 		DBG_CALL(Dbg_syms_updated(ofl, bsdp, symn));
927 
928 		bsdp->sd_aux->sa_symspec = bound;
929 		bsdp->sd_aux->sa_boundsec = osp;
930 		bsdp->sd_flags |= FLG_SY_SPECSEC;
931 		bsdp->sd_ref = REF_REL_NEED;
932 		bsdp->sd_sym->st_info = ELF_ST_INFO(STB_GLOBAL, STT_NOTYPE);
933 		bsdp->sd_sym->st_other = STV_PROTECTED;
934 		bsdp->sd_isc = NULL;
935 		bsdp->sd_sym->st_size = 0;
936 		bsdp->sd_sym->st_value = 0;
937 		bsdp->sd_shndx = bsdp->sd_sym->st_shndx = SHN_ABS;
938 	}
939 }
940 
941 static Boolean
942 is_cname(const char *name)
943 {
944 	if (strlen(name) == strspn(name,
945 	    "abcdefghijklmnopqrstuvwxyz"
946 	    "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
947 	    "0123456789"
948 	    "_"))
949 		return (TRUE);
950 	else
951 		return (FALSE);
952 }
953 
954 /*
955  * At this point all symbol input processing has been completed, therefore
956  * complete the symbol table entries by generating any necessary internal
957  * symbols.
958  */
959 uintptr_t
960 ld_sym_spec(Ofl_desc *ofl)
961 {
962 	Sym_desc	*sdp;
963 	Sg_desc		*sgp;
964 
965 	DBG_CALL(Dbg_syms_spec_title(ofl->ofl_lml));
966 
967 	/*
968 	 * For each section in the output file, look for symbols named for the
969 	 * __start/__stop patterns.  If references exist, flesh the symbols to
970 	 * be defined.
971 	 *
972 	 * The symbols are given values at the same time as the other special
973 	 * symbols.
974 	 */
975 	if (!(ofl->ofl_flags & FLG_OF_RELOBJ) ||
976 	    (ofl->ofl_flags & FLG_OF_KMOD)) {
977 		Aliste		idx1;
978 
979 		for (APLIST_TRAVERSE(ofl->ofl_segs, idx1, sgp)) {
980 			Os_desc *osp;
981 			Aliste idx2;
982 
983 			for (APLIST_TRAVERSE(sgp->sg_osdescs, idx2, osp)) {
984 				if (is_cname(osp->os_name)) {
985 					sym_add_bounds(ofl, osp,
986 					    SDAUX_ID_SECBOUND_START);
987 					sym_add_bounds(ofl, osp,
988 					    SDAUX_ID_SECBOUND_STOP);
989 				}
990 			}
991 		}
992 	}
993 
994 	if (ofl->ofl_flags & FLG_OF_RELOBJ)
995 		return (1);
996 
997 	if (sym_add_spec(MSG_ORIG(MSG_SYM_ETEXT), MSG_ORIG(MSG_SYM_ETEXT_U),
998 	    SDAUX_ID_ETEXT, 0, (FLG_SY_DEFAULT | FLG_SY_EXPDEF),
999 	    ofl) == S_ERROR)
1000 		return (S_ERROR);
1001 	if (sym_add_spec(MSG_ORIG(MSG_SYM_EDATA), MSG_ORIG(MSG_SYM_EDATA_U),
1002 	    SDAUX_ID_EDATA, 0, (FLG_SY_DEFAULT | FLG_SY_EXPDEF),
1003 	    ofl) == S_ERROR)
1004 		return (S_ERROR);
1005 	if (sym_add_spec(MSG_ORIG(MSG_SYM_END), MSG_ORIG(MSG_SYM_END_U),
1006 	    SDAUX_ID_END, FLG_SY_DYNSORT, (FLG_SY_DEFAULT | FLG_SY_EXPDEF),
1007 	    ofl) == S_ERROR)
1008 		return (S_ERROR);
1009 	if (sym_add_spec(MSG_ORIG(MSG_SYM_L_END), MSG_ORIG(MSG_SYM_L_END_U),
1010 	    SDAUX_ID_END, 0, FLG_SY_HIDDEN, ofl) == S_ERROR)
1011 		return (S_ERROR);
1012 	if (sym_add_spec(MSG_ORIG(MSG_SYM_L_START), MSG_ORIG(MSG_SYM_L_START_U),
1013 	    SDAUX_ID_START, 0, FLG_SY_HIDDEN, ofl) == S_ERROR)
1014 		return (S_ERROR);
1015 
1016 	/*
1017 	 * Historically we've always produced a _DYNAMIC symbol, even for
1018 	 * static executables (in which case its value will be 0).
1019 	 */
1020 	if (sym_add_spec(MSG_ORIG(MSG_SYM_DYNAMIC), MSG_ORIG(MSG_SYM_DYNAMIC_U),
1021 	    SDAUX_ID_DYN, FLG_SY_DYNSORT, (FLG_SY_DEFAULT | FLG_SY_EXPDEF),
1022 	    ofl) == S_ERROR)
1023 		return (S_ERROR);
1024 
1025 	if (OFL_ALLOW_DYNSYM(ofl))
1026 		if (sym_add_spec(MSG_ORIG(MSG_SYM_PLKTBL),
1027 		    MSG_ORIG(MSG_SYM_PLKTBL_U), SDAUX_ID_PLT,
1028 		    FLG_SY_DYNSORT, (FLG_SY_DEFAULT | FLG_SY_EXPDEF),
1029 		    ofl) == S_ERROR)
1030 			return (S_ERROR);
1031 
1032 	/*
1033 	 * A GOT reference will be accompanied by the associated GOT symbol.
1034 	 * Make sure it gets assigned the appropriate special attributes.
1035 	 */
1036 	if (((sdp = ld_sym_find(MSG_ORIG(MSG_SYM_GOFTBL_U),
1037 	    SYM_NOHASH, NULL, ofl)) != NULL) && (sdp->sd_ref != REF_DYN_SEEN)) {
1038 		if (sym_add_spec(MSG_ORIG(MSG_SYM_GOFTBL),
1039 		    MSG_ORIG(MSG_SYM_GOFTBL_U), SDAUX_ID_GOT, FLG_SY_DYNSORT,
1040 		    (FLG_SY_DEFAULT | FLG_SY_EXPDEF), ofl) == S_ERROR)
1041 			return (S_ERROR);
1042 	}
1043 
1044 	return (1);
1045 }
1046 
1047 /*
1048  * Determine a potential capability symbol's visibility.
1049  *
1050  * The -z symbolcap option transforms an object capabilities relocatable object
1051  * into a symbol capabilities relocatable object.  Any global function symbols,
1052  * or initialized global data symbols are candidates for transforming into local
1053  * symbol capabilities definitions.  However, if a user indicates that a symbol
1054  * should be demoted to local using a mapfile, then there is no need to
1055  * transform the associated global symbol.
1056  *
1057  * Normally, a symbol's visibility is determined after the symbol resolution
1058  * process, after all symbol state has been gathered and resolved.  However,
1059  * for -z symbolcap, this determination is too late.  When a global symbol is
1060  * read from an input file we need to determine it's visibility so as to decide
1061  * whether to create a local or not.
1062  *
1063  * If a user has explicitly defined this symbol as having local scope within a
1064  * mapfile, then a symbol of the same name already exists.  However, explicit
1065  * local definitions are uncommon, as most mapfiles define the global symbol
1066  * requirements together with an auto-reduction directive '*'.  If this state
1067  * has been defined, then we must make sure that the new symbol isn't a type
1068  * that can not be demoted to local.
1069  */
1070 static int
1071 sym_cap_vis(const char *name, Word hash, Sym *sym, Ofl_desc *ofl)
1072 {
1073 	Sym_desc	*sdp;
1074 	uchar_t		vis;
1075 	avl_index_t	where;
1076 	sd_flag_t	sdflags = 0;
1077 
1078 	/*
1079 	 * Determine the visibility of the new symbol.
1080 	 */
1081 	vis = ELF_ST_VISIBILITY(sym->st_other);
1082 	switch (vis) {
1083 	case STV_EXPORTED:
1084 		sdflags |= FLG_SY_EXPORT;
1085 		break;
1086 	case STV_SINGLETON:
1087 		sdflags |= FLG_SY_SINGLE;
1088 		break;
1089 	case STV_HIDDEN:
1090 		sdflags |= FLG_SY_HIDDEN;
1091 		break;
1092 	}
1093 
1094 	/*
1095 	 * Determine whether a symbol definition already exists, and if so
1096 	 * obtain the visibility.
1097 	 */
1098 	if ((sdp = ld_sym_find(name, hash, &where, ofl)) != NULL)
1099 		sdflags |= sdp->sd_flags;
1100 
1101 	/*
1102 	 * Determine whether the symbol flags indicate this symbol should be
1103 	 * hidden.
1104 	 */
1105 	if ((ofl->ofl_flags & (FLG_OF_AUTOLCL | FLG_OF_AUTOELM)) &&
1106 	    ((sdflags & MSK_SY_NOAUTO) == 0))
1107 		sdflags |= FLG_SY_HIDDEN;
1108 
1109 	return ((sdflags & FLG_SY_HIDDEN) == 0);
1110 }
1111 
1112 /*
1113  * This routine checks to see if a symbols visibility needs to be reduced to
1114  * either SYMBOLIC or LOCAL.  This routine can be called from either
1115  * reloc_init() or sym_validate().
1116  */
1117 void
1118 ld_sym_adjust_vis(Sym_desc *sdp, Ofl_desc *ofl)
1119 {
1120 	ofl_flag_t	oflags = ofl->ofl_flags;
1121 	Sym		*sym = sdp->sd_sym;
1122 
1123 	if ((sdp->sd_ref == REF_REL_NEED) &&
1124 	    (sdp->sd_sym->st_shndx != SHN_UNDEF)) {
1125 		/*
1126 		 * If auto-reduction/elimination is enabled, reduce any
1127 		 * non-versioned, and non-local capabilities global symbols.
1128 		 * A symbol is a candidate for auto-reduction/elimination if:
1129 		 *
1130 		 *  -	the symbol wasn't explicitly defined within a mapfile
1131 		 *	(in which case all the necessary state has been applied
1132 		 *	to the symbol), or
1133 		 *  -	the symbol isn't one of the family of reserved
1134 		 *	special symbols (ie. _end, _etext, etc.), or
1135 		 *  -	the symbol isn't a SINGLETON, or
1136 		 *  -	the symbol wasn't explicitly defined within a version
1137 		 *	definition associated with an input relocatable object.
1138 		 *
1139 		 * Indicate that the symbol has been reduced as it may be
1140 		 * necessary to print these symbols later.
1141 		 */
1142 		if ((oflags & (FLG_OF_AUTOLCL | FLG_OF_AUTOELM)) &&
1143 		    ((sdp->sd_flags & MSK_SY_NOAUTO) == 0)) {
1144 			if ((sdp->sd_flags & FLG_SY_HIDDEN) == 0) {
1145 				sdp->sd_flags |=
1146 				    (FLG_SY_REDUCED | FLG_SY_HIDDEN);
1147 			}
1148 
1149 			if (oflags & (FLG_OF_REDLSYM | FLG_OF_AUTOELM)) {
1150 				sdp->sd_flags |= FLG_SY_ELIM;
1151 				sym->st_other = STV_ELIMINATE |
1152 				    (sym->st_other & ~MSK_SYM_VISIBILITY);
1153 			} else if (ELF_ST_VISIBILITY(sym->st_other) !=
1154 			    STV_INTERNAL)
1155 				sym->st_other = STV_HIDDEN |
1156 				    (sym->st_other & ~MSK_SYM_VISIBILITY);
1157 		}
1158 
1159 		/*
1160 		 * If -Bsymbolic is in effect, and the symbol hasn't explicitly
1161 		 * been defined nodirect (via a mapfile), then bind the global
1162 		 * symbol symbolically and assign the STV_PROTECTED visibility
1163 		 * attribute.
1164 		 */
1165 		if ((oflags & FLG_OF_SYMBOLIC) &&
1166 		    ((sdp->sd_flags & (FLG_SY_HIDDEN | FLG_SY_NDIR)) == 0)) {
1167 			sdp->sd_flags |= FLG_SY_PROTECT;
1168 			if (ELF_ST_VISIBILITY(sym->st_other) == STV_DEFAULT)
1169 				sym->st_other = STV_PROTECTED |
1170 				    (sym->st_other & ~MSK_SYM_VISIBILITY);
1171 		}
1172 	}
1173 
1174 	/*
1175 	 * Indicate that this symbol has had it's visibility checked so that
1176 	 * we don't need to do this investigation again.
1177 	 */
1178 	sdp->sd_flags |= FLG_SY_VISIBLE;
1179 }
1180 
1181 /*
1182  * Make sure a symbol definition is local to the object being built.
1183  */
1184 inline static int
1185 ensure_sym_local(Ofl_desc *ofl, Sym_desc *sdp, const char *str)
1186 {
1187 	if (sdp->sd_sym->st_shndx == SHN_UNDEF) {
1188 		if (str) {
1189 			ld_eprintf(ofl, ERR_FATAL, MSG_INTL(MSG_SYM_UNDEF),
1190 			    str, demangle((char *)sdp->sd_name));
1191 		}
1192 		return (1);
1193 	}
1194 	if (sdp->sd_ref != REF_REL_NEED) {
1195 		if (str) {
1196 			ld_eprintf(ofl, ERR_FATAL, MSG_INTL(MSG_SYM_EXTERN),
1197 			    str, demangle((char *)sdp->sd_name),
1198 			    sdp->sd_file->ifl_name);
1199 		}
1200 		return (1);
1201 	}
1202 
1203 	sdp->sd_flags |= FLG_SY_UPREQD;
1204 	if (sdp->sd_isc) {
1205 		sdp->sd_isc->is_flags |= FLG_IS_SECTREF;
1206 		sdp->sd_isc->is_file->ifl_flags |= FLG_IF_FILEREF;
1207 	}
1208 	return (0);
1209 }
1210 
1211 /*
1212  * Make sure all the symbol definitions required for initarray, finiarray, or
1213  * preinitarray's are local to the object being built.
1214  */
1215 static int
1216 ensure_array_local(Ofl_desc *ofl, APlist *apl, const char *str)
1217 {
1218 	Aliste		idx;
1219 	Sym_desc	*sdp;
1220 	int		ret = 0;
1221 
1222 	for (APLIST_TRAVERSE(apl, idx, sdp))
1223 		ret += ensure_sym_local(ofl, sdp, str);
1224 
1225 	return (ret);
1226 }
1227 
1228 /*
1229  * After all symbol table input processing has been finished, and all relocation
1230  * counting has been carried out (ie. no more symbols will be read, generated,
1231  * or modified), validate and count the relevant entries:
1232  *
1233  *  -	check and print any undefined symbols remaining.  Note that if a symbol
1234  *	has been defined by virtue of the inclusion of	an implicit shared
1235  *	library, it is still classed as undefined.
1236  *
1237  *  -	count the number of global needed symbols together with the size of
1238  *	their associated name strings (if scoping has been indicated these
1239  *	symbols may be reduced to locals).
1240  *
1241  *  -	establish the size and alignment requirements for the global .bss
1242  *	section (the alignment of this section is based on the first symbol
1243  *	that it will contain).
1244  */
1245 uintptr_t
1246 ld_sym_validate(Ofl_desc *ofl)
1247 {
1248 	Sym_avlnode	*sav;
1249 	Sym_desc	*sdp;
1250 	Sym		*sym;
1251 	ofl_flag_t	oflags = ofl->ofl_flags;
1252 	ofl_flag_t	undef = 0, needed = 0, verdesc = 0;
1253 	Xword		bssalign = 0, tlsalign = 0;
1254 	Boolean		need_bss, need_tlsbss;
1255 	Xword		bsssize = 0, tlssize = 0;
1256 #if	defined(_ELF64)
1257 	Xword		lbssalign = 0, lbsssize = 0;
1258 	Boolean		need_lbss;
1259 #endif
1260 	int		ret, allow_ldynsym;
1261 	uchar_t		type;
1262 	ofl_flag_t	undef_state = 0;
1263 
1264 	DBG_CALL(Dbg_basic_validate(ofl->ofl_lml));
1265 
1266 	/*
1267 	 * The need_XXX booleans are used to determine whether we need to
1268 	 * create each type of bss section. We used to create these sections
1269 	 * if the sum of the required sizes for each type were non-zero.
1270 	 * However, it is possible for a compiler to generate COMMON variables
1271 	 * of zero-length and this tricks that logic --- even zero-length
1272 	 * symbols need an output section.
1273 	 */
1274 	need_bss = need_tlsbss = FALSE;
1275 #if	defined(_ELF64)
1276 	need_lbss = FALSE;
1277 #endif
1278 
1279 	/*
1280 	 * Determine how undefined symbols are handled:
1281 	 *
1282 	 * fatal:
1283 	 *	If this link-edit calls for no undefined symbols to remain
1284 	 *	(this is the default case when generating an executable but
1285 	 *	can be enforced for any object using -z defs), a fatal error
1286 	 *	condition will be indicated.
1287 	 *
1288 	 * warning:
1289 	 *	If we're creating a shared object, and either the -Bsymbolic
1290 	 *	flag is set, or the user has turned on the -z guidance feature,
1291 	 *	then a non-fatal warning is issued for each symbol.
1292 	 *
1293 	 * ignore:
1294 	 *	In all other cases, undefined symbols are quietly allowed.
1295 	 */
1296 	if (oflags & FLG_OF_NOUNDEF) {
1297 		undef = FLG_OF_FATAL;
1298 	} else if (oflags & FLG_OF_SHAROBJ) {
1299 		if ((oflags & FLG_OF_SYMBOLIC) ||
1300 		    OFL_GUIDANCE(ofl, FLG_OFG_NO_DEFS))
1301 			undef = FLG_OF_WARN;
1302 	}
1303 
1304 	/*
1305 	 * If the symbol is referenced from an implicitly included shared object
1306 	 * (ie. it's not on the NEEDED list) then the symbol is also classified
1307 	 * as undefined and a fatal error condition will be indicated.
1308 	 */
1309 	if ((oflags & FLG_OF_NOUNDEF) || !(oflags & FLG_OF_SHAROBJ))
1310 		needed = FLG_OF_FATAL;
1311 	else if ((oflags & FLG_OF_SHAROBJ) &&
1312 	    OFL_GUIDANCE(ofl, FLG_OFG_NO_DEFS))
1313 		needed = FLG_OF_WARN;
1314 
1315 	/*
1316 	 * If the output image is being versioned, then all symbol definitions
1317 	 * must be associated with a version.  Any symbol that isn't associated
1318 	 * with a version is classified as undefined, and a fatal error
1319 	 * condition is indicated.
1320 	 */
1321 	if ((oflags & FLG_OF_VERDEF) && (ofl->ofl_vercnt > VER_NDX_GLOBAL))
1322 		verdesc = FLG_OF_FATAL;
1323 
1324 	allow_ldynsym = OFL_ALLOW_LDYNSYM(ofl);
1325 
1326 	if (allow_ldynsym) {
1327 		/*
1328 		 * Normally, we disallow symbols with 0 size from appearing
1329 		 * in a dyn[sym|tls]sort section. However, there are some
1330 		 * symbols that serve special purposes that we want to exempt
1331 		 * from this rule. Look them up, and set their
1332 		 * FLG_SY_DYNSORT flag.
1333 		 */
1334 		static const char *special[] = {
1335 			MSG_ORIG(MSG_SYM_INIT_U),	/* _init */
1336 			MSG_ORIG(MSG_SYM_FINI_U),	/* _fini */
1337 			MSG_ORIG(MSG_SYM_START),	/* _start */
1338 			NULL
1339 		};
1340 		int i;
1341 
1342 		for (i = 0; special[i] != NULL; i++) {
1343 			if (((sdp = ld_sym_find(special[i],
1344 			    SYM_NOHASH, NULL, ofl)) != NULL) &&
1345 			    (sdp->sd_sym->st_size == 0)) {
1346 				if (ld_sym_copy(sdp) == S_ERROR)
1347 					return (S_ERROR);
1348 				sdp->sd_flags |= FLG_SY_DYNSORT;
1349 			}
1350 		}
1351 	}
1352 
1353 	/*
1354 	 * Collect and validate the globals from the internal symbol table.
1355 	 */
1356 	for (sav = avl_first(&ofl->ofl_symavl); sav;
1357 	    sav = AVL_NEXT(&ofl->ofl_symavl, sav)) {
1358 		Is_desc		*isp;
1359 		int		undeferr = 0;
1360 		uchar_t		vis;
1361 
1362 		sdp = sav->sav_sdp;
1363 
1364 		/*
1365 		 * If undefined symbols are allowed, and we're not being
1366 		 * asked to supply guidance, ignore any symbols that are
1367 		 * not needed.
1368 		 */
1369 		if (!(oflags & FLG_OF_NOUNDEF) &&
1370 		    !OFL_GUIDANCE(ofl, FLG_OFG_NO_DEFS) &&
1371 		    (sdp->sd_ref == REF_DYN_SEEN))
1372 			continue;
1373 
1374 		/*
1375 		 * If the symbol originates from an external or parent mapfile
1376 		 * reference and hasn't been matched to a reference from a
1377 		 * relocatable object, ignore it.
1378 		 */
1379 		if ((sdp->sd_flags & (FLG_SY_EXTERN | FLG_SY_PARENT)) &&
1380 		    ((sdp->sd_flags & FLG_SY_MAPUSED) == 0)) {
1381 			sdp->sd_flags |= FLG_SY_INVALID;
1382 			continue;
1383 		}
1384 
1385 		sym = sdp->sd_sym;
1386 		type = ELF_ST_TYPE(sym->st_info);
1387 
1388 		/*
1389 		 * Sanity check TLS.
1390 		 */
1391 		if ((type == STT_TLS) && (sym->st_size != 0) &&
1392 		    (sym->st_shndx != SHN_UNDEF) &&
1393 		    (sym->st_shndx != SHN_COMMON)) {
1394 			Is_desc		*isp = sdp->sd_isc;
1395 			Ifl_desc	*ifl = sdp->sd_file;
1396 
1397 			if ((isp == NULL) || (isp->is_shdr == NULL) ||
1398 			    ((isp->is_shdr->sh_flags & SHF_TLS) == 0)) {
1399 				ld_eprintf(ofl, ERR_FATAL,
1400 				    MSG_INTL(MSG_SYM_TLS),
1401 				    demangle(sdp->sd_name), ifl->ifl_name);
1402 				continue;
1403 			}
1404 		}
1405 
1406 		if ((sdp->sd_flags & FLG_SY_VISIBLE) == 0)
1407 			ld_sym_adjust_vis(sdp, ofl);
1408 
1409 		if ((sdp->sd_flags & FLG_SY_REDUCED) &&
1410 		    (oflags & FLG_OF_PROCRED)) {
1411 			DBG_CALL(Dbg_syms_reduce(ofl, DBG_SYM_REDUCE_GLOBAL,
1412 			    sdp, 0, 0));
1413 		}
1414 
1415 		/*
1416 		 * Record any STV_SINGLETON existence.
1417 		 */
1418 		if ((vis = ELF_ST_VISIBILITY(sym->st_other)) == STV_SINGLETON)
1419 			ofl->ofl_dtflags_1 |= DF_1_SINGLETON;
1420 
1421 		/*
1422 		 * If building a shared object or executable, and this is a
1423 		 * non-weak UNDEF symbol with reduced visibility (STV_*), then
1424 		 * give a fatal error.
1425 		 */
1426 		if (((oflags & FLG_OF_RELOBJ) == 0) &&
1427 		    (sym->st_shndx == SHN_UNDEF) &&
1428 		    (ELF_ST_BIND(sym->st_info) != STB_WEAK)) {
1429 			if (vis && (vis != STV_SINGLETON)) {
1430 				sym_undef_entry(ofl, sdp, BNDLOCAL,
1431 				    FLG_OF_FATAL, &undef_state);
1432 				continue;
1433 			}
1434 		}
1435 
1436 		/*
1437 		 * If this symbol is defined in a non-allocatable section,
1438 		 * reduce it to local symbol.
1439 		 */
1440 		if (((isp = sdp->sd_isc) != 0) && isp->is_shdr &&
1441 		    ((isp->is_shdr->sh_flags & SHF_ALLOC) == 0)) {
1442 			sdp->sd_flags |= (FLG_SY_REDUCED | FLG_SY_HIDDEN);
1443 		}
1444 
1445 		/*
1446 		 * If this symbol originated as a SHN_SUNW_IGNORE, it will have
1447 		 * been processed as an SHN_UNDEF.  Return the symbol to its
1448 		 * original index for validation, and propagation to the output
1449 		 * file.
1450 		 */
1451 		if (sdp->sd_flags & FLG_SY_IGNORE)
1452 			sdp->sd_shndx = SHN_SUNW_IGNORE;
1453 
1454 		if (undef) {
1455 			/*
1456 			 * If a non-weak reference remains undefined, or if a
1457 			 * mapfile reference is not bound to the relocatable
1458 			 * objects that make up the object being built, we have
1459 			 * a fatal error.
1460 			 *
1461 			 * The exceptions are symbols which are defined to be
1462 			 * found in the parent (FLG_SY_PARENT), which is really
1463 			 * only meaningful for direct binding, or are defined
1464 			 * external (FLG_SY_EXTERN) so as to suppress -zdefs
1465 			 * errors.
1466 			 *
1467 			 * Register symbols are always allowed to be UNDEF.
1468 			 *
1469 			 * Note that we don't include references created via -u
1470 			 * in the same shared object binding test.  This is for
1471 			 * backward compatibility, in that a number of archive
1472 			 * makefile rules used -u to cause archive extraction.
1473 			 * These same rules have been cut and pasted to apply
1474 			 * to shared objects, and thus although the -u reference
1475 			 * is redundant, flagging it as fatal could cause some
1476 			 * build to fail.  Also we have documented the use of
1477 			 * -u as a mechanism to cause binding to weak version
1478 			 * definitions, thus giving users an error condition
1479 			 * would be incorrect.
1480 			 */
1481 			if (!(sdp->sd_flags & FLG_SY_REGSYM) &&
1482 			    ((sym->st_shndx == SHN_UNDEF) &&
1483 			    ((ELF_ST_BIND(sym->st_info) != STB_WEAK) &&
1484 			    ((sdp->sd_flags &
1485 			    (FLG_SY_PARENT | FLG_SY_EXTERN)) == 0)) ||
1486 			    ((sdp->sd_flags &
1487 			    (FLG_SY_MAPREF | FLG_SY_MAPUSED | FLG_SY_HIDDEN |
1488 			    FLG_SY_PROTECT)) == FLG_SY_MAPREF))) {
1489 				sym_undef_entry(ofl, sdp, UNDEF, undef,
1490 				    &undef_state);
1491 				undeferr = 1;
1492 			}
1493 
1494 		} else {
1495 			/*
1496 			 * For building things like shared objects (or anything
1497 			 * -znodefs), undefined symbols are allowed.
1498 			 *
1499 			 * If a mapfile reference remains undefined the user
1500 			 * would probably like a warning at least (they've
1501 			 * usually mis-spelt the reference).  Refer to the above
1502 			 * comments for discussion on -u references, which
1503 			 * are not tested for in the same manner.
1504 			 */
1505 			if ((sdp->sd_flags &
1506 			    (FLG_SY_MAPREF | FLG_SY_MAPUSED)) ==
1507 			    FLG_SY_MAPREF) {
1508 				sym_undef_entry(ofl, sdp, UNDEF, FLG_OF_WARN,
1509 				    &undef_state);
1510 				undeferr = 1;
1511 			}
1512 		}
1513 
1514 		/*
1515 		 * If this symbol comes from a dependency mark the dependency
1516 		 * as required (-z ignore can result in unused dependencies
1517 		 * being dropped).  If we need to record dependency versioning
1518 		 * information indicate what version of the needed shared object
1519 		 * this symbol is part of.  Flag the symbol as undefined if it
1520 		 * has not been made available to us.
1521 		 */
1522 		if ((sdp->sd_ref == REF_DYN_NEED) &&
1523 		    (!(sdp->sd_flags & FLG_SY_REFRSD))) {
1524 			sdp->sd_file->ifl_flags |= FLG_IF_DEPREQD;
1525 
1526 			/*
1527 			 * Capture that we've bound to a symbol that doesn't
1528 			 * allow being directly bound to.
1529 			 */
1530 			if (sdp->sd_flags & FLG_SY_NDIR)
1531 				ofl->ofl_flags1 |= FLG_OF1_NGLBDIR;
1532 
1533 			if (sdp->sd_file->ifl_vercnt) {
1534 				int		vndx;
1535 				Ver_index	*vip;
1536 
1537 				vndx = sdp->sd_aux->sa_dverndx;
1538 				vip = &sdp->sd_file->ifl_verndx[vndx];
1539 				if (vip->vi_flags & FLG_VER_AVAIL) {
1540 					vip->vi_flags |= FLG_VER_REFER;
1541 				} else {
1542 					sym_undef_entry(ofl, sdp, NOTAVAIL,
1543 					    FLG_OF_FATAL, &undef_state);
1544 					continue;
1545 				}
1546 			}
1547 		}
1548 
1549 		/*
1550 		 * Test that we do not bind to symbol supplied from an implicit
1551 		 * shared object.  If a binding is from a weak reference it can
1552 		 * be ignored.
1553 		 */
1554 		if (needed && !undeferr && (sdp->sd_flags & FLG_SY_GLOBREF) &&
1555 		    (sdp->sd_ref == REF_DYN_NEED) &&
1556 		    (sdp->sd_flags & FLG_SY_NOTAVAIL)) {
1557 			sym_undef_entry(ofl, sdp, IMPLICIT, needed,
1558 			    &undef_state);
1559 			if (needed == FLG_OF_FATAL)
1560 				continue;
1561 		}
1562 
1563 		/*
1564 		 * Test that a symbol isn't going to be reduced to local scope
1565 		 * which actually wants to bind to a shared object - if so it's
1566 		 * a fatal error.
1567 		 */
1568 		if ((sdp->sd_ref == REF_DYN_NEED) &&
1569 		    (sdp->sd_flags & (FLG_SY_HIDDEN | FLG_SY_PROTECT))) {
1570 			sym_undef_entry(ofl, sdp, BNDLOCAL, FLG_OF_FATAL,
1571 			    &undef_state);
1572 			continue;
1573 		}
1574 
1575 		/*
1576 		 * If the output image is to be versioned then all symbol
1577 		 * definitions must be associated with a version.  Remove any
1578 		 * versioning that might be left associated with an undefined
1579 		 * symbol.
1580 		 */
1581 		if (verdesc && (sdp->sd_ref == REF_REL_NEED)) {
1582 			if (sym->st_shndx == SHN_UNDEF) {
1583 				if (sdp->sd_aux && sdp->sd_aux->sa_overndx)
1584 					sdp->sd_aux->sa_overndx = 0;
1585 			} else {
1586 				if (!SYM_IS_HIDDEN(sdp) && sdp->sd_aux &&
1587 				    (sdp->sd_aux->sa_overndx == 0)) {
1588 					sym_undef_entry(ofl, sdp, NOVERSION,
1589 					    verdesc, &undef_state);
1590 					continue;
1591 				}
1592 			}
1593 		}
1594 
1595 		/*
1596 		 * If we don't need the symbol there's no need to process it
1597 		 * any further.
1598 		 */
1599 		if (sdp->sd_ref == REF_DYN_SEEN)
1600 			continue;
1601 
1602 		/*
1603 		 * Calculate the size and alignment requirements for the global
1604 		 * .bss and .tls sections.  If we're building a relocatable
1605 		 * object only account for scoped COMMON symbols (these will
1606 		 * be converted to .bss references).
1607 		 *
1608 		 * When -z nopartial is in effect, partially initialized
1609 		 * symbols are directed to the special .data section
1610 		 * created for that purpose (ofl->ofl_isparexpn).
1611 		 * Otherwise, partially initialized symbols go to .bss.
1612 		 *
1613 		 * Also refer to make_mvsections() in sunwmove.c
1614 		 */
1615 		if ((sym->st_shndx == SHN_COMMON) &&
1616 		    (((oflags & FLG_OF_RELOBJ) == 0) ||
1617 		    ld_sym_reducable(ofl, sdp))) {
1618 			if ((sdp->sd_move == NULL) ||
1619 			    ((sdp->sd_flags & FLG_SY_PAREXPN) == 0)) {
1620 				if (type != STT_TLS) {
1621 					need_bss = TRUE;
1622 					bsssize = (Xword)S_ROUND(bsssize,
1623 					    sym->st_value) + sym->st_size;
1624 					if (sym->st_value > bssalign)
1625 						bssalign = sym->st_value;
1626 				} else {
1627 					need_tlsbss = TRUE;
1628 					tlssize = (Xword)S_ROUND(tlssize,
1629 					    sym->st_value) + sym->st_size;
1630 					if (sym->st_value > tlsalign)
1631 						tlsalign = sym->st_value;
1632 				}
1633 			}
1634 		}
1635 
1636 #if	defined(_ELF64)
1637 		/*
1638 		 * Calculate the size and alignment requirement for the global
1639 		 * .lbss. TLS or partially initialized symbols do not need to be
1640 		 * considered yet.
1641 		 */
1642 		if ((ld_targ.t_m.m_mach == EM_AMD64) &&
1643 		    (sym->st_shndx == SHN_X86_64_LCOMMON)) {
1644 			need_lbss = TRUE;
1645 			lbsssize = (Xword)S_ROUND(lbsssize, sym->st_value) +
1646 			    sym->st_size;
1647 			if (sym->st_value > lbssalign)
1648 				lbssalign = sym->st_value;
1649 		}
1650 #endif
1651 		/*
1652 		 * If a symbol was referenced via the command line
1653 		 * (ld -u <>, ...), then this counts as a reference against the
1654 		 * symbol. Mark any section that symbol is defined in.
1655 		 */
1656 		if (((isp = sdp->sd_isc) != 0) &&
1657 		    (sdp->sd_flags & FLG_SY_CMDREF)) {
1658 			isp->is_flags |= FLG_IS_SECTREF;
1659 			isp->is_file->ifl_flags |= FLG_IF_FILEREF;
1660 		}
1661 
1662 		/*
1663 		 * Update the symbol count and the associated name string size.
1664 		 * Note, a capabilities symbol must remain as visible as a
1665 		 * global symbol.  However, the runtime linker recognizes the
1666 		 * hidden requirement and ensures the symbol isn't made globally
1667 		 * available at runtime.
1668 		 */
1669 		if (ld_sym_reducable(ofl, sdp)) {
1670 			/*
1671 			 * If any reductions are being processed, keep a count
1672 			 * of eliminated symbols, and if the symbol is being
1673 			 * reduced to local, count it's size for the .symtab.
1674 			 */
1675 			if (sdp->sd_flags & FLG_SY_ELIM) {
1676 				ofl->ofl_elimcnt++;
1677 			} else {
1678 				ofl->ofl_scopecnt++;
1679 				if ((((sdp->sd_flags & FLG_SY_REGSYM) == 0) ||
1680 				    sym->st_name) && (st_insert(ofl->ofl_strtab,
1681 				    sdp->sd_name) == -1))
1682 					return (S_ERROR);
1683 				if (allow_ldynsym && sym->st_name &&
1684 				    ldynsym_symtype[type]) {
1685 					ofl->ofl_dynscopecnt++;
1686 					if (st_insert(ofl->ofl_dynstrtab,
1687 					    sdp->sd_name) == -1)
1688 						return (S_ERROR);
1689 					/* Include it in sort section? */
1690 					DYNSORT_COUNT(sdp, sym, type, ++);
1691 				}
1692 			}
1693 		} else {
1694 			ofl->ofl_globcnt++;
1695 
1696 			/*
1697 			 * Check to see if this global variable should go into
1698 			 * a sort section. Sort sections require a
1699 			 * .SUNW_ldynsym section, so, don't check unless a
1700 			 * .SUNW_ldynsym is allowed.
1701 			 */
1702 			if (allow_ldynsym)
1703 				DYNSORT_COUNT(sdp, sym, type, ++);
1704 
1705 			/*
1706 			 * If global direct bindings are in effect, or this
1707 			 * symbol has bound to a dependency which was specified
1708 			 * as requiring direct bindings, and it hasn't
1709 			 * explicitly been defined as a non-direct binding
1710 			 * symbol, mark it.
1711 			 */
1712 			if (((ofl->ofl_dtflags_1 & DF_1_DIRECT) || (isp &&
1713 			    (isp->is_file->ifl_flags & FLG_IF_DIRECT))) &&
1714 			    ((sdp->sd_flags & FLG_SY_NDIR) == 0))
1715 				sdp->sd_flags |= FLG_SY_DIR;
1716 
1717 			/*
1718 			 * Insert the symbol name.
1719 			 */
1720 			if (((sdp->sd_flags & FLG_SY_REGSYM) == 0) ||
1721 			    sym->st_name) {
1722 				if (st_insert(ofl->ofl_strtab,
1723 				    sdp->sd_name) == -1)
1724 					return (S_ERROR);
1725 
1726 				if (!(ofl->ofl_flags & FLG_OF_RELOBJ) &&
1727 				    (st_insert(ofl->ofl_dynstrtab,
1728 				    sdp->sd_name) == -1))
1729 					return (S_ERROR);
1730 			}
1731 
1732 			/*
1733 			 * If this section offers a global symbol - record that
1734 			 * fact.
1735 			 */
1736 			if (isp) {
1737 				isp->is_flags |= FLG_IS_SECTREF;
1738 				isp->is_file->ifl_flags |= FLG_IF_FILEREF;
1739 			}
1740 		}
1741 	}
1742 
1743 	/*
1744 	 * Guidance: Use -z defs|nodefs when building shared objects.
1745 	 *
1746 	 * Our caller issues this, unless we mask it out here. So we mask it
1747 	 * out unless we've issued at least one warnings or fatal error.
1748 	 */
1749 	if (!((oflags & FLG_OF_SHAROBJ) && OFL_GUIDANCE(ofl, FLG_OFG_NO_DEFS) &&
1750 	    (undef_state & (FLG_OF_FATAL | FLG_OF_WARN))))
1751 		ofl->ofl_guideflags |= FLG_OFG_NO_DEFS;
1752 
1753 	/*
1754 	 * If we've encountered a fatal error during symbol validation then
1755 	 * return now.
1756 	 */
1757 	if (ofl->ofl_flags & FLG_OF_FATAL)
1758 		return (1);
1759 
1760 	/*
1761 	 * Now that symbol resolution is completed, scan any register symbols.
1762 	 * From now on, we're only interested in those that contribute to the
1763 	 * output file.
1764 	 */
1765 	if (ofl->ofl_regsyms) {
1766 		int	ndx;
1767 
1768 		for (ndx = 0; ndx < ofl->ofl_regsymsno; ndx++) {
1769 			if ((sdp = ofl->ofl_regsyms[ndx]) == NULL)
1770 				continue;
1771 			if (sdp->sd_ref != REF_REL_NEED) {
1772 				ofl->ofl_regsyms[ndx] = NULL;
1773 				continue;
1774 			}
1775 
1776 			ofl->ofl_regsymcnt++;
1777 			if (sdp->sd_sym->st_name == 0)
1778 				sdp->sd_name = MSG_ORIG(MSG_STR_EMPTY);
1779 
1780 			if (SYM_IS_HIDDEN(sdp) ||
1781 			    (ELF_ST_BIND(sdp->sd_sym->st_info) == STB_LOCAL))
1782 				ofl->ofl_lregsymcnt++;
1783 		}
1784 	}
1785 
1786 	/*
1787 	 * Generate the .bss section now that we know its size and alignment.
1788 	 */
1789 	if (need_bss) {
1790 		if (ld_make_bss(ofl, bsssize, bssalign,
1791 		    ld_targ.t_id.id_bss) == S_ERROR)
1792 			return (S_ERROR);
1793 	}
1794 	if (need_tlsbss) {
1795 		if (ld_make_bss(ofl, tlssize, tlsalign,
1796 		    ld_targ.t_id.id_tlsbss) == S_ERROR)
1797 			return (S_ERROR);
1798 	}
1799 #if	defined(_ELF64)
1800 	if ((ld_targ.t_m.m_mach == EM_AMD64) &&
1801 	    need_lbss && !(oflags & FLG_OF_RELOBJ)) {
1802 		if (ld_make_bss(ofl, lbsssize, lbssalign,
1803 		    ld_targ.t_id.id_lbss) == S_ERROR)
1804 			return (S_ERROR);
1805 	}
1806 #endif
1807 	/*
1808 	 * Determine what entry point symbol we need, and if found save its
1809 	 * symbol descriptor so that we can update the ELF header entry with the
1810 	 * symbols value later (see update_oehdr).  Make sure the symbol is
1811 	 * tagged to ensure its update in case -s is in effect.  Use any -e
1812 	 * option first, or the default entry points `_start' and `main'.
1813 	 */
1814 	ret = 0;
1815 	if (ofl->ofl_entry) {
1816 		if ((sdp = ld_sym_find(ofl->ofl_entry, SYM_NOHASH,
1817 		    NULL, ofl)) == NULL) {
1818 			ld_eprintf(ofl, ERR_FATAL, MSG_INTL(MSG_ARG_NOENTRY),
1819 			    ofl->ofl_entry);
1820 			ret++;
1821 		} else if (ensure_sym_local(ofl, sdp,
1822 		    MSG_INTL(MSG_SYM_ENTRY)) != 0) {
1823 			ret++;
1824 		} else {
1825 			ofl->ofl_entry = (void *)sdp;
1826 		}
1827 	} else if (((sdp = ld_sym_find(MSG_ORIG(MSG_SYM_START),
1828 	    SYM_NOHASH, NULL, ofl)) != NULL) && (ensure_sym_local(ofl,
1829 	    sdp, 0) == 0)) {
1830 		ofl->ofl_entry = (void *)sdp;
1831 
1832 	} else if (((sdp = ld_sym_find(MSG_ORIG(MSG_SYM_MAIN),
1833 	    SYM_NOHASH, NULL, ofl)) != NULL) && (ensure_sym_local(ofl,
1834 	    sdp, 0) == 0)) {
1835 		ofl->ofl_entry = (void *)sdp;
1836 	}
1837 
1838 	/*
1839 	 * If ld -zdtrace=<sym> was given, then validate that the symbol is
1840 	 * defined within the current object being built.
1841 	 */
1842 	if ((sdp = ofl->ofl_dtracesym) != 0)
1843 		ret += ensure_sym_local(ofl, sdp, MSG_ORIG(MSG_STR_DTRACE));
1844 
1845 	/*
1846 	 * If any initarray, finiarray or preinitarray functions have been
1847 	 * requested, make sure they are defined within the current object
1848 	 * being built.
1849 	 */
1850 	if (ofl->ofl_initarray) {
1851 		ret += ensure_array_local(ofl, ofl->ofl_initarray,
1852 		    MSG_ORIG(MSG_SYM_INITARRAY));
1853 	}
1854 	if (ofl->ofl_finiarray) {
1855 		ret += ensure_array_local(ofl, ofl->ofl_finiarray,
1856 		    MSG_ORIG(MSG_SYM_FINIARRAY));
1857 	}
1858 	if (ofl->ofl_preiarray) {
1859 		ret += ensure_array_local(ofl, ofl->ofl_preiarray,
1860 		    MSG_ORIG(MSG_SYM_PREINITARRAY));
1861 	}
1862 
1863 	if (ret)
1864 		return (S_ERROR);
1865 
1866 	/*
1867 	 * If we're required to record any needed dependencies versioning
1868 	 * information calculate it now that all symbols have been validated.
1869 	 */
1870 	if ((oflags & (FLG_OF_VERNEED | FLG_OF_NOVERSEC)) == FLG_OF_VERNEED)
1871 		return (ld_vers_check_need(ofl));
1872 	else
1873 		return (1);
1874 }
1875 
1876 /*
1877  * qsort(3c) comparison function.  As an optimization for associating weak
1878  * symbols to their strong counterparts sort global symbols according to their
1879  * section index, address and binding.
1880  */
1881 static int
1882 compare(const void *sdpp1, const void *sdpp2)
1883 {
1884 	Sym_desc	*sdp1 = *((Sym_desc **)sdpp1);
1885 	Sym_desc	*sdp2 = *((Sym_desc **)sdpp2);
1886 	Sym		*sym1, *sym2;
1887 	uchar_t		bind1, bind2;
1888 
1889 	/*
1890 	 * Symbol descriptors may be zero, move these to the front of the
1891 	 * sorted array.
1892 	 */
1893 	if (sdp1 == NULL)
1894 		return (-1);
1895 	if (sdp2 == NULL)
1896 		return (1);
1897 
1898 	sym1 = sdp1->sd_sym;
1899 	sym2 = sdp2->sd_sym;
1900 
1901 	/*
1902 	 * Compare the symbols section index.  This is important when sorting
1903 	 * the symbol tables of relocatable objects.  In this case, a symbols
1904 	 * value is the offset within the associated section, and thus many
1905 	 * symbols can have the same value, but are effectively different
1906 	 * addresses.
1907 	 */
1908 	if (sym1->st_shndx > sym2->st_shndx)
1909 		return (1);
1910 	if (sym1->st_shndx < sym2->st_shndx)
1911 		return (-1);
1912 
1913 	/*
1914 	 * Compare the symbols value (address).
1915 	 */
1916 	if (sym1->st_value > sym2->st_value)
1917 		return (1);
1918 	if (sym1->st_value < sym2->st_value)
1919 		return (-1);
1920 
1921 	bind1 = ELF_ST_BIND(sym1->st_info);
1922 	bind2 = ELF_ST_BIND(sym2->st_info);
1923 
1924 	/*
1925 	 * If two symbols have the same address place the weak symbol before
1926 	 * any strong counterpart.
1927 	 */
1928 	if (bind1 > bind2)
1929 		return (-1);
1930 	if (bind1 < bind2)
1931 		return (1);
1932 
1933 	return (0);
1934 }
1935 
1936 /*
1937  * Issue a MSG_SYM_BADADDR error from ld_sym_process(). This error
1938  * is issued when a symbol address/size is not contained by the
1939  * target section.
1940  *
1941  * Such objects are at least partially corrupt, and the user would
1942  * be well advised to be skeptical of them, and to ask their compiler
1943  * supplier to fix the problem. However, a distinction needs to be
1944  * made between symbols that reference readonly text, and those that
1945  * access writable data. Other than throwing off profiling results,
1946  * the readonly section case is less serious. We have encountered
1947  * such objects in the field. In order to allow existing objects
1948  * to continue working, we issue a warning rather than a fatal error
1949  * if the symbol is against readonly text. Other cases are fatal.
1950  */
1951 static void
1952 issue_badaddr_msg(Ifl_desc *ifl, Ofl_desc *ofl, Sym_desc *sdp,
1953     Sym *sym, Word shndx)
1954 {
1955 	Error		err;
1956 	const char	*msg;
1957 
1958 	if ((sdp->sd_isc->is_shdr->sh_flags & (SHF_WRITE | SHF_ALLOC)) ==
1959 	    SHF_ALLOC) {
1960 		msg = MSG_INTL(MSG_SYM_BADADDR_ROTXT);
1961 		err = ERR_WARNING;
1962 	} else {
1963 		msg = MSG_INTL(MSG_SYM_BADADDR);
1964 		err = ERR_FATAL;
1965 	}
1966 
1967 	ld_eprintf(ofl, err, msg, demangle(sdp->sd_name),
1968 	    ifl->ifl_name, shndx, sdp->sd_isc->is_name,
1969 	    EC_XWORD(sdp->sd_isc->is_shdr->sh_size),
1970 	    EC_XWORD(sym->st_value), EC_XWORD(sym->st_size));
1971 }
1972 
1973 /*
1974  * Global symbols that are candidates for translation to local capability
1975  * symbols under -z symbolcap, are maintained on a local symbol list.  Once
1976  * all symbols of a file are processed, this list is traversed to cull any
1977  * unnecessary weak symbol aliases.
1978  */
1979 typedef struct {
1980 	Sym_desc	*c_nsdp;	/* new lead symbol */
1981 	Sym_desc	*c_osdp;	/* original symbol */
1982 	Cap_group	*c_group;	/* symbol capability group */
1983 	Word		c_ndx;		/* symbol index */
1984 } Cap_pair;
1985 
1986 /*
1987  * Process the symbol table for the specified input file.  At this point all
1988  * input sections from this input file have been assigned an input section
1989  * descriptor which is saved in the `ifl_isdesc' array.
1990  *
1991  *  -	local symbols are saved (as is) if the input file is a relocatable
1992  *	object
1993  *
1994  *  -	global symbols are added to the linkers internal symbol table if they
1995  *	are not already present, otherwise a symbol resolution function is
1996  *	called upon to resolve the conflict.
1997  */
1998 uintptr_t
1999 ld_sym_process(Is_desc *isc, Ifl_desc *ifl, Ofl_desc *ofl)
2000 {
2001 	/*
2002 	 * This macro tests the given symbol to see if it is out of
2003 	 * range relative to the section it references.
2004 	 *
2005 	 * entry:
2006 	 *	- ifl is a relative object (ET_REL)
2007 	 *	_sdp - Symbol descriptor
2008 	 *	_sym - Symbol
2009 	 *	_type - Symbol type
2010 	 *
2011 	 * The following are tested:
2012 	 *	- Symbol length is non-zero
2013 	 *	- Symbol type is a type that references code or data
2014 	 *	- Referenced section is not 0 (indicates an UNDEF symbol)
2015 	 *	  and is not in the range of special values above SHN_LORESERVE
2016 	 *	  (excluding SHN_XINDEX, which is OK).
2017 	 *	- We have a valid section header for the target section
2018 	 *
2019 	 * If the above are all true, and the symbol position is not
2020 	 * contained by the target section, this macro evaluates to
2021 	 * True (1). Otherwise, False(0).
2022 	 */
2023 #define	SYM_LOC_BADADDR(_sdp, _sym, _type) \
2024 	(_sym->st_size && dynsymsort_symtype[_type] && \
2025 	(_sym->st_shndx != SHN_UNDEF) && \
2026 	((_sym->st_shndx < SHN_LORESERVE) || \
2027 		(_sym->st_shndx == SHN_XINDEX)) && \
2028 	_sdp->sd_isc && _sdp->sd_isc->is_shdr && \
2029 	((_sym->st_value + _sym->st_size) > _sdp->sd_isc->is_shdr->sh_size))
2030 
2031 	Conv_inv_buf_t	inv_buf;
2032 	Sym		*sym = (Sym *)isc->is_indata->d_buf;
2033 	Word		*symshndx = NULL;
2034 	Shdr		*shdr = isc->is_shdr;
2035 	Sym_desc	*sdp;
2036 	size_t		strsize;
2037 	char		*strs;
2038 	uchar_t		type, bind;
2039 	Word		ndx, hash, local, total;
2040 	uchar_t		osabi = ifl->ifl_ehdr->e_ident[EI_OSABI];
2041 	Half		mach = ifl->ifl_ehdr->e_machine;
2042 	Half		etype = ifl->ifl_ehdr->e_type;
2043 	int		etype_rel;
2044 	const char	*symsecname, *strsecname;
2045 	Word		symsecndx;
2046 	avl_index_t	where;
2047 	int		test_gnu_hidden_bit, weak;
2048 	Cap_desc	*cdp = NULL;
2049 	Alist		*cappairs = NULL;
2050 
2051 	/*
2052 	 * Its possible that a file may contain more that one symbol table,
2053 	 * ie. .dynsym and .symtab in a shared library.  Only process the first
2054 	 * table (here, we assume .dynsym comes before .symtab).
2055 	 */
2056 	if (ifl->ifl_symscnt)
2057 		return (1);
2058 
2059 	if (isc->is_symshndx)
2060 		symshndx = isc->is_symshndx->is_indata->d_buf;
2061 
2062 	DBG_CALL(Dbg_syms_process(ofl->ofl_lml, ifl));
2063 
2064 	symsecndx = isc->is_scnndx;
2065 	if (isc->is_name)
2066 		symsecname = isc->is_name;
2067 	else
2068 		symsecname = MSG_ORIG(MSG_STR_EMPTY);
2069 
2070 	/*
2071 	 * From the symbol tables section header information determine which
2072 	 * strtab table is needed to locate the actual symbol names.
2073 	 */
2074 	if (ifl->ifl_flags & FLG_IF_HSTRTAB) {
2075 		ndx = shdr->sh_link;
2076 		if ((ndx == 0) || (ndx >= ifl->ifl_shnum)) {
2077 			ld_eprintf(ofl, ERR_FATAL,
2078 			    MSG_INTL(MSG_FIL_INVSHLINK), ifl->ifl_name,
2079 			    EC_WORD(symsecndx), symsecname, EC_XWORD(ndx));
2080 			return (S_ERROR);
2081 		}
2082 		strsize = ifl->ifl_isdesc[ndx]->is_shdr->sh_size;
2083 		strs = ifl->ifl_isdesc[ndx]->is_indata->d_buf;
2084 		if (ifl->ifl_isdesc[ndx]->is_name)
2085 			strsecname = ifl->ifl_isdesc[ndx]->is_name;
2086 		else
2087 			strsecname = MSG_ORIG(MSG_STR_EMPTY);
2088 	} else {
2089 		/*
2090 		 * There is no string table section in this input file
2091 		 * although there are symbols in this symbol table section.
2092 		 * This means that these symbols do not have names.
2093 		 * Currently, only scratch register symbols are allowed
2094 		 * not to have names.
2095 		 */
2096 		strsize = 0;
2097 		strs = (char *)MSG_ORIG(MSG_STR_EMPTY);
2098 		strsecname = MSG_ORIG(MSG_STR_EMPTY);
2099 	}
2100 
2101 	/*
2102 	 * Determine the number of local symbols together with the total
2103 	 * number we have to process.
2104 	 */
2105 	total = (Word)(shdr->sh_size / shdr->sh_entsize);
2106 	local = shdr->sh_info;
2107 
2108 	/*
2109 	 * Allocate a symbol table index array and a local symbol array
2110 	 * (global symbols are processed and added to the ofl->ofl_symbkt[]
2111 	 * array).  If we are dealing with a relocatable object, allocate the
2112 	 * local symbol descriptors.  If this isn't a relocatable object we
2113 	 * still have to process any shared object locals to determine if any
2114 	 * register symbols exist.  Although these aren't added to the output
2115 	 * image, they are used as part of symbol resolution.
2116 	 */
2117 	if ((ifl->ifl_oldndx = libld_malloc((size_t)(total *
2118 	    sizeof (Sym_desc *)))) == NULL)
2119 		return (S_ERROR);
2120 	etype_rel = (etype == ET_REL);
2121 	if (etype_rel && local) {
2122 		if ((ifl->ifl_locs =
2123 		    libld_calloc(sizeof (Sym_desc), local)) == NULL)
2124 			return (S_ERROR);
2125 		/* LINTED */
2126 		ifl->ifl_locscnt = (Word)local;
2127 	}
2128 	ifl->ifl_symscnt = total;
2129 
2130 	/*
2131 	 * If there are local symbols to save add them to the symbol table
2132 	 * index array.
2133 	 */
2134 	if (local) {
2135 		int		allow_ldynsym = OFL_ALLOW_LDYNSYM(ofl);
2136 		Sym_desc	*last_file_sdp = NULL;
2137 		int		last_file_ndx = 0;
2138 
2139 		for (sym++, ndx = 1; ndx < local; sym++, ndx++) {
2140 			sd_flag_t	sdflags = FLG_SY_CLEAN;
2141 			Word		shndx;
2142 			const char	*name;
2143 			Sym_desc	*rsdp;
2144 			int		shndx_bad = 0;
2145 			int		symtab_enter = 1;
2146 
2147 			/*
2148 			 * Determine and validate the associated section index.
2149 			 */
2150 			if (symshndx && (sym->st_shndx == SHN_XINDEX)) {
2151 				shndx = symshndx[ndx];
2152 			} else if ((shndx = sym->st_shndx) >= SHN_LORESERVE) {
2153 				sdflags |= FLG_SY_SPECSEC;
2154 			} else if (shndx > ifl->ifl_shnum) {
2155 				/* We need the name before we can issue error */
2156 				shndx_bad = 1;
2157 			}
2158 
2159 			/*
2160 			 * Check if st_name has a valid value or not.
2161 			 */
2162 			if ((name = string(ofl, ifl, sym, strs, strsize, ndx,
2163 			    shndx, symsecndx, symsecname, strsecname,
2164 			    &sdflags)) == NULL)
2165 				continue;
2166 
2167 			/*
2168 			 * Now that we have the name, if the section index
2169 			 * was bad, report it.
2170 			 */
2171 			if (shndx_bad) {
2172 				ld_eprintf(ofl, ERR_WARNING,
2173 				    MSG_INTL(MSG_SYM_INVSHNDX),
2174 				    demangle_symname(name, symsecname, ndx),
2175 				    ifl->ifl_name,
2176 				    conv_sym_shndx(osabi, mach, sym->st_shndx,
2177 				    CONV_FMT_DECIMAL, &inv_buf));
2178 				continue;
2179 			}
2180 
2181 			/*
2182 			 * If this local symbol table originates from a shared
2183 			 * object, then we're only interested in recording
2184 			 * register symbols.  As local symbol descriptors aren't
2185 			 * allocated for shared objects, one will be allocated
2186 			 * to associated with the register symbol.  This symbol
2187 			 * won't become part of the output image, but we must
2188 			 * process it to test for register conflicts.
2189 			 */
2190 			rsdp = sdp = NULL;
2191 			if (sdflags & FLG_SY_REGSYM) {
2192 				/*
2193 				 * The presence of FLG_SY_REGSYM means that
2194 				 * the pointers in ld_targ.t_ms are non-NULL.
2195 				 */
2196 				rsdp = (*ld_targ.t_ms.ms_reg_find)(sym, ofl);
2197 				if (rsdp != 0) {
2198 					/*
2199 					 * The fact that another register def-
2200 					 * inition has been found is fatal.
2201 					 * Call the verification routine to get
2202 					 * the error message and move on.
2203 					 */
2204 					(void) (*ld_targ.t_ms.ms_reg_check)
2205 					    (rsdp, sym, name, ifl, ofl);
2206 					continue;
2207 				}
2208 
2209 				if (etype == ET_DYN) {
2210 					if ((sdp = libld_calloc(
2211 					    sizeof (Sym_desc), 1)) == NULL)
2212 						return (S_ERROR);
2213 					sdp->sd_ref = REF_DYN_SEEN;
2214 
2215 					/* Will not appear in output object */
2216 					symtab_enter = 0;
2217 				}
2218 			} else if (etype == ET_DYN)
2219 				continue;
2220 
2221 			/*
2222 			 * Fill in the remaining symbol descriptor information.
2223 			 */
2224 			if (sdp == NULL) {
2225 				sdp = &(ifl->ifl_locs[ndx]);
2226 				sdp->sd_ref = REF_REL_NEED;
2227 				sdp->sd_symndx = ndx;
2228 			}
2229 			if (rsdp == NULL) {
2230 				sdp->sd_name = name;
2231 				sdp->sd_sym = sym;
2232 				sdp->sd_shndx = shndx;
2233 				sdp->sd_flags = sdflags;
2234 				sdp->sd_file = ifl;
2235 				ifl->ifl_oldndx[ndx] = sdp;
2236 			}
2237 
2238 			DBG_CALL(Dbg_syms_entry(ofl->ofl_lml, ndx, sdp));
2239 
2240 			/*
2241 			 * Reclassify any SHN_SUNW_IGNORE symbols to SHN_UNDEF
2242 			 * so as to simplify future processing.
2243 			 */
2244 			if (sym->st_shndx == SHN_SUNW_IGNORE) {
2245 				sdp->sd_shndx = shndx = SHN_UNDEF;
2246 				sdp->sd_flags |= (FLG_SY_IGNORE | FLG_SY_ELIM);
2247 			}
2248 
2249 			/*
2250 			 * Process any register symbols.
2251 			 */
2252 			if (sdp->sd_flags & FLG_SY_REGSYM) {
2253 				/*
2254 				 * Add a diagnostic to indicate we've caught a
2255 				 * register symbol, as this can be useful if a
2256 				 * register conflict is later discovered.
2257 				 */
2258 				DBG_CALL(Dbg_syms_entered(ofl, sym, sdp));
2259 
2260 				/*
2261 				 * If this register symbol hasn't already been
2262 				 * recorded, enter it now.
2263 				 *
2264 				 * The presence of FLG_SY_REGSYM means that
2265 				 * the pointers in ld_targ.t_ms are non-NULL.
2266 				 */
2267 				if ((rsdp == NULL) &&
2268 				    ((*ld_targ.t_ms.ms_reg_enter)(sdp, ofl) ==
2269 				    0))
2270 					return (S_ERROR);
2271 			}
2272 
2273 			/*
2274 			 * Assign an input section.
2275 			 */
2276 			if ((sym->st_shndx != SHN_UNDEF) &&
2277 			    ((sdp->sd_flags & FLG_SY_SPECSEC) == 0))
2278 				sdp->sd_isc = ifl->ifl_isdesc[shndx];
2279 
2280 			/*
2281 			 * If this symbol falls within the range of a section
2282 			 * being discarded, then discard the symbol itself.
2283 			 * There is no reason to keep this local symbol.
2284 			 */
2285 			if (sdp->sd_isc &&
2286 			    (sdp->sd_isc->is_flags & FLG_IS_DISCARD)) {
2287 				sdp->sd_flags |= FLG_SY_ISDISC;
2288 				DBG_CALL(Dbg_syms_discarded(ofl->ofl_lml, sdp));
2289 				continue;
2290 			}
2291 
2292 			/*
2293 			 * Skip any section symbols as new versions of these
2294 			 * will be created.
2295 			 */
2296 			if ((type = ELF_ST_TYPE(sym->st_info)) == STT_SECTION) {
2297 				if (sym->st_shndx == SHN_UNDEF) {
2298 					ld_eprintf(ofl, ERR_WARNING,
2299 					    MSG_INTL(MSG_SYM_INVSHNDX),
2300 					    demangle_symname(name, symsecname,
2301 					    ndx), ifl->ifl_name,
2302 					    conv_sym_shndx(osabi, mach,
2303 					    sym->st_shndx, CONV_FMT_DECIMAL,
2304 					    &inv_buf));
2305 				}
2306 				continue;
2307 			}
2308 
2309 			/*
2310 			 * For a relocatable object, if this symbol is defined
2311 			 * and has non-zero length and references an address
2312 			 * within an associated section, then check its extents
2313 			 * to make sure the section boundaries encompass it.
2314 			 * If they don't, the ELF file is corrupt.
2315 			 */
2316 			if (etype_rel) {
2317 				if (SYM_LOC_BADADDR(sdp, sym, type)) {
2318 					issue_badaddr_msg(ifl, ofl, sdp,
2319 					    sym, shndx);
2320 					if (ofl->ofl_flags & FLG_OF_FATAL)
2321 						continue;
2322 				}
2323 
2324 				/*
2325 				 * We have observed relocatable objects
2326 				 * containing identical adjacent STT_FILE
2327 				 * symbols. Discard any other than the first,
2328 				 * as they are all equivalent and the extras
2329 				 * do not add information.
2330 				 *
2331 				 * For the purpose of this test, we assume
2332 				 * that only the symbol type and the string
2333 				 * table offset (st_name) matter.
2334 				 */
2335 				if (type == STT_FILE) {
2336 					int toss = (last_file_sdp != NULL) &&
2337 					    ((ndx - 1) == last_file_ndx) &&
2338 					    (sym->st_name ==
2339 					    last_file_sdp->sd_sym->st_name);
2340 
2341 					last_file_sdp = sdp;
2342 					last_file_ndx = ndx;
2343 					if (toss) {
2344 						sdp->sd_flags |= FLG_SY_INVALID;
2345 						DBG_CALL(Dbg_syms_dup_discarded(
2346 						    ofl->ofl_lml, ndx, sdp));
2347 						continue;
2348 					}
2349 				}
2350 			}
2351 
2352 
2353 			/*
2354 			 * Sanity check for TLS
2355 			 */
2356 			if ((sym->st_size != 0) && ((type == STT_TLS) &&
2357 			    (sym->st_shndx != SHN_COMMON))) {
2358 				Is_desc	*isp = sdp->sd_isc;
2359 
2360 				if ((isp == NULL) || (isp->is_shdr == NULL) ||
2361 				    ((isp->is_shdr->sh_flags & SHF_TLS) == 0)) {
2362 					ld_eprintf(ofl, ERR_FATAL,
2363 					    MSG_INTL(MSG_SYM_TLS),
2364 					    demangle(sdp->sd_name),
2365 					    ifl->ifl_name);
2366 					continue;
2367 				}
2368 			}
2369 
2370 			/*
2371 			 * Carry our some basic sanity checks (these are just
2372 			 * some of the erroneous symbol entries we've come
2373 			 * across, there's probably a lot more).  The symbol
2374 			 * will not be carried forward to the output file, which
2375 			 * won't be a problem unless a relocation is required
2376 			 * against it.
2377 			 */
2378 			if (((sdp->sd_flags & FLG_SY_SPECSEC) &&
2379 			    ((sym->st_shndx == SHN_COMMON)) ||
2380 			    ((type == STT_FILE) &&
2381 			    (sym->st_shndx != SHN_ABS))) ||
2382 			    (sdp->sd_isc && (sdp->sd_isc->is_osdesc == NULL))) {
2383 				ld_eprintf(ofl, ERR_WARNING,
2384 				    MSG_INTL(MSG_SYM_INVSHNDX),
2385 				    demangle_symname(name, symsecname, ndx),
2386 				    ifl->ifl_name,
2387 				    conv_sym_shndx(osabi, mach, sym->st_shndx,
2388 				    CONV_FMT_DECIMAL, &inv_buf));
2389 				sdp->sd_isc = NULL;
2390 				sdp->sd_flags |= FLG_SY_INVALID;
2391 				continue;
2392 			}
2393 
2394 			/*
2395 			 * As these local symbols will become part of the output
2396 			 * image, record their number and name string size.
2397 			 * Globals are counted after all input file processing
2398 			 * (and hence symbol resolution) is complete during
2399 			 * sym_validate().
2400 			 */
2401 			if (!(ofl->ofl_flags & FLG_OF_REDLSYM) &&
2402 			    symtab_enter) {
2403 				ofl->ofl_locscnt++;
2404 
2405 				if ((((sdp->sd_flags & FLG_SY_REGSYM) == 0) ||
2406 				    sym->st_name) && (st_insert(ofl->ofl_strtab,
2407 				    sdp->sd_name) == -1))
2408 					return (S_ERROR);
2409 
2410 				if (allow_ldynsym && sym->st_name &&
2411 				    ldynsym_symtype[type]) {
2412 					ofl->ofl_dynlocscnt++;
2413 					if (st_insert(ofl->ofl_dynstrtab,
2414 					    sdp->sd_name) == -1)
2415 						return (S_ERROR);
2416 					/* Include it in sort section? */
2417 					DYNSORT_COUNT(sdp, sym, type, ++);
2418 				}
2419 			}
2420 		}
2421 	}
2422 
2423 	/*
2424 	 * The GNU ld interprets the top bit of the 16-bit Versym value
2425 	 * (0x8000) as the "hidden" bit. If this bit is set, the linker
2426 	 * is supposed to act as if that symbol does not exist. The Solaris
2427 	 * linker does not support this mechanism, or the model of interface
2428 	 * evolution that it allows, but we honor it in GNU ld produced
2429 	 * objects in order to interoperate with them.
2430 	 *
2431 	 * Determine if we should honor the GNU hidden bit for this file.
2432 	 */
2433 	test_gnu_hidden_bit = ((ifl->ifl_flags & FLG_IF_GNUVER) != 0) &&
2434 	    (ifl->ifl_versym != NULL);
2435 
2436 	/*
2437 	 * Determine whether object capabilities for this file are being
2438 	 * converted into symbol capabilities.  If so, global function symbols,
2439 	 * and initialized global data symbols, need special translation and
2440 	 * processing.
2441 	 */
2442 	if ((etype == ET_REL) && (ifl->ifl_flags & FLG_IF_OTOSCAP))
2443 		cdp = ifl->ifl_caps;
2444 
2445 	/*
2446 	 * Now scan the global symbols entering them in the internal symbol
2447 	 * table or resolving them as necessary.
2448 	 */
2449 	sym = (Sym *)isc->is_indata->d_buf;
2450 	sym += local;
2451 	weak = 0;
2452 	/* LINTED */
2453 	for (ndx = (int)local; ndx < total; sym++, ndx++) {
2454 		const char	*name;
2455 		sd_flag_t	sdflags = 0;
2456 		Word		shndx;
2457 		int		shndx_bad = 0;
2458 		Sym		*nsym = sym;
2459 		Cap_pair	*cpp = NULL;
2460 		uchar_t		ntype;
2461 
2462 		/*
2463 		 * Determine and validate the associated section index.
2464 		 */
2465 		if (symshndx && (nsym->st_shndx == SHN_XINDEX)) {
2466 			shndx = symshndx[ndx];
2467 		} else if ((shndx = nsym->st_shndx) >= SHN_LORESERVE) {
2468 			sdflags |= FLG_SY_SPECSEC;
2469 		} else if (shndx > ifl->ifl_shnum) {
2470 			/* We need the name before we can issue error */
2471 			shndx_bad = 1;
2472 		}
2473 
2474 		/*
2475 		 * Check if st_name has a valid value or not.
2476 		 */
2477 		if ((name = string(ofl, ifl, nsym, strs, strsize, ndx, shndx,
2478 		    symsecndx, symsecname, strsecname, &sdflags)) == NULL)
2479 			continue;
2480 
2481 		/*
2482 		 * Now that we have the name, report an erroneous section index.
2483 		 */
2484 		if (shndx_bad) {
2485 			ld_eprintf(ofl, ERR_WARNING, MSG_INTL(MSG_SYM_INVSHNDX),
2486 			    demangle_symname(name, symsecname, ndx),
2487 			    ifl->ifl_name,
2488 			    conv_sym_shndx(osabi, mach, nsym->st_shndx,
2489 			    CONV_FMT_DECIMAL, &inv_buf));
2490 			continue;
2491 		}
2492 
2493 		/*
2494 		 * Test for the GNU hidden bit, and ignore symbols that
2495 		 * have it set.
2496 		 */
2497 		if (test_gnu_hidden_bit &&
2498 		    ((ifl->ifl_versym[ndx] & 0x8000) != 0))
2499 			continue;
2500 
2501 		/*
2502 		 * The linker itself will generate symbols for _end, _etext,
2503 		 * _edata, _DYNAMIC and _PROCEDURE_LINKAGE_TABLE_, so don't
2504 		 * bother entering these symbols from shared objects.  This
2505 		 * results in some wasted resolution processing, which is hard
2506 		 * to feel, but if nothing else, pollutes diagnostic relocation
2507 		 * output.
2508 		 */
2509 		if (name[0] && (etype == ET_DYN) && (nsym->st_size == 0) &&
2510 		    (ELF_ST_TYPE(nsym->st_info) == STT_OBJECT) &&
2511 		    (name[0] == '_') && ((name[1] == 'e') ||
2512 		    (name[1] == 'D') || (name[1] == 'P')) &&
2513 		    ((strcmp(name, MSG_ORIG(MSG_SYM_ETEXT_U)) == 0) ||
2514 		    (strcmp(name, MSG_ORIG(MSG_SYM_EDATA_U)) == 0) ||
2515 		    (strcmp(name, MSG_ORIG(MSG_SYM_END_U)) == 0) ||
2516 		    (strcmp(name, MSG_ORIG(MSG_SYM_DYNAMIC_U)) == 0) ||
2517 		    (strcmp(name, MSG_ORIG(MSG_SYM_PLKTBL_U)) == 0))) {
2518 			ifl->ifl_oldndx[ndx] = 0;
2519 			continue;
2520 		}
2521 
2522 		/*
2523 		 * The '-z wrap=XXX' option emulates the GNU ld --wrap=XXX
2524 		 * option. When XXX is the symbol to be wrapped:
2525 		 *
2526 		 *  -	An undefined reference to XXX is converted to __wrap_XXX
2527 		 *  -	An undefined reference to __real_XXX is converted to XXX
2528 		 *
2529 		 * The idea is that the user can supply a wrapper function
2530 		 * __wrap_XXX that does some work, and then uses the name
2531 		 * __real_XXX to pass the call on to the real function. The
2532 		 * wrapper objects are linked with the original unmodified
2533 		 * objects to produce a wrapped version of the output object.
2534 		 */
2535 		if (ofl->ofl_wrap && name[0] && (shndx == SHN_UNDEF)) {
2536 			WrapSymNode wsn, *wsnp;
2537 
2538 			/*
2539 			 * If this is the __real_XXX form, advance the
2540 			 * pointer to reference the wrapped name.
2541 			 */
2542 			wsn.wsn_name = name;
2543 			if ((*name == '_') &&
2544 			    (strncmp(name, MSG_ORIG(MSG_STR_UU_REAL_U),
2545 			    MSG_STR_UU_REAL_U_SIZE) == 0))
2546 				wsn.wsn_name += MSG_STR_UU_REAL_U_SIZE;
2547 
2548 			/*
2549 			 * Is this symbol in the wrap AVL tree? If so, map
2550 			 * XXX to __wrap_XXX, and __real_XXX to XXX. Note that
2551 			 * wsn.wsn_name will equal the current value of name
2552 			 * if the __real_ prefix is not present.
2553 			 */
2554 			if ((wsnp = avl_find(ofl->ofl_wrap, &wsn, 0)) != NULL) {
2555 				const char *old_name = name;
2556 
2557 				name = (wsn.wsn_name == name) ?
2558 				    wsnp->wsn_wrapname : wsn.wsn_name;
2559 				DBG_CALL(Dbg_syms_wrap(ofl->ofl_lml, ndx,
2560 				    old_name, name));
2561 			}
2562 		}
2563 
2564 		/*
2565 		 * Determine and validate the symbols binding.
2566 		 */
2567 		bind = ELF_ST_BIND(nsym->st_info);
2568 		if ((bind != STB_GLOBAL) && (bind != STB_WEAK)) {
2569 			ld_eprintf(ofl, ERR_WARNING, MSG_INTL(MSG_SYM_NONGLOB),
2570 			    demangle_symname(name, symsecname, ndx),
2571 			    ifl->ifl_name,
2572 			    conv_sym_info_bind(bind, 0, &inv_buf));
2573 			continue;
2574 		}
2575 		if (bind == STB_WEAK)
2576 			weak++;
2577 
2578 		/*
2579 		 * If this symbol falls within the range of a section being
2580 		 * discarded, then discard the symbol itself.
2581 		 */
2582 		if (((sdflags & FLG_SY_SPECSEC) == 0) &&
2583 		    (nsym->st_shndx != SHN_UNDEF)) {
2584 			Is_desc	*isp;
2585 
2586 			if (shndx >= ifl->ifl_shnum) {
2587 				/*
2588 				 * Carry our some basic sanity checks
2589 				 * The symbol will not be carried forward to
2590 				 * the output file, which won't be a problem
2591 				 * unless a relocation is required against it.
2592 				 */
2593 				ld_eprintf(ofl, ERR_WARNING,
2594 				    MSG_INTL(MSG_SYM_INVSHNDX),
2595 				    demangle_symname(name, symsecname, ndx),
2596 				    ifl->ifl_name,
2597 				    conv_sym_shndx(osabi, mach, nsym->st_shndx,
2598 				    CONV_FMT_DECIMAL, &inv_buf));
2599 				continue;
2600 			}
2601 
2602 			isp = ifl->ifl_isdesc[shndx];
2603 			if (isp && (isp->is_flags & FLG_IS_DISCARD)) {
2604 				if ((sdp =
2605 				    libld_calloc(sizeof (Sym_desc), 1)) == NULL)
2606 					return (S_ERROR);
2607 
2608 				/*
2609 				 * Create a dummy symbol entry so that if we
2610 				 * find any references to this discarded symbol
2611 				 * we can compensate.
2612 				 */
2613 				sdp->sd_name = name;
2614 				sdp->sd_sym = nsym;
2615 				sdp->sd_file = ifl;
2616 				sdp->sd_isc = isp;
2617 				sdp->sd_flags = FLG_SY_ISDISC;
2618 				ifl->ifl_oldndx[ndx] = sdp;
2619 
2620 				DBG_CALL(Dbg_syms_discarded(ofl->ofl_lml, sdp));
2621 				continue;
2622 			}
2623 		}
2624 
2625 		/*
2626 		 * If object capabilities for this file are being converted
2627 		 * into symbol capabilities, then:
2628 		 *
2629 		 *  -	Any global function, or initialized global data symbol
2630 		 *	definitions (ie., those that are not associated with
2631 		 *	special symbol types, ie., ABS, COMMON, etc.), and which
2632 		 *	have not been reduced to locals, are converted to symbol
2633 		 *	references (UNDEF).  This ensures that any reference to
2634 		 *	the original symbol, for example from a relocation, get
2635 		 *	associated to a capabilities family lead symbol, ie., a
2636 		 *	generic instance.
2637 		 *
2638 		 *  -	For each global function, or object symbol definition,
2639 		 *	a new local symbol is created.  The function or object
2640 		 *	is renamed using the capabilities CA_SUNW_ID definition
2641 		 *	(which might have been fabricated for this purpose -
2642 		 *	see get_cap_group()).  The new symbol name is:
2643 		 *
2644 		 *	    <original name>%<capability group identifier>
2645 		 *
2646 		 *	This symbol is associated to the same location, and
2647 		 *	becomes a capabilities family member.
2648 		 */
2649 		/* LINTED */
2650 		hash = (Word)elf_hash(name);
2651 
2652 		ntype = ELF_ST_TYPE(nsym->st_info);
2653 		if (cdp && (nsym->st_shndx != SHN_UNDEF) &&
2654 		    ((sdflags & FLG_SY_SPECSEC) == 0) &&
2655 		    ((ntype == STT_FUNC) || (ntype == STT_OBJECT))) {
2656 			/*
2657 			 * Determine this symbol's visibility.  If a mapfile has
2658 			 * indicated this symbol should be local, then there's
2659 			 * no point in transforming this global symbol to a
2660 			 * capabilities symbol.  Otherwise, create a symbol
2661 			 * capability pair descriptor to record this symbol as
2662 			 * a candidate for translation.
2663 			 */
2664 			if (sym_cap_vis(name, hash, sym, ofl) &&
2665 			    ((cpp = alist_append(&cappairs, NULL,
2666 			    sizeof (Cap_pair), AL_CNT_CAP_PAIRS)) == NULL))
2667 				return (S_ERROR);
2668 		}
2669 
2670 		if (cpp) {
2671 			Sym	*rsym;
2672 
2673 			DBG_CALL(Dbg_syms_cap_convert(ofl, ndx, name, nsym));
2674 
2675 			/*
2676 			 * Allocate a new symbol descriptor to represent the
2677 			 * transformed global symbol.  The descriptor points
2678 			 * to the original symbol information (which might
2679 			 * indicate a global or weak visibility).  The symbol
2680 			 * information will be transformed into a local symbol
2681 			 * later, after any weak aliases are culled.
2682 			 */
2683 			if ((cpp->c_osdp =
2684 			    libld_malloc(sizeof (Sym_desc))) == NULL)
2685 				return (S_ERROR);
2686 
2687 			cpp->c_osdp->sd_name = name;
2688 			cpp->c_osdp->sd_sym = nsym;
2689 			cpp->c_osdp->sd_shndx = shndx;
2690 			cpp->c_osdp->sd_file = ifl;
2691 			cpp->c_osdp->sd_isc = ifl->ifl_isdesc[shndx];
2692 			cpp->c_osdp->sd_ref = REF_REL_NEED;
2693 
2694 			/*
2695 			 * Save the capabilities group this symbol belongs to,
2696 			 * and the original symbol index.
2697 			 */
2698 			cpp->c_group = cdp->ca_groups->apl_data[0];
2699 			cpp->c_ndx = ndx;
2700 
2701 			/*
2702 			 * Replace the original symbol definition with a symbol
2703 			 * reference.  Make sure this reference isn't left as a
2704 			 * weak.
2705 			 */
2706 			if ((rsym = libld_malloc(sizeof (Sym))) == NULL)
2707 				return (S_ERROR);
2708 
2709 			*rsym = *nsym;
2710 
2711 			rsym->st_info = ELF_ST_INFO(STB_GLOBAL, ntype);
2712 			rsym->st_shndx = shndx = SHN_UNDEF;
2713 			rsym->st_value = 0;
2714 			rsym->st_size = 0;
2715 
2716 			sdflags |= FLG_SY_CAP;
2717 
2718 			nsym = rsym;
2719 		}
2720 
2721 		/*
2722 		 * If the symbol does not already exist in the internal symbol
2723 		 * table add it, otherwise resolve the conflict.  If the symbol
2724 		 * from this file is kept, retain its symbol table index for
2725 		 * possible use in associating a global alias.
2726 		 */
2727 		if ((sdp = ld_sym_find(name, hash, &where, ofl)) == NULL) {
2728 			DBG_CALL(Dbg_syms_global(ofl->ofl_lml, ndx, name));
2729 			if ((sdp = ld_sym_enter(name, nsym, hash, ifl, ofl, ndx,
2730 			    shndx, sdflags, &where)) == (Sym_desc *)S_ERROR)
2731 				return (S_ERROR);
2732 
2733 		} else if (ld_sym_resolve(sdp, nsym, ifl, ofl, ndx, shndx,
2734 		    sdflags) == S_ERROR)
2735 			return (S_ERROR);
2736 
2737 		/*
2738 		 * Now that we have a symbol descriptor, retain the descriptor
2739 		 * for later use by symbol capabilities processing.
2740 		 */
2741 		if (cpp)
2742 			cpp->c_nsdp = sdp;
2743 
2744 		/*
2745 		 * After we've compared a defined symbol in one shared
2746 		 * object, flag the symbol so we don't compare it again.
2747 		 */
2748 		if ((etype == ET_DYN) && (nsym->st_shndx != SHN_UNDEF) &&
2749 		    ((sdp->sd_flags & FLG_SY_SOFOUND) == 0))
2750 			sdp->sd_flags |= FLG_SY_SOFOUND;
2751 
2752 		/*
2753 		 * If the symbol is accepted from this file retain the symbol
2754 		 * index for possible use in aliasing.
2755 		 */
2756 		if (sdp->sd_file == ifl)
2757 			sdp->sd_symndx = ndx;
2758 
2759 		ifl->ifl_oldndx[ndx] = sdp;
2760 
2761 		/*
2762 		 * If we've accepted a register symbol, continue to validate
2763 		 * it.
2764 		 */
2765 		if (sdp->sd_flags & FLG_SY_REGSYM) {
2766 			Sym_desc	*rsdp;
2767 
2768 			/*
2769 			 * The presence of FLG_SY_REGSYM means that
2770 			 * the pointers in ld_targ.t_ms are non-NULL.
2771 			 */
2772 			rsdp = (*ld_targ.t_ms.ms_reg_find)(sdp->sd_sym, ofl);
2773 			if (rsdp == NULL) {
2774 				if ((*ld_targ.t_ms.ms_reg_enter)(sdp, ofl) == 0)
2775 					return (S_ERROR);
2776 			} else if (rsdp != sdp) {
2777 				(void) (*ld_targ.t_ms.ms_reg_check)(rsdp,
2778 				    sdp->sd_sym, sdp->sd_name, ifl, ofl);
2779 			}
2780 		}
2781 
2782 		/*
2783 		 * For a relocatable object, if this symbol is defined
2784 		 * and has non-zero length and references an address
2785 		 * within an associated section, then check its extents
2786 		 * to make sure the section boundaries encompass it.
2787 		 * If they don't, the ELF file is corrupt. Note that this
2788 		 * global symbol may have come from another file to satisfy
2789 		 * an UNDEF symbol of the same name from this one. In that
2790 		 * case, we don't check it, because it was already checked
2791 		 * as part of its own file.
2792 		 */
2793 		if (etype_rel && (sdp->sd_file == ifl)) {
2794 			Sym *tsym = sdp->sd_sym;
2795 
2796 			if (SYM_LOC_BADADDR(sdp, tsym,
2797 			    ELF_ST_TYPE(tsym->st_info))) {
2798 				issue_badaddr_msg(ifl, ofl, sdp,
2799 				    tsym, tsym->st_shndx);
2800 				continue;
2801 			}
2802 		}
2803 	}
2804 	DBG_CALL(Dbg_util_nl(ofl->ofl_lml, DBG_NL_STD));
2805 
2806 	/*
2807 	 * Associate weak (alias) symbols to their non-weak counterparts by
2808 	 * scanning the global symbols one more time.
2809 	 *
2810 	 * This association is needed when processing the symbols from a shared
2811 	 * object dependency when a a weak definition satisfies a reference:
2812 	 *
2813 	 *  -	When building a dynamic executable, if a referenced symbol is a
2814 	 *	data item, the symbol data is copied to the executables address
2815 	 *	space.  In this copy-relocation case, we must also reassociate
2816 	 *	the alias symbol with its new location in the executable.
2817 	 *
2818 	 *  -	If the referenced symbol is a function then we may need to
2819 	 *	promote the symbols binding from undefined weak to undefined,
2820 	 *	otherwise the run-time linker will not generate the correct
2821 	 *	relocation error should the symbol not be found.
2822 	 *
2823 	 * Weak alias association is also required when a local dynsym table
2824 	 * is being created.  This table should only contain one instance of a
2825 	 * symbol that is associated to a given address.
2826 	 *
2827 	 * The true association between a weak/strong symbol pair is that both
2828 	 * symbol entries are identical, thus first we create a sorted symbol
2829 	 * list keyed off of the symbols section index and value.  If the symbol
2830 	 * belongs to the same section and has the same value, then the chances
2831 	 * are that the rest of the symbols data is the same.  This list is then
2832 	 * scanned for weak symbols, and if one is found then any strong
2833 	 * association will exist in the entries that follow.  Thus we just have
2834 	 * to scan one (typically a single alias) or more (in the uncommon
2835 	 * instance of multiple weak to strong associations) entries to
2836 	 * determine if a match exists.
2837 	 */
2838 	if (weak && (OFL_ALLOW_LDYNSYM(ofl) || (etype == ET_DYN)) &&
2839 	    (total > local)) {
2840 		static Sym_desc	**sort;
2841 		static size_t	osize = 0;
2842 		size_t		nsize = (total - local) * sizeof (Sym_desc *);
2843 
2844 		/*
2845 		 * As we might be processing many input files, and many symbols,
2846 		 * try and reuse a static sort buffer.  Note, presently we're
2847 		 * playing the game of never freeing any buffers as there's a
2848 		 * belief this wastes time.
2849 		 */
2850 		if ((osize == 0) || (nsize > osize)) {
2851 			if ((sort = libld_malloc(nsize)) == NULL)
2852 				return (S_ERROR);
2853 			osize = nsize;
2854 		}
2855 		(void) memcpy((void *)sort, &ifl->ifl_oldndx[local], nsize);
2856 
2857 		qsort(sort, (total - local), sizeof (Sym_desc *), compare);
2858 
2859 		for (ndx = 0; ndx < (total - local); ndx++) {
2860 			Sym_desc	*wsdp = sort[ndx];
2861 			Sym		*wsym;
2862 			int		sndx;
2863 
2864 			/*
2865 			 * Ignore any empty symbol descriptor, or the case where
2866 			 * the symbol has been resolved to a different file.
2867 			 */
2868 			if ((wsdp == NULL) || (wsdp->sd_file != ifl))
2869 				continue;
2870 
2871 			wsym = wsdp->sd_sym;
2872 
2873 			if ((wsym->st_shndx == SHN_UNDEF) ||
2874 			    (wsdp->sd_flags & FLG_SY_SPECSEC) ||
2875 			    (ELF_ST_BIND(wsym->st_info) != STB_WEAK))
2876 				continue;
2877 
2878 			/*
2879 			 * We have a weak symbol, if it has a strong alias it
2880 			 * will have been sorted to one of the following sort
2881 			 * table entries.  Note that we could have multiple weak
2882 			 * symbols aliased to one strong (if this occurs then
2883 			 * the strong symbol only maintains one alias back to
2884 			 * the last weak).
2885 			 */
2886 			for (sndx = ndx + 1; sndx < (total - local); sndx++) {
2887 				Sym_desc	*ssdp = sort[sndx];
2888 				Sym		*ssym;
2889 				sd_flag_t	w_dynbits, s_dynbits;
2890 
2891 				/*
2892 				 * Ignore any empty symbol descriptor, or the
2893 				 * case where the symbol has been resolved to a
2894 				 * different file.
2895 				 */
2896 				if ((ssdp == NULL) || (ssdp->sd_file != ifl))
2897 					continue;
2898 
2899 				ssym = ssdp->sd_sym;
2900 
2901 				if (ssym->st_shndx == SHN_UNDEF)
2902 					continue;
2903 
2904 				if ((ssym->st_shndx != wsym->st_shndx) ||
2905 				    (ssym->st_value != wsym->st_value))
2906 					break;
2907 
2908 				if ((ssym->st_size != wsym->st_size) ||
2909 				    (ssdp->sd_flags & FLG_SY_SPECSEC) ||
2910 				    (ELF_ST_BIND(ssym->st_info) == STB_WEAK))
2911 					continue;
2912 
2913 				/*
2914 				 * If a sharable object, set link fields so
2915 				 * that they reference each other.`
2916 				 */
2917 				if (etype == ET_DYN) {
2918 					ssdp->sd_aux->sa_linkndx =
2919 					    (Word)wsdp->sd_symndx;
2920 					wsdp->sd_aux->sa_linkndx =
2921 					    (Word)ssdp->sd_symndx;
2922 				}
2923 
2924 				/*
2925 				 * Determine which of these two symbols go into
2926 				 * the sort section.  If a mapfile has made
2927 				 * explicit settings of the FLG_SY_*DYNSORT
2928 				 * flags for both symbols, then we do what they
2929 				 * say.  If one has the DYNSORT flags set, we
2930 				 * set the NODYNSORT bit in the other.  And if
2931 				 * neither has an explicit setting, then we
2932 				 * favor the weak symbol because they usually
2933 				 * lack the leading underscore.
2934 				 */
2935 				w_dynbits = wsdp->sd_flags &
2936 				    (FLG_SY_DYNSORT | FLG_SY_NODYNSORT);
2937 				s_dynbits = ssdp->sd_flags &
2938 				    (FLG_SY_DYNSORT | FLG_SY_NODYNSORT);
2939 				if (!(w_dynbits && s_dynbits)) {
2940 					if (s_dynbits) {
2941 						if (s_dynbits == FLG_SY_DYNSORT)
2942 							wsdp->sd_flags |=
2943 							    FLG_SY_NODYNSORT;
2944 					} else if (w_dynbits !=
2945 					    FLG_SY_NODYNSORT) {
2946 						ssdp->sd_flags |=
2947 						    FLG_SY_NODYNSORT;
2948 					}
2949 				}
2950 				break;
2951 			}
2952 		}
2953 	}
2954 
2955 	/*
2956 	 * Having processed all symbols, under -z symbolcap, reprocess any
2957 	 * symbols that are being translated from global to locals.  The symbol
2958 	 * pair that has been collected defines the original symbol (c_osdp),
2959 	 * which will become a local, and the new symbol (c_nsdp), which will
2960 	 * become a reference (UNDEF) for the original.
2961 	 *
2962 	 * Scan these symbol pairs looking for weak symbols, which have non-weak
2963 	 * aliases.  There is no need to translate both of these symbols to
2964 	 * locals, only the global is necessary.
2965 	 */
2966 	if (cappairs) {
2967 		Aliste		idx1;
2968 		Cap_pair	*cpp1;
2969 
2970 		for (ALIST_TRAVERSE(cappairs, idx1, cpp1)) {
2971 			Sym_desc	*sdp1 = cpp1->c_osdp;
2972 			Sym		*sym1 = sdp1->sd_sym;
2973 			uchar_t		bind1 = ELF_ST_BIND(sym1->st_info);
2974 			Aliste		idx2;
2975 			Cap_pair	*cpp2;
2976 
2977 			/*
2978 			 * If this symbol isn't weak, it's capability member is
2979 			 * retained for the creation of a local symbol.
2980 			 */
2981 			if (bind1 != STB_WEAK)
2982 				continue;
2983 
2984 			/*
2985 			 * If this is a weak symbol, traverse the capabilities
2986 			 * list again to determine if a corresponding non-weak
2987 			 * symbol exists.
2988 			 */
2989 			for (ALIST_TRAVERSE(cappairs, idx2, cpp2)) {
2990 				Sym_desc	*sdp2 = cpp2->c_osdp;
2991 				Sym		*sym2 = sdp2->sd_sym;
2992 				uchar_t		bind2 =
2993 				    ELF_ST_BIND(sym2->st_info);
2994 
2995 				if ((cpp1 == cpp2) ||
2996 				    (cpp1->c_group != cpp2->c_group) ||
2997 				    (sym1->st_value != sym2->st_value) ||
2998 				    (bind2 == STB_WEAK))
2999 					continue;
3000 
3001 				/*
3002 				 * The weak symbol (sym1) has a non-weak (sym2)
3003 				 * counterpart.  There's no point in translating
3004 				 * both of these equivalent symbols to locals.
3005 				 * Add this symbol capability alias to the
3006 				 * capabilities family information, and remove
3007 				 * the weak symbol.
3008 				 */
3009 				if (ld_cap_add_family(ofl, cpp2->c_nsdp,
3010 				    cpp1->c_nsdp, NULL, NULL) == S_ERROR)
3011 					return (S_ERROR);
3012 
3013 				free((void *)cpp1->c_osdp);
3014 				(void) alist_delete(cappairs, &idx1);
3015 			}
3016 		}
3017 
3018 		DBG_CALL(Dbg_util_nl(ofl->ofl_lml, DBG_NL_STD));
3019 
3020 		/*
3021 		 * The capability pairs information now represents all the
3022 		 * global symbols that need transforming to locals.  These
3023 		 * local symbols are renamed using their group identifiers.
3024 		 */
3025 		for (ALIST_TRAVERSE(cappairs, idx1, cpp1)) {
3026 			Sym_desc	*osdp = cpp1->c_osdp;
3027 			Objcapset	*capset;
3028 			size_t		nsize, tsize;
3029 			const char	*oname;
3030 			char		*cname, *idstr;
3031 			Sym		*csym;
3032 
3033 			/*
3034 			 * If the local symbol has not yet been translated
3035 			 * convert it to a local symbol with a name.
3036 			 */
3037 			if ((osdp->sd_flags & FLG_SY_CAP) != 0)
3038 				continue;
3039 
3040 			/*
3041 			 * As we're converting object capabilities to symbol
3042 			 * capabilities, obtain the capabilities set for this
3043 			 * object, so as to retrieve the CA_SUNW_ID value.
3044 			 */
3045 			capset = &cpp1->c_group->cg_set;
3046 
3047 			/*
3048 			 * Create a new name from the existing symbol and the
3049 			 * capabilities group identifier.  Note, the delimiter
3050 			 * between the symbol name and identifier name is hard-
3051 			 * coded here (%), so that we establish a convention
3052 			 * for transformed symbol names.
3053 			 */
3054 			oname = osdp->sd_name;
3055 
3056 			idstr = capset->oc_id.cs_str;
3057 			nsize = strlen(oname);
3058 			tsize = nsize + 1 + strlen(idstr) + 1;
3059 			if ((cname = libld_malloc(tsize)) == 0)
3060 				return (S_ERROR);
3061 
3062 			(void) strcpy(cname, oname);
3063 			cname[nsize++] = '%';
3064 			(void) strcpy(&cname[nsize], idstr);
3065 
3066 			/*
3067 			 * Allocate a new symbol table entry, transform this
3068 			 * symbol to a local, and assign the new name.
3069 			 */
3070 			if ((csym = libld_malloc(sizeof (Sym))) == NULL)
3071 				return (S_ERROR);
3072 
3073 			*csym = *osdp->sd_sym;
3074 			csym->st_info = ELF_ST_INFO(STB_LOCAL,
3075 			    ELF_ST_TYPE(osdp->sd_sym->st_info));
3076 
3077 			osdp->sd_name = cname;
3078 			osdp->sd_sym = csym;
3079 			osdp->sd_flags = FLG_SY_CAP;
3080 
3081 			/*
3082 			 * Keep track of this new local symbol.  As -z symbolcap
3083 			 * can only be used to create a relocatable object, a
3084 			 * dynamic symbol table can't exist.  Ensure there is
3085 			 * space reserved in the string table.
3086 			 */
3087 			ofl->ofl_caploclcnt++;
3088 			if (st_insert(ofl->ofl_strtab, cname) == -1)
3089 				return (S_ERROR);
3090 
3091 			DBG_CALL(Dbg_syms_cap_local(ofl, cpp1->c_ndx,
3092 			    cname, csym, osdp));
3093 
3094 			/*
3095 			 * Establish this capability pair as a family.
3096 			 */
3097 			if (ld_cap_add_family(ofl, cpp1->c_nsdp, osdp,
3098 			    cpp1->c_group, &ifl->ifl_caps->ca_syms) == S_ERROR)
3099 				return (S_ERROR);
3100 		}
3101 	}
3102 
3103 	return (1);
3104 
3105 #undef SYM_LOC_BADADDR
3106 }
3107 
3108 /*
3109  * Add an undefined symbol to the symbol table.  The reference originates from
3110  * the location identified by the message id (mid).  These references can
3111  * originate from command line options such as -e, -u, -initarray, etc.
3112  * (identified with MSG_INTL(MSG_STR_COMMAND)), or from internally generated
3113  * TLS relocation references (identified with MSG_INTL(MSG_STR_TLSREL)).
3114  */
3115 Sym_desc *
3116 ld_sym_add_u(const char *name, Ofl_desc *ofl, Msg mid)
3117 {
3118 	Sym		*sym;
3119 	Ifl_desc	*ifl = NULL, *_ifl;
3120 	Sym_desc	*sdp;
3121 	Word		hash;
3122 	Aliste		idx;
3123 	avl_index_t	where;
3124 	const char	*reference = MSG_INTL(mid);
3125 
3126 	/*
3127 	 * As an optimization, determine whether we've already generated this
3128 	 * reference.  If the symbol doesn't already exist we'll create it.
3129 	 * Or if the symbol does exist from a different source, we'll resolve
3130 	 * the conflict.
3131 	 */
3132 	/* LINTED */
3133 	hash = (Word)elf_hash(name);
3134 	if ((sdp = ld_sym_find(name, hash, &where, ofl)) != NULL) {
3135 		if ((sdp->sd_sym->st_shndx == SHN_UNDEF) &&
3136 		    (sdp->sd_file->ifl_name == reference))
3137 			return (sdp);
3138 	}
3139 
3140 	/*
3141 	 * Determine whether a pseudo input file descriptor exists to represent
3142 	 * the command line, as any global symbol needs an input file descriptor
3143 	 * during any symbol resolution (refer to map_ifl() which provides a
3144 	 * similar method for adding symbols from mapfiles).
3145 	 */
3146 	for (APLIST_TRAVERSE(ofl->ofl_objs, idx, _ifl))
3147 		if (strcmp(_ifl->ifl_name, reference) == 0) {
3148 			ifl = _ifl;
3149 			break;
3150 		}
3151 
3152 	/*
3153 	 * If no descriptor exists create one.
3154 	 */
3155 	if (ifl == NULL) {
3156 		if ((ifl = libld_calloc(sizeof (Ifl_desc), 1)) == NULL)
3157 			return ((Sym_desc *)S_ERROR);
3158 		ifl->ifl_name = reference;
3159 		ifl->ifl_flags = FLG_IF_NEEDED | FLG_IF_FILEREF;
3160 		if ((ifl->ifl_ehdr = libld_calloc(sizeof (Ehdr), 1)) == NULL)
3161 			return ((Sym_desc *)S_ERROR);
3162 		ifl->ifl_ehdr->e_type = ET_REL;
3163 
3164 		if (aplist_append(&ofl->ofl_objs, ifl, AL_CNT_OFL_OBJS) == NULL)
3165 			return ((Sym_desc *)S_ERROR);
3166 	}
3167 
3168 	/*
3169 	 * Allocate a symbol structure and add it to the global symbol table.
3170 	 */
3171 	if ((sym = libld_calloc(sizeof (Sym), 1)) == NULL)
3172 		return ((Sym_desc *)S_ERROR);
3173 	sym->st_info = ELF_ST_INFO(STB_GLOBAL, STT_NOTYPE);
3174 	sym->st_shndx = SHN_UNDEF;
3175 
3176 	DBG_CALL(Dbg_syms_process(ofl->ofl_lml, ifl));
3177 	if (sdp == NULL) {
3178 		DBG_CALL(Dbg_syms_global(ofl->ofl_lml, 0, name));
3179 		if ((sdp = ld_sym_enter(name, sym, hash, ifl, ofl, 0, SHN_UNDEF,
3180 		    0, &where)) == (Sym_desc *)S_ERROR)
3181 			return ((Sym_desc *)S_ERROR);
3182 	} else if (ld_sym_resolve(sdp, sym, ifl, ofl, 0,
3183 	    SHN_UNDEF, 0) == S_ERROR)
3184 		return ((Sym_desc *)S_ERROR);
3185 
3186 	sdp->sd_flags &= ~FLG_SY_CLEAN;
3187 	sdp->sd_flags |= FLG_SY_CMDREF;
3188 
3189 	return (sdp);
3190 }
3191 
3192 /*
3193  * STT_SECTION symbols have their st_name field set to NULL, and consequently
3194  * have no name. Generate a name suitable for diagnostic use for such a symbol
3195  * and store it in the input section descriptor. The resulting name will be
3196  * of the form:
3197  *
3198  *	"XXX (section)"
3199  *
3200  * where XXX is the name of the section.
3201  *
3202  * entry:
3203  *	isc - Input section associated with the symbol.
3204  *	fmt - NULL, or format string to use.
3205  *
3206  * exit:
3207  *	Sets isp->is_sym_name to the allocated string. Returns the
3208  *	string pointer, or NULL on allocation failure.
3209  */
3210 const char *
3211 ld_stt_section_sym_name(Is_desc *isp)
3212 {
3213 	const char	*fmt;
3214 	char		*str;
3215 	size_t		len;
3216 
3217 	if ((isp == NULL) || (isp->is_name == NULL))
3218 		return (NULL);
3219 
3220 	if (isp->is_sym_name == NULL) {
3221 		fmt = (isp->is_flags & FLG_IS_GNSTRMRG) ?
3222 		    MSG_INTL(MSG_STR_SECTION_MSTR) : MSG_INTL(MSG_STR_SECTION);
3223 
3224 		len = strlen(fmt) + strlen(isp->is_name) + 1;
3225 
3226 		if ((str = libld_malloc(len)) == NULL)
3227 			return (NULL);
3228 		(void) snprintf(str, len, fmt, isp->is_name);
3229 		isp->is_sym_name = str;
3230 	}
3231 
3232 	return (isp->is_sym_name);
3233 }
3234 
3235 /*
3236  * If we're producing a relocatable object and the symbol is eligible for
3237  * COMDAT section, it shouldn't be reduced in scope as that will break the
3238  * COMDAT matching when the output object is later consumed.  Leave it alone,
3239  * and any reduction (and COMDAT) processing will occur then.
3240  *
3241  * Otherwise, any hidden symbol is reduced when reductions are being processed.
3242  */
3243 Boolean
3244 ld_sym_reducable(Ofl_desc *ofl, Sym_desc *sdp)
3245 {
3246 	Is_desc *isc = sdp->sd_isc;
3247 
3248 	if (((ofl->ofl_flags & FLG_OF_RELOBJ) != 0) &&
3249 	    (isc != NULL) &&
3250 	    ((isc->is_flags & FLG_IS_COMDAT) != 0)) {
3251 		return (FALSE);
3252 	} else {
3253 		return (SYM_IS_HIDDEN(sdp) &&
3254 		    (ofl->ofl_flags & FLG_OF_PROCRED));
3255 	}
3256 }
3257