1 /*
2 * CDDL HEADER START
3 *
4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
7 *
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
12 *
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
18 *
19 * CDDL HEADER END
20 */
21
22 /*
23 * Copyright (c) 1988 AT&T
24 * All Rights Reserved
25 *
26 *
27 * Copyright (c) 1989, 2010, Oracle and/or its affiliates. All rights reserved.
28 */
29
30 /*
31 * Symbol table management routines
32 */
33
34 #define ELF_TARGET_AMD64
35
36 #include <stdio.h>
37 #include <string.h>
38 #include <debug.h>
39 #include "msg.h"
40 #include "_libld.h"
41
42 /*
43 * AVL tree comparator function:
44 *
45 * The primary key is the symbol name hash with a secondary key of the symbol
46 * name itself.
47 */
48 int
49 ld_sym_avl_comp(const void *elem1, const void *elem2)
50 {
51 Sym_avlnode *sav1 = (Sym_avlnode *)elem1;
52 Sym_avlnode *sav2 = (Sym_avlnode *)elem2;
53 int res;
54
55 res = sav1->sav_hash - sav2->sav_hash;
56
57 if (res < 0)
58 return (-1);
59 if (res > 0)
60 return (1);
61
62 /*
63 * Hash is equal - now compare name
64 */
65 res = strcmp(sav1->sav_name, sav2->sav_name);
66 if (res == 0)
67 return (0);
68 if (res > 0)
69 return (1);
70 return (-1);
71 }
72
73 /*
74 * Focal point for verifying symbol names.
75 */
76 inline static const char *
77 string(Ofl_desc *ofl, Ifl_desc *ifl, Sym *sym, const char *strs, size_t strsize,
78 int symndx, Word shndx, Word symsecndx, const char *symsecname,
79 const char *strsecname, sd_flag_t *flags)
80 {
81 Word name = sym->st_name;
82
83 if (name) {
84 if ((ifl->ifl_flags & FLG_IF_HSTRTAB) == 0) {
85 ld_eprintf(ofl, ERR_FATAL, MSG_INTL(MSG_FIL_NOSTRTABLE),
86 ifl->ifl_name, EC_WORD(symsecndx), symsecname,
87 symndx, EC_XWORD(name));
88 return (NULL);
89 }
90 if (name >= (Word)strsize) {
91 ld_eprintf(ofl, ERR_FATAL,
92 MSG_INTL(MSG_FIL_EXCSTRTABLE), ifl->ifl_name,
93 EC_WORD(symsecndx), symsecname, symndx,
94 EC_XWORD(name), strsecname, EC_XWORD(strsize));
95 return (NULL);
96 }
97 }
98
99 /*
100 * Determine if we're dealing with a register and if so validate it.
101 * If it's a scratch register, a fabricated name will be returned.
102 */
103 if (ld_targ.t_ms.ms_is_regsym != NULL) {
104 const char *regname = (*ld_targ.t_ms.ms_is_regsym)(ofl, ifl,
105 sym, strs, symndx, shndx, symsecname, flags);
106
107 if (regname == (const char *)S_ERROR) {
108 return (NULL);
109 }
110 if (regname)
111 return (regname);
112 }
113
114 /*
115 * If this isn't a register, but we have a global symbol with a null
116 * name, we're not going to be able to hash this, search for it, or
117 * do anything interesting. However, we've been accepting a symbol of
118 * this kind for ages now, so give the user a warning (rather than a
119 * fatal error), just in case this instance exists somewhere in the
120 * world and hasn't, as yet, been a problem.
121 */
122 if ((name == 0) && (ELF_ST_BIND(sym->st_info) != STB_LOCAL)) {
123 ld_eprintf(ofl, ERR_WARNING, MSG_INTL(MSG_FIL_NONAMESYM),
124 ifl->ifl_name, EC_WORD(symsecndx), symsecname, symndx,
125 EC_XWORD(name));
126 }
127 return (strs + name);
128 }
129
130 /*
131 * For producing symbol names strings to use in error messages.
132 * If the symbol has a non-null name, then the string returned by
133 * this function is the output from demangle(), surrounded by
134 * single quotes. For null names, a descriptive string giving
135 * the symbol section and index is generated.
136 *
137 * This function uses an internal static buffer to hold the resulting
138 * string. The value returned is usable by the caller until the next
139 * call, at which point it is overwritten.
140 */
141 static const char *
142 demangle_symname(const char *name, const char *symtab_name, Word symndx)
143 {
144 #define INIT_BUFSIZE 256
145
146 static char *buf;
147 static size_t bufsize = 0;
148 size_t len;
149 int use_name;
150
151 use_name = (name != NULL) && (*name != '\0');
152
153 if (use_name) {
154 name = demangle(name);
155 len = strlen(name) + 2; /* Include room for quotes */
156 } else {
157 name = MSG_ORIG(MSG_STR_EMPTY);
158 len = strlen(symtab_name) + 2 + CONV_INV_BUFSIZE;
159 }
160 len++; /* Null termination */
161
162 /* If our buffer is too small, double it until it is big enough */
163 if (len > bufsize) {
164 size_t new_bufsize = bufsize;
165 char *new_buf;
166
167 if (new_bufsize == 0)
168 new_bufsize = INIT_BUFSIZE;
169 while (len > new_bufsize)
170 new_bufsize *= 2;
171 if ((new_buf = libld_malloc(new_bufsize)) == NULL)
172 return (name);
173 buf = new_buf;
174 bufsize = new_bufsize;
175 }
176
177 if (use_name) {
178 (void) snprintf(buf, bufsize, MSG_ORIG(MSG_FMT_SYMNAM), name);
179 } else {
180 (void) snprintf(buf, bufsize, MSG_ORIG(MSG_FMT_NULLSYMNAM),
181 symtab_name, EC_WORD(symndx));
182 }
183
184 return (buf);
185
186 #undef INIT_BUFSIZE
187 }
188
189 /*
190 * Shared objects can be built that define specific symbols that can not be
191 * directly bound to. These objects have a syminfo section (and an associated
192 * DF_1_NODIRECT dynamic flags entry). Scan this table looking for symbols
193 * that can't be bound to directly, and if this files symbol is presently
194 * referenced, mark it so that we don't directly bind to it.
195 */
196 uintptr_t
197 ld_sym_nodirect(Is_desc *isp, Ifl_desc *ifl, Ofl_desc *ofl)
198 {
199 Shdr *sifshdr, *symshdr;
200 Syminfo *sifdata;
201 Sym *symdata;
202 char *strdata;
203 ulong_t cnt, _cnt;
204
205 /*
206 * Get the syminfo data, and determine the number of entries.
207 */
208 sifshdr = isp->is_shdr;
209 sifdata = (Syminfo *)isp->is_indata->d_buf;
210 cnt = sifshdr->sh_size / sifshdr->sh_entsize;
211
212 /*
213 * Get the associated symbol table.
214 */
215 if ((sifshdr->sh_link == 0) || (sifshdr->sh_link >= ifl->ifl_shnum)) {
216 /*
217 * Broken input file
218 */
219 ld_eprintf(ofl, ERR_FATAL, MSG_INTL(MSG_FIL_INVSHINFO),
220 ifl->ifl_name, isp->is_name, EC_XWORD(sifshdr->sh_link));
221 return (0);
222 }
223 symshdr = ifl->ifl_isdesc[sifshdr->sh_link]->is_shdr;
224 symdata = ifl->ifl_isdesc[sifshdr->sh_link]->is_indata->d_buf;
225
226 /*
227 * Get the string table associated with the symbol table.
228 */
229 strdata = ifl->ifl_isdesc[symshdr->sh_link]->is_indata->d_buf;
230
231 /*
232 * Traverse the syminfo data for symbols that can't be directly
233 * bound to.
234 */
235 for (_cnt = 1, sifdata++; _cnt < cnt; _cnt++, sifdata++) {
236 Sym *sym;
237 char *str;
238 Sym_desc *sdp;
239
240 if ((sifdata->si_flags & SYMINFO_FLG_NOEXTDIRECT) == 0)
241 continue;
242
243 sym = (Sym *)(symdata + _cnt);
244 str = (char *)(strdata + sym->st_name);
245
246 if ((sdp = ld_sym_find(str, SYM_NOHASH, NULL, ofl)) != NULL) {
247 if (ifl != sdp->sd_file)
248 continue;
249
250 sdp->sd_flags &= ~FLG_SY_DIR;
251 sdp->sd_flags |= FLG_SY_NDIR;
252 }
253 }
254 return (0);
255 }
256
257 /*
258 * If, during symbol processing, it is necessary to update a local symbols
259 * contents before we have generated the symbol tables in the output image,
260 * create a new symbol structure and copy the original symbol contents. While
261 * we are processing the input files, their local symbols are part of the
262 * read-only mapped image. Commonly, these symbols are copied to the new output
263 * file image and then updated to reflect their new address and any change in
264 * attributes. However, sometimes during relocation counting, it is necessary
265 * to adjust the symbols information. This routine provides for the generation
266 * of a new symbol image so that this update can be performed.
267 * All global symbols are copied to an internal symbol table to improve locality
268 * of reference and hence performance, and thus this copying is not necessary.
269 */
270 uintptr_t
271 ld_sym_copy(Sym_desc *sdp)
272 {
273 Sym *nsym;
274
275 if (sdp->sd_flags & FLG_SY_CLEAN) {
276 if ((nsym = libld_malloc(sizeof (Sym))) == NULL)
277 return (S_ERROR);
278 *nsym = *(sdp->sd_sym);
279 sdp->sd_sym = nsym;
280 sdp->sd_flags &= ~FLG_SY_CLEAN;
281 }
282 return (1);
283 }
284
285 /*
286 * Finds a given name in the link editors internal symbol table. If no
287 * hash value is specified it is calculated. A pointer to the located
288 * Sym_desc entry is returned, or NULL if the symbol is not found.
289 */
290 Sym_desc *
291 ld_sym_find(const char *name, Word hash, avl_index_t *where, Ofl_desc *ofl)
292 {
293 Sym_avlnode qsav, *sav;
294
295 if (hash == SYM_NOHASH)
296 /* LINTED */
297 hash = (Word)elf_hash((const char *)name);
298 qsav.sav_hash = hash;
299 qsav.sav_name = name;
300
301 /*
302 * Perform search for symbol in AVL tree. Note that the 'where' field
303 * is passed in from the caller. If a 'where' is present, it can be
304 * used in subsequent 'ld_sym_enter()' calls if required.
305 */
306 sav = avl_find(&ofl->ofl_symavl, &qsav, where);
307
308 /*
309 * If symbol was not found in the avl tree, return null to show that.
310 */
311 if (sav == NULL)
312 return (NULL);
313
314 /*
315 * Return symbol found.
316 */
317 return (sav->sav_sdp);
318 }
319
320 /*
321 * Enter a new symbol into the link editors internal symbol table.
322 * If the symbol is from an input file, information regarding the input file
323 * and input section is also recorded. Otherwise (file == NULL) the symbol
324 * has been internally generated (ie. _etext, _edata, etc.).
325 */
326 Sym_desc *
327 ld_sym_enter(const char *name, Sym *osym, Word hash, Ifl_desc *ifl,
328 Ofl_desc *ofl, Word ndx, Word shndx, sd_flag_t sdflags, avl_index_t *where)
329 {
330 Sym_desc *sdp;
331 Sym_aux *sap;
332 Sym_avlnode *savl;
333 char *_name;
334 Sym *nsym;
335 Half etype;
336 uchar_t vis;
337 avl_index_t _where;
338
339 /*
340 * Establish the file type.
341 */
342 if (ifl)
343 etype = ifl->ifl_ehdr->e_type;
344 else
345 etype = ET_NONE;
346
347 ofl->ofl_entercnt++;
348
349 /*
350 * Allocate a Sym Descriptor, Auxiliary Descriptor, and a Sym AVLNode -
351 * contiguously.
352 */
353 if ((savl = libld_calloc(S_DROUND(sizeof (Sym_avlnode)) +
354 S_DROUND(sizeof (Sym_desc)) +
355 S_DROUND(sizeof (Sym_aux)), 1)) == NULL)
356 return ((Sym_desc *)S_ERROR);
357 sdp = (Sym_desc *)((uintptr_t)savl +
358 S_DROUND(sizeof (Sym_avlnode)));
359 sap = (Sym_aux *)((uintptr_t)sdp +
360 S_DROUND(sizeof (Sym_desc)));
361
362 savl->sav_sdp = sdp;
363 sdp->sd_file = ifl;
364 sdp->sd_aux = sap;
365 savl->sav_hash = sap->sa_hash = hash;
366
367 /*
368 * Copy the symbol table entry from the input file into the internal
369 * entry and have the symbol descriptor use it.
370 */
371 sdp->sd_sym = nsym = &sap->sa_sym;
372 *nsym = *osym;
373 sdp->sd_shndx = shndx;
374 sdp->sd_flags |= sdflags;
375
376 if ((_name = libld_malloc(strlen(name) + 1)) == NULL)
377 return ((Sym_desc *)S_ERROR);
378 savl->sav_name = sdp->sd_name = (const char *)strcpy(_name, name);
379
380 /*
381 * Enter Symbol in AVL tree.
382 */
383 if (where == 0) {
384 /* LINTED */
385 Sym_avlnode *_savl;
386 /*
387 * If a previous ld_sym_find() hasn't initialized 'where' do it
388 * now.
389 */
390 where = &_where;
391 _savl = avl_find(&ofl->ofl_symavl, savl, where);
392 assert(_savl == NULL);
393 }
394 avl_insert(&ofl->ofl_symavl, savl, *where);
395
396 /*
397 * Record the section index. This is possible because the
398 * `ifl_isdesc' table is filled before we start symbol processing.
399 */
400 if ((sdflags & FLG_SY_SPECSEC) || (nsym->st_shndx == SHN_UNDEF))
401 sdp->sd_isc = NULL;
402 else {
403 sdp->sd_isc = ifl->ifl_isdesc[shndx];
404
405 /*
406 * If this symbol is from a relocatable object, make sure that
407 * it is still associated with a section. For example, an
408 * unknown section type (SHT_NULL) would have been rejected on
409 * input with a warning. Here, we make the use of the symbol
410 * fatal. A symbol descriptor is still returned, so that the
411 * caller can continue processing all symbols, and hence flush
412 * out as many error conditions as possible.
413 */
414 if ((etype == ET_REL) && (sdp->sd_isc == NULL)) {
415 ld_eprintf(ofl, ERR_FATAL, MSG_INTL(MSG_SYM_INVSEC),
416 name, ifl->ifl_name, EC_XWORD(shndx));
417 return (sdp);
418 }
419 }
420
421 /*
422 * Mark any COMMON symbols as 'tentative'.
423 */
424 if (sdflags & FLG_SY_SPECSEC) {
425 if (nsym->st_shndx == SHN_COMMON)
426 sdp->sd_flags |= FLG_SY_TENTSYM;
427 #if defined(_ELF64)
428 else if ((ld_targ.t_m.m_mach == EM_AMD64) &&
429 (nsym->st_shndx == SHN_X86_64_LCOMMON))
430 sdp->sd_flags |= FLG_SY_TENTSYM;
431 #endif
432 }
433
434 /*
435 * Establish the symbols visibility and reference.
436 */
437 vis = ELF_ST_VISIBILITY(nsym->st_other);
438
439 if ((etype == ET_NONE) || (etype == ET_REL)) {
440 switch (vis) {
441 case STV_DEFAULT:
442 sdp->sd_flags |= FLG_SY_DEFAULT;
443 break;
444 case STV_INTERNAL:
445 case STV_HIDDEN:
446 sdp->sd_flags |= FLG_SY_HIDDEN;
447 break;
448 case STV_PROTECTED:
449 sdp->sd_flags |= FLG_SY_PROTECT;
450 break;
451 case STV_EXPORTED:
452 sdp->sd_flags |= FLG_SY_EXPORT;
453 break;
454 case STV_SINGLETON:
455 sdp->sd_flags |= (FLG_SY_SINGLE | FLG_SY_NDIR);
456 ofl->ofl_flags1 |= (FLG_OF1_NDIRECT | FLG_OF1_NGLBDIR);
457 break;
458 case STV_ELIMINATE:
459 sdp->sd_flags |= (FLG_SY_HIDDEN | FLG_SY_ELIM);
460 break;
461 default:
462 assert(vis <= STV_ELIMINATE);
463 }
464
465 sdp->sd_ref = REF_REL_NEED;
466
467 /*
468 * Under -Bnodirect, all exported interfaces that have not
469 * explicitly been defined protected or directly bound to, are
470 * tagged to prevent direct binding.
471 */
472 if ((ofl->ofl_flags1 & FLG_OF1_ALNODIR) &&
473 ((sdp->sd_flags & (FLG_SY_PROTECT | FLG_SY_DIR)) == 0) &&
474 (nsym->st_shndx != SHN_UNDEF)) {
475 sdp->sd_flags |= FLG_SY_NDIR;
476 }
477 } else {
478 sdp->sd_ref = REF_DYN_SEEN;
479
480 /*
481 * If this is a protected symbol, remember this. Note, this
482 * state is different from the FLG_SY_PROTECT used to establish
483 * a symbol definitions visibility. This state is used to warn
484 * against possible copy relocations against this referenced
485 * symbol.
486 */
487 if (vis == STV_PROTECTED)
488 sdp->sd_flags |= FLG_SY_PROT;
489
490 /*
491 * If this is a SINGLETON definition, then indicate the symbol
492 * can not be directly bound to, and retain the visibility.
493 * This visibility will be inherited by any references made to
494 * this symbol.
495 */
496 if ((vis == STV_SINGLETON) && (nsym->st_shndx != SHN_UNDEF))
497 sdp->sd_flags |= (FLG_SY_SINGLE | FLG_SY_NDIR);
498
499 /*
500 * If the new symbol is from a shared library and is associated
501 * with a SHT_NOBITS section then this symbol originated from a
502 * tentative symbol.
503 */
504 if (sdp->sd_isc &&
505 (sdp->sd_isc->is_shdr->sh_type == SHT_NOBITS))
506 sdp->sd_flags |= FLG_SY_TENTSYM;
507 }
508
509 /*
510 * Reclassify any SHN_SUNW_IGNORE symbols to SHN_UNDEF so as to
511 * simplify future processing.
512 */
513 if (nsym->st_shndx == SHN_SUNW_IGNORE) {
514 sdp->sd_shndx = shndx = SHN_UNDEF;
515 sdp->sd_flags |= (FLG_SY_REDUCED |
516 FLG_SY_HIDDEN | FLG_SY_IGNORE | FLG_SY_ELIM);
517 }
518
519 /*
520 * If this is an undefined, or common symbol from a relocatable object
521 * determine whether it is a global or weak reference (see build_osym(),
522 * where REF_DYN_NEED definitions are returned back to undefines).
523 */
524 if ((etype == ET_REL) &&
525 (ELF_ST_BIND(nsym->st_info) == STB_GLOBAL) &&
526 ((nsym->st_shndx == SHN_UNDEF) || ((sdflags & FLG_SY_SPECSEC) &&
527 #if defined(_ELF64)
528 ((nsym->st_shndx == SHN_COMMON) ||
529 ((ld_targ.t_m.m_mach == EM_AMD64) &&
530 (nsym->st_shndx == SHN_X86_64_LCOMMON))))))
531 #else
532 /* BEGIN CSTYLED */
533 (nsym->st_shndx == SHN_COMMON))))
534 /* END CSTYLED */
535 #endif
536 sdp->sd_flags |= FLG_SY_GLOBREF;
537
538 /*
539 * Record the input filename on the referenced or defined files list
540 * for possible later diagnostics. The `sa_rfile' pointer contains the
541 * name of the file that first referenced this symbol and is used to
542 * generate undefined symbol diagnostics (refer to sym_undef_entry()).
543 * Note that this entry can be overridden if a reference from a
544 * relocatable object is found after a reference from a shared object
545 * (refer to sym_override()).
546 * The `sa_dfiles' list is used to maintain the list of files that
547 * define the same symbol. This list can be used for two reasons:
548 *
549 * - To save the first definition of a symbol that is not available
550 * for this link-edit.
551 *
552 * - To save all definitions of a symbol when the -m option is in
553 * effect. This is optional as it is used to list multiple
554 * (interposed) definitions of a symbol (refer to ldmap_out()),
555 * and can be quite expensive.
556 */
557 if (nsym->st_shndx == SHN_UNDEF) {
558 sap->sa_rfile = ifl->ifl_name;
559 } else {
560 if (sdp->sd_ref == REF_DYN_SEEN) {
561 /*
562 * A symbol is determined to be unavailable if it
563 * belongs to a version of a shared object that this
564 * user does not wish to use, or if it belongs to an
565 * implicit shared object.
566 */
567 if (ifl->ifl_vercnt) {
568 Ver_index *vip;
569 Half vndx = ifl->ifl_versym[ndx];
570
571 sap->sa_dverndx = vndx;
572 vip = &ifl->ifl_verndx[vndx];
573 if (!(vip->vi_flags & FLG_VER_AVAIL)) {
574 sdp->sd_flags |= FLG_SY_NOTAVAIL;
575 sap->sa_vfile = ifl->ifl_name;
576 }
577 }
578 if (!(ifl->ifl_flags & FLG_IF_NEEDED))
579 sdp->sd_flags |= FLG_SY_NOTAVAIL;
580
581 } else if (etype == ET_REL) {
582 /*
583 * If this symbol has been obtained from a versioned
584 * input relocatable object then the new symbol must be
585 * promoted to the versioning of the output file.
586 */
587 if (ifl->ifl_versym)
588 ld_vers_promote(sdp, ndx, ifl, ofl);
589 }
590
591 if ((ofl->ofl_flags & FLG_OF_GENMAP) &&
592 ((sdflags & FLG_SY_SPECSEC) == 0))
593 if (aplist_append(&sap->sa_dfiles, ifl->ifl_name,
594 AL_CNT_SDP_DFILES) == NULL)
595 return ((Sym_desc *)S_ERROR);
596 }
597
598 /*
599 * Provided we're not processing a mapfile, diagnose the entered symbol.
600 * Mapfile processing requires the symbol to be updated with additional
601 * information, therefore the diagnosing of the symbol is deferred until
602 * later (see Dbg_map_symbol()).
603 */
604 if ((ifl == NULL) || ((ifl->ifl_flags & FLG_IF_MAPFILE) == 0))
605 DBG_CALL(Dbg_syms_entered(ofl, nsym, sdp));
606
607 return (sdp);
608 }
609
610 /*
611 * Add a special symbol to the symbol table. Takes special symbol name with
612 * and without underscores. This routine is called, after all other symbol
613 * resolution has completed, to generate a reserved absolute symbol (the
614 * underscore version). Special symbols are updated with the appropriate
615 * values in update_osym(). If the user has already defined this symbol
616 * issue a warning and leave the symbol as is. If the non-underscore symbol
617 * is referenced then turn it into a weak alias of the underscored symbol.
618 *
619 * The bits in sdflags_u are OR'd into the flags field of the symbol for the
620 * underscored symbol.
621 *
622 * If this is a global symbol, and it hasn't explicitly been defined as being
623 * directly bound to, indicate that it can't be directly bound to.
624 * Historically, most special symbols only have meaning to the object in which
625 * they exist, however, they've always been global. To ensure compatibility
626 * with any unexpected use presently in effect, ensure these symbols don't get
627 * directly bound to. Note, that establishing this state here isn't sufficient
628 * to create a syminfo table, only if a syminfo table is being created by some
629 * other symbol directives will the nodirect binding be recorded. This ensures
630 * we don't create syminfo sections for all objects we create, as this might add
631 * unnecessary bloat to users who haven't explicitly requested extra symbol
632 * information.
633 */
634 static uintptr_t
635 sym_add_spec(const char *name, const char *uname, Word sdaux_id,
636 sd_flag_t sdflags_u, sd_flag_t sdflags, Ofl_desc *ofl)
637 {
638 Sym_desc *sdp;
639 Sym_desc *usdp;
640 Sym *sym;
641 Word hash;
642 avl_index_t where;
643
644 /* LINTED */
645 hash = (Word)elf_hash(uname);
646 if (usdp = ld_sym_find(uname, hash, &where, ofl)) {
647 /*
648 * If the underscore symbol exists and is undefined, or was
649 * defined in a shared library, convert it to a local symbol.
650 * Otherwise leave it as is and warn the user.
651 */
652 if ((usdp->sd_shndx == SHN_UNDEF) ||
653 (usdp->sd_ref != REF_REL_NEED)) {
654 usdp->sd_ref = REF_REL_NEED;
655 usdp->sd_shndx = usdp->sd_sym->st_shndx = SHN_ABS;
656 usdp->sd_flags |= FLG_SY_SPECSEC | sdflags_u;
657 usdp->sd_sym->st_info =
658 ELF_ST_INFO(STB_GLOBAL, STT_OBJECT);
659 usdp->sd_isc = NULL;
660 usdp->sd_sym->st_size = 0;
661 usdp->sd_sym->st_value = 0;
662 /* LINTED */
663 usdp->sd_aux->sa_symspec = (Half)sdaux_id;
664
665 /*
666 * If a user hasn't specifically indicated that the
667 * scope of this symbol be made local, then leave it
668 * as global (ie. prevent automatic scoping). The GOT
669 * should be defined protected, whereas all other
670 * special symbols are tagged as no-direct.
671 */
672 if (!SYM_IS_HIDDEN(usdp) &&
673 (sdflags & FLG_SY_DEFAULT)) {
674 usdp->sd_aux->sa_overndx = VER_NDX_GLOBAL;
675 if (sdaux_id == SDAUX_ID_GOT) {
676 usdp->sd_flags &= ~FLG_SY_NDIR;
677 usdp->sd_flags |= FLG_SY_PROTECT;
678 usdp->sd_sym->st_other = STV_PROTECTED;
679 } else if (
680 ((usdp->sd_flags & FLG_SY_DIR) == 0) &&
681 ((ofl->ofl_flags & FLG_OF_SYMBOLIC) == 0)) {
682 usdp->sd_flags |= FLG_SY_NDIR;
683 }
684 }
685 usdp->sd_flags |= sdflags;
686
687 /*
688 * If the reference originated from a mapfile ensure
689 * we mark the symbol as used.
690 */
691 if (usdp->sd_flags & FLG_SY_MAPREF)
692 usdp->sd_flags |= FLG_SY_MAPUSED;
693
694 DBG_CALL(Dbg_syms_updated(ofl, usdp, uname));
695 } else {
696 ld_eprintf(ofl, ERR_WARNING, MSG_INTL(MSG_SYM_RESERVE),
697 uname, usdp->sd_file->ifl_name);
698 }
699 } else {
700 /*
701 * If the symbol does not exist create it.
702 */
703 if ((sym = libld_calloc(sizeof (Sym), 1)) == NULL)
704 return (S_ERROR);
705 sym->st_shndx = SHN_ABS;
706 sym->st_info = ELF_ST_INFO(STB_GLOBAL, STT_OBJECT);
707 sym->st_size = 0;
708 sym->st_value = 0;
709 DBG_CALL(Dbg_syms_created(ofl->ofl_lml, uname));
710 if ((usdp = ld_sym_enter(uname, sym, hash, (Ifl_desc *)NULL,
711 ofl, 0, SHN_ABS, (FLG_SY_SPECSEC | sdflags_u), &where)) ==
712 (Sym_desc *)S_ERROR)
713 return (S_ERROR);
714 usdp->sd_ref = REF_REL_NEED;
715 /* LINTED */
716 usdp->sd_aux->sa_symspec = (Half)sdaux_id;
717
718 usdp->sd_aux->sa_overndx = VER_NDX_GLOBAL;
719
720 if (sdaux_id == SDAUX_ID_GOT) {
721 usdp->sd_flags |= FLG_SY_PROTECT;
722 usdp->sd_sym->st_other = STV_PROTECTED;
723 } else if ((sdflags & FLG_SY_DEFAULT) &&
724 ((ofl->ofl_flags & FLG_OF_SYMBOLIC) == 0)) {
725 usdp->sd_flags |= FLG_SY_NDIR;
726 }
727 usdp->sd_flags |= sdflags;
728 }
729
730 if (name && (sdp = ld_sym_find(name, SYM_NOHASH, NULL, ofl)) &&
731 (sdp->sd_sym->st_shndx == SHN_UNDEF)) {
732 uchar_t bind;
733
734 /*
735 * If the non-underscore symbol exists and is undefined
736 * convert it to be a local. If the underscore has
737 * sa_symspec set (ie. it was created above) then simulate this
738 * as a weak alias.
739 */
740 sdp->sd_ref = REF_REL_NEED;
741 sdp->sd_shndx = sdp->sd_sym->st_shndx = SHN_ABS;
742 sdp->sd_flags |= FLG_SY_SPECSEC;
743 sdp->sd_isc = NULL;
744 sdp->sd_sym->st_size = 0;
745 sdp->sd_sym->st_value = 0;
746 /* LINTED */
747 sdp->sd_aux->sa_symspec = (Half)sdaux_id;
748 if (usdp->sd_aux->sa_symspec) {
749 usdp->sd_aux->sa_linkndx = 0;
750 sdp->sd_aux->sa_linkndx = 0;
751 bind = STB_WEAK;
752 } else
753 bind = STB_GLOBAL;
754 sdp->sd_sym->st_info = ELF_ST_INFO(bind, STT_OBJECT);
755
756 /*
757 * If a user hasn't specifically indicated the scope of this
758 * symbol be made local then leave it as global (ie. prevent
759 * automatic scoping). The GOT should be defined protected,
760 * whereas all other special symbols are tagged as no-direct.
761 */
762 if (!SYM_IS_HIDDEN(sdp) &&
763 (sdflags & FLG_SY_DEFAULT)) {
764 sdp->sd_aux->sa_overndx = VER_NDX_GLOBAL;
765 if (sdaux_id == SDAUX_ID_GOT) {
766 sdp->sd_flags &= ~FLG_SY_NDIR;
767 sdp->sd_flags |= FLG_SY_PROTECT;
768 sdp->sd_sym->st_other = STV_PROTECTED;
769 } else if (((sdp->sd_flags & FLG_SY_DIR) == 0) &&
770 ((ofl->ofl_flags & FLG_OF_SYMBOLIC) == 0)) {
771 sdp->sd_flags |= FLG_SY_NDIR;
772 }
773 }
774 sdp->sd_flags |= sdflags;
775
776 /*
777 * If the reference originated from a mapfile ensure
778 * we mark the symbol as used.
779 */
780 if (sdp->sd_flags & FLG_SY_MAPREF)
781 sdp->sd_flags |= FLG_SY_MAPUSED;
782
783 DBG_CALL(Dbg_syms_updated(ofl, sdp, name));
784 }
785 return (1);
786 }
787
788
789 /*
790 * Undefined symbols can fall into one of four types:
791 *
792 * - the symbol is really undefined (SHN_UNDEF).
793 *
794 * - versioning has been enabled, however this symbol has not been assigned
795 * to one of the defined versions.
796 *
797 * - the symbol has been defined by an implicitly supplied library, ie. one
798 * which was encounted because it was NEEDED by another library, rather
799 * than from a command line supplied library which would become the only
800 * dependency of the output file being produced.
801 *
802 * - the symbol has been defined by a version of a shared object that is
803 * not permitted for this link-edit.
804 *
805 * In all cases the file who made the first reference to this symbol will have
806 * been recorded via the `sa_rfile' pointer.
807 */
808 typedef enum {
809 UNDEF, NOVERSION, IMPLICIT, NOTAVAIL,
810 BNDLOCAL
811 } Type;
812
813 static const Msg format[] = {
814 MSG_SYM_UND_UNDEF, /* MSG_INTL(MSG_SYM_UND_UNDEF) */
815 MSG_SYM_UND_NOVER, /* MSG_INTL(MSG_SYM_UND_NOVER) */
816 MSG_SYM_UND_IMPL, /* MSG_INTL(MSG_SYM_UND_IMPL) */
817 MSG_SYM_UND_NOTA, /* MSG_INTL(MSG_SYM_UND_NOTA) */
818 MSG_SYM_UND_BNDLOCAL /* MSG_INTL(MSG_SYM_UND_BNDLOCAL) */
819 };
820
821 /*
822 * Issue an undefined symbol message for the given symbol.
823 *
824 * entry:
825 * ofl - Output descriptor
826 * sdp - Undefined symbol to report
827 * type - Type of undefined symbol
828 * ofl_flag - One of 0, FLG_OF_FATAL, or FLG_OF_WARN.
829 * undef_state - Address of variable to be initialized to 0
830 * before the first call to sym_undef_entry, and passed
831 * to each subsequent call. A non-zero value for *undef_state
832 * indicates that this is not the first call in the series.
833 *
834 * exit:
835 * If *undef_state is 0, a title is issued.
836 *
837 * A message for the undefined symbol is issued.
838 *
839 * If ofl_flag is non-zero, its value is OR'd into *undef_state. Otherwise,
840 * all bits other than FLG_OF_FATAL and FLG_OF_WARN are set, in order to
841 * provide *undef_state with a non-zero value. These other bits have
842 * no meaning beyond that, and serve to ensure that *undef_state is
843 * non-zero if sym_undef_entry() has been called.
844 */
845 static void
846 sym_undef_entry(Ofl_desc *ofl, Sym_desc *sdp, Type type, ofl_flag_t ofl_flag,
847 ofl_flag_t *undef_state)
848 {
849 const char *name1, *name2, *name3;
850 Ifl_desc *ifl = sdp->sd_file;
851 Sym_aux *sap = sdp->sd_aux;
852
853 if (*undef_state == 0)
854 ld_eprintf(ofl, ERR_NONE, MSG_INTL(MSG_SYM_FMT_UNDEF),
855 MSG_INTL(MSG_SYM_UNDEF_ITM_11),
856 MSG_INTL(MSG_SYM_UNDEF_ITM_21),
857 MSG_INTL(MSG_SYM_UNDEF_ITM_12),
858 MSG_INTL(MSG_SYM_UNDEF_ITM_22));
859
860 ofl->ofl_flags |= ofl_flag;
861 *undef_state |= ofl_flag ? ofl_flag : ~(FLG_OF_FATAL | FLG_OF_WARN);
862
863 switch (type) {
864 case UNDEF:
865 case BNDLOCAL:
866 name1 = sap->sa_rfile;
867 break;
868 case NOVERSION:
869 name1 = ifl->ifl_name;
870 break;
871 case IMPLICIT:
872 name1 = sap->sa_rfile;
873 name2 = ifl->ifl_name;
874 break;
875 case NOTAVAIL:
876 name1 = sap->sa_rfile;
877 name2 = sap->sa_vfile;
878 name3 = ifl->ifl_verndx[sap->sa_dverndx].vi_name;
879 break;
880 default:
881 return;
882 }
883
884 ld_eprintf(ofl, ERR_NONE, MSG_INTL(format[type]),
885 demangle(sdp->sd_name), name1, name2, name3);
886 }
887
888 /*
889 * If an undef symbol exists naming a bound for the output section,
890 * turn it into a defined symbol with the correct value.
891 *
892 * We set an arbitrary 1KB limit on the resulting symbol names.
893 */
894 static void
895 sym_add_bounds(Ofl_desc *ofl, Os_desc *osp, Word bound)
896 {
897 Sym_desc *bsdp;
898 char symn[1024];
899 size_t nsz;
900
901 switch (bound) {
902 case SDAUX_ID_SECBOUND_START:
903 nsz = snprintf(symn, sizeof (symn), "%s%s",
904 MSG_ORIG(MSG_SYM_SECBOUND_START), osp->os_name);
905 if (nsz >= sizeof (symn))
906 return;
907 break;
908 case SDAUX_ID_SECBOUND_STOP:
909 nsz = snprintf(symn, sizeof (symn), "%s%s",
910 MSG_ORIG(MSG_SYM_SECBOUND_STOP), osp->os_name);
911 if (nsz >= sizeof (symn))
912 return;
913 break;
914 default:
915 assert(0);
916 }
917
918 if ((bsdp = ld_sym_find(symn, SYM_NOHASH, NULL, ofl)) != NULL) {
919 if ((bsdp->sd_shndx != SHN_UNDEF) &&
920 (bsdp->sd_ref == REF_REL_NEED)) {
921 ld_eprintf(ofl, ERR_WARNING, MSG_INTL(MSG_SYM_RESERVE),
922 symn, bsdp->sd_file->ifl_name);
923 return;
924 }
925
926 DBG_CALL(Dbg_syms_updated(ofl, bsdp, symn));
927
928 bsdp->sd_aux->sa_symspec = bound;
929 bsdp->sd_aux->sa_boundsec = osp;
930 bsdp->sd_flags |= FLG_SY_SPECSEC;
931 bsdp->sd_ref = REF_REL_NEED;
932 bsdp->sd_sym->st_info = ELF_ST_INFO(STB_GLOBAL, STT_NOTYPE);
933 bsdp->sd_sym->st_other = STV_PROTECTED;
934 bsdp->sd_isc = NULL;
935 bsdp->sd_sym->st_size = 0;
936 bsdp->sd_sym->st_value = 0;
937 bsdp->sd_shndx = bsdp->sd_sym->st_shndx = SHN_ABS;
938 }
939 }
940
941 static Boolean
942 is_cname(const char *name)
943 {
944 if (strlen(name) == strspn(name,
945 "abcdefghijklmnopqrstuvwxyz"
946 "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
947 "0123456789"
948 "_"))
949 return (TRUE);
950 else
951 return (FALSE);
952 }
953
954 /*
955 * At this point all symbol input processing has been completed, therefore
956 * complete the symbol table entries by generating any necessary internal
957 * symbols.
958 */
959 uintptr_t
960 ld_sym_spec(Ofl_desc *ofl)
961 {
962 Sym_desc *sdp;
963 Sg_desc *sgp;
964
965 DBG_CALL(Dbg_syms_spec_title(ofl->ofl_lml));
966
967 /*
968 * For each section in the output file, look for symbols named for the
969 * __start/__stop patterns. If references exist, flesh the symbols to
970 * be defined.
971 *
972 * The symbols are given values at the same time as the other special
973 * symbols.
974 */
975 if (!(ofl->ofl_flags & FLG_OF_RELOBJ) ||
976 (ofl->ofl_flags & FLG_OF_KMOD)) {
977 Aliste idx1;
978
979 for (APLIST_TRAVERSE(ofl->ofl_segs, idx1, sgp)) {
980 Os_desc *osp;
981 Aliste idx2;
982
983 for (APLIST_TRAVERSE(sgp->sg_osdescs, idx2, osp)) {
984 if (is_cname(osp->os_name)) {
985 sym_add_bounds(ofl, osp,
986 SDAUX_ID_SECBOUND_START);
987 sym_add_bounds(ofl, osp,
988 SDAUX_ID_SECBOUND_STOP);
989 }
990 }
991 }
992 }
993
994 if (ofl->ofl_flags & FLG_OF_RELOBJ)
995 return (1);
996
997 if (sym_add_spec(MSG_ORIG(MSG_SYM_ETEXT), MSG_ORIG(MSG_SYM_ETEXT_U),
998 SDAUX_ID_ETEXT, 0, (FLG_SY_DEFAULT | FLG_SY_EXPDEF),
999 ofl) == S_ERROR)
1000 return (S_ERROR);
1001 if (sym_add_spec(MSG_ORIG(MSG_SYM_EDATA), MSG_ORIG(MSG_SYM_EDATA_U),
1002 SDAUX_ID_EDATA, 0, (FLG_SY_DEFAULT | FLG_SY_EXPDEF),
1003 ofl) == S_ERROR)
1004 return (S_ERROR);
1005 if (sym_add_spec(MSG_ORIG(MSG_SYM_END), MSG_ORIG(MSG_SYM_END_U),
1006 SDAUX_ID_END, FLG_SY_DYNSORT, (FLG_SY_DEFAULT | FLG_SY_EXPDEF),
1007 ofl) == S_ERROR)
1008 return (S_ERROR);
1009 if (sym_add_spec(MSG_ORIG(MSG_SYM_L_END), MSG_ORIG(MSG_SYM_L_END_U),
1010 SDAUX_ID_END, 0, FLG_SY_HIDDEN, ofl) == S_ERROR)
1011 return (S_ERROR);
1012 if (sym_add_spec(MSG_ORIG(MSG_SYM_L_START), MSG_ORIG(MSG_SYM_L_START_U),
1013 SDAUX_ID_START, 0, FLG_SY_HIDDEN, ofl) == S_ERROR)
1014 return (S_ERROR);
1015
1016 /*
1017 * Historically we've always produced a _DYNAMIC symbol, even for
1018 * static executables (in which case its value will be 0).
1019 */
1020 if (sym_add_spec(MSG_ORIG(MSG_SYM_DYNAMIC), MSG_ORIG(MSG_SYM_DYNAMIC_U),
1021 SDAUX_ID_DYN, FLG_SY_DYNSORT, (FLG_SY_DEFAULT | FLG_SY_EXPDEF),
1022 ofl) == S_ERROR)
1023 return (S_ERROR);
1024
1025 if (OFL_ALLOW_DYNSYM(ofl))
1026 if (sym_add_spec(MSG_ORIG(MSG_SYM_PLKTBL),
1027 MSG_ORIG(MSG_SYM_PLKTBL_U), SDAUX_ID_PLT,
1028 FLG_SY_DYNSORT, (FLG_SY_DEFAULT | FLG_SY_EXPDEF),
1029 ofl) == S_ERROR)
1030 return (S_ERROR);
1031
1032 /*
1033 * A GOT reference will be accompanied by the associated GOT symbol.
1034 * Make sure it gets assigned the appropriate special attributes.
1035 */
1036 if (((sdp = ld_sym_find(MSG_ORIG(MSG_SYM_GOFTBL_U),
1037 SYM_NOHASH, NULL, ofl)) != NULL) && (sdp->sd_ref != REF_DYN_SEEN)) {
1038 if (sym_add_spec(MSG_ORIG(MSG_SYM_GOFTBL),
1039 MSG_ORIG(MSG_SYM_GOFTBL_U), SDAUX_ID_GOT, FLG_SY_DYNSORT,
1040 (FLG_SY_DEFAULT | FLG_SY_EXPDEF), ofl) == S_ERROR)
1041 return (S_ERROR);
1042 }
1043
1044 return (1);
1045 }
1046
1047 /*
1048 * Determine a potential capability symbol's visibility.
1049 *
1050 * The -z symbolcap option transforms an object capabilities relocatable object
1051 * into a symbol capabilities relocatable object. Any global function symbols,
1052 * or initialized global data symbols are candidates for transforming into local
1053 * symbol capabilities definitions. However, if a user indicates that a symbol
1054 * should be demoted to local using a mapfile, then there is no need to
1055 * transform the associated global symbol.
1056 *
1057 * Normally, a symbol's visibility is determined after the symbol resolution
1058 * process, after all symbol state has been gathered and resolved. However,
1059 * for -z symbolcap, this determination is too late. When a global symbol is
1060 * read from an input file we need to determine it's visibility so as to decide
1061 * whether to create a local or not.
1062 *
1063 * If a user has explicitly defined this symbol as having local scope within a
1064 * mapfile, then a symbol of the same name already exists. However, explicit
1065 * local definitions are uncommon, as most mapfiles define the global symbol
1066 * requirements together with an auto-reduction directive '*'. If this state
1067 * has been defined, then we must make sure that the new symbol isn't a type
1068 * that can not be demoted to local.
1069 */
1070 static int
1071 sym_cap_vis(const char *name, Word hash, Sym *sym, Ofl_desc *ofl)
1072 {
1073 Sym_desc *sdp;
1074 uchar_t vis;
1075 avl_index_t where;
1076 sd_flag_t sdflags = 0;
1077
1078 /*
1079 * Determine the visibility of the new symbol.
1080 */
1081 vis = ELF_ST_VISIBILITY(sym->st_other);
1082 switch (vis) {
1083 case STV_EXPORTED:
1084 sdflags |= FLG_SY_EXPORT;
1085 break;
1086 case STV_SINGLETON:
1087 sdflags |= FLG_SY_SINGLE;
1088 break;
1089 }
1090
1091 /*
1092 * Determine whether a symbol definition already exists, and if so
1093 * obtain the visibility.
1094 */
1095 if ((sdp = ld_sym_find(name, hash, &where, ofl)) != NULL)
1096 sdflags |= sdp->sd_flags;
1097
1098 /*
1099 * Determine whether the symbol flags indicate this symbol should be
1100 * hidden.
1101 */
1102 if ((ofl->ofl_flags & (FLG_OF_AUTOLCL | FLG_OF_AUTOELM)) &&
1103 ((sdflags & MSK_SY_NOAUTO) == 0))
1104 sdflags |= FLG_SY_HIDDEN;
1105
1106 return ((sdflags & FLG_SY_HIDDEN) == 0);
1107 }
1108
1109 /*
1110 * This routine checks to see if a symbols visibility needs to be reduced to
1111 * either SYMBOLIC or LOCAL. This routine can be called from either
1112 * reloc_init() or sym_validate().
1113 */
1114 void
1115 ld_sym_adjust_vis(Sym_desc *sdp, Ofl_desc *ofl)
1116 {
1117 ofl_flag_t oflags = ofl->ofl_flags;
1118 Sym *sym = sdp->sd_sym;
1119
1120 if ((sdp->sd_ref == REF_REL_NEED) &&
1121 (sdp->sd_sym->st_shndx != SHN_UNDEF)) {
1122 /*
1123 * If auto-reduction/elimination is enabled, reduce any
1124 * non-versioned, and non-local capabilities global symbols.
1125 * A symbol is a candidate for auto-reduction/elimination if:
1126 *
1127 * - the symbol wasn't explicitly defined within a mapfile
1128 * (in which case all the necessary state has been applied
1129 * to the symbol), or
1130 * - the symbol isn't one of the family of reserved
1131 * special symbols (ie. _end, _etext, etc.), or
1132 * - the symbol isn't a SINGLETON, or
1133 * - the symbol wasn't explicitly defined within a version
1134 * definition associated with an input relocatable object.
1135 *
1136 * Indicate that the symbol has been reduced as it may be
1137 * necessary to print these symbols later.
1138 */
1139 if ((oflags & (FLG_OF_AUTOLCL | FLG_OF_AUTOELM)) &&
1140 ((sdp->sd_flags & MSK_SY_NOAUTO) == 0)) {
1141 if ((sdp->sd_flags & FLG_SY_HIDDEN) == 0) {
1142 sdp->sd_flags |=
1143 (FLG_SY_REDUCED | FLG_SY_HIDDEN);
1144 }
1145
1146 if (oflags & (FLG_OF_REDLSYM | FLG_OF_AUTOELM)) {
1147 sdp->sd_flags |= FLG_SY_ELIM;
1148 sym->st_other = STV_ELIMINATE |
1149 (sym->st_other & ~MSK_SYM_VISIBILITY);
1150 } else if (ELF_ST_VISIBILITY(sym->st_other) !=
1151 STV_INTERNAL)
1152 sym->st_other = STV_HIDDEN |
1153 (sym->st_other & ~MSK_SYM_VISIBILITY);
1154 }
1155
1156 /*
1157 * If -Bsymbolic is in effect, and the symbol hasn't explicitly
1158 * been defined nodirect (via a mapfile), then bind the global
1159 * symbol symbolically and assign the STV_PROTECTED visibility
1160 * attribute.
1161 */
1162 if ((oflags & FLG_OF_SYMBOLIC) &&
1163 ((sdp->sd_flags & (FLG_SY_HIDDEN | FLG_SY_NDIR)) == 0)) {
1164 sdp->sd_flags |= FLG_SY_PROTECT;
1165 if (ELF_ST_VISIBILITY(sym->st_other) == STV_DEFAULT)
1166 sym->st_other = STV_PROTECTED |
1167 (sym->st_other & ~MSK_SYM_VISIBILITY);
1168 }
1169 }
1170
1171 /*
1172 * Indicate that this symbol has had it's visibility checked so that
1173 * we don't need to do this investigation again.
1174 */
1175 sdp->sd_flags |= FLG_SY_VISIBLE;
1176 }
1177
1178 /*
1179 * Make sure a symbol definition is local to the object being built.
1180 */
1181 inline static int
1182 ensure_sym_local(Ofl_desc *ofl, Sym_desc *sdp, const char *str)
1183 {
1184 if (sdp->sd_sym->st_shndx == SHN_UNDEF) {
1185 if (str) {
1186 ld_eprintf(ofl, ERR_FATAL, MSG_INTL(MSG_SYM_UNDEF),
1187 str, demangle((char *)sdp->sd_name));
1188 }
1189 return (1);
1190 }
1191 if (sdp->sd_ref != REF_REL_NEED) {
1192 if (str) {
1193 ld_eprintf(ofl, ERR_FATAL, MSG_INTL(MSG_SYM_EXTERN),
1194 str, demangle((char *)sdp->sd_name),
1195 sdp->sd_file->ifl_name);
1196 }
1197 return (1);
1198 }
1199
1200 sdp->sd_flags |= FLG_SY_UPREQD;
1201 if (sdp->sd_isc) {
1202 sdp->sd_isc->is_flags |= FLG_IS_SECTREF;
1203 sdp->sd_isc->is_file->ifl_flags |= FLG_IF_FILEREF;
1204 }
1205 return (0);
1206 }
1207
1208 /*
1209 * Make sure all the symbol definitions required for initarray, finiarray, or
1210 * preinitarray's are local to the object being built.
1211 */
1212 static int
1213 ensure_array_local(Ofl_desc *ofl, APlist *apl, const char *str)
1214 {
1215 Aliste idx;
1216 Sym_desc *sdp;
1217 int ret = 0;
1218
1219 for (APLIST_TRAVERSE(apl, idx, sdp))
1220 ret += ensure_sym_local(ofl, sdp, str);
1221
1222 return (ret);
1223 }
1224
/*
 * After all symbol table input processing has been finished, and all relocation
 * counting has been carried out (ie. no more symbols will be read, generated,
 * or modified), validate and count the relevant entries:
 *
 *  -	check and print any undefined symbols remaining.  Note that if a symbol
 *	has been defined by virtue of the inclusion of an implicit shared
 *	library, it is still classed as undefined.
 *
 *  -	count the number of global needed symbols together with the size of
 *	their associated name strings (if scoping has been indicated these
 *	symbols may be reduced to locals).
 *
 *  -	establish the size and alignment requirements for the global .bss
 *	section (the alignment of this section is based on the first symbol
 *	that it will contain).
 *
 * Following the walk of the global symbols, this routine also finalizes the
 * register symbol list, creates the required bss sections, resolves the entry
 * point symbol, and verifies that any -zdtrace, initarray, finiarray and
 * preinitarray symbols are defined locally.
 *
 * entry:
 *	ofl - Output file descriptor.  Symbol counts, string tables, flags
 *		and the entry point recorded within it are updated.
 *
 * exit:
 *	Returns S_ERROR if a symbol copy, string table insertion or bss
 *	section creation fails, or if an entry point, dtrace or array symbol
 *	can not be validated.  Returns 1 if a fatal condition was flagged in
 *	ofl->ofl_flags during the symbol walk, leaving the remaining steps
 *	undone.  Otherwise returns the result of ld_vers_check_need() when
 *	dependency versioning must be recorded, or 1.
 */
uintptr_t
ld_sym_validate(Ofl_desc *ofl)
{
	Sym_avlnode	*sav;
	Sym_desc	*sdp;
	Sym		*sym;
	/* Snapshot of the output flags taken on entry. */
	ofl_flag_t	oflags = ofl->ofl_flags;
	/* Severity (0, FLG_OF_WARN or FLG_OF_FATAL) for each error class. */
	ofl_flag_t	undef = 0, needed = 0, verdesc = 0;
	Xword		bssalign = 0, tlsalign = 0;
	Boolean		need_bss, need_tlsbss;
	Xword		bsssize = 0, tlssize = 0;
#if defined(_ELF64)
	Xword		lbssalign = 0, lbsssize = 0;
	Boolean		need_lbss;
#endif
	int		ret, allow_ldynsym;
	uchar_t		type;
	/*
	 * State shared with sym_undef_entry() across calls.  It is tested
	 * below for FLG_OF_FATAL/FLG_OF_WARN, so it presumably accumulates
	 * the severities that have been reported -- confirm against
	 * sym_undef_entry().
	 */
	ofl_flag_t	undef_state = 0;

	DBG_CALL(Dbg_basic_validate(ofl->ofl_lml));

	/*
	 * The need_XXX booleans are used to determine whether we need to
	 * create each type of bss section. We used to create these sections
	 * if the sum of the required sizes for each type were non-zero.
	 * However, it is possible for a compiler to generate COMMON variables
	 * of zero-length and this tricks that logic --- even zero-length
	 * symbols need an output section.
	 */
	need_bss = need_tlsbss = FALSE;
#if defined(_ELF64)
	need_lbss = FALSE;
#endif

	/*
	 * Determine how undefined symbols are handled:
	 *
	 * fatal:
	 *	If this link-edit calls for no undefined symbols to remain
	 *	(this is the default case when generating an executable but
	 *	can be enforced for any object using -z defs), a fatal error
	 *	condition will be indicated.
	 *
	 * warning:
	 *	If we're creating a shared object, and either the -Bsymbolic
	 *	flag is set, or the user has turned on the -z guidance feature,
	 *	then a non-fatal warning is issued for each symbol.
	 *
	 * ignore:
	 *	In all other cases, undefined symbols are quietly allowed.
	 */
	if (oflags & FLG_OF_NOUNDEF) {
		undef = FLG_OF_FATAL;
	} else if (oflags & FLG_OF_SHAROBJ) {
		if ((oflags & FLG_OF_SYMBOLIC) ||
		    OFL_GUIDANCE(ofl, FLG_OFG_NO_DEFS))
			undef = FLG_OF_WARN;
	}

	/*
	 * If the symbol is referenced from an implicitly included shared object
	 * (ie. it's not on the NEEDED list) then the symbol is also classified
	 * as undefined and a fatal error condition will be indicated.
	 */
	if ((oflags & FLG_OF_NOUNDEF) || !(oflags & FLG_OF_SHAROBJ))
		needed = FLG_OF_FATAL;
	else if ((oflags & FLG_OF_SHAROBJ) &&
	    OFL_GUIDANCE(ofl, FLG_OFG_NO_DEFS))
		needed = FLG_OF_WARN;

	/*
	 * If the output image is being versioned, then all symbol definitions
	 * must be associated with a version.  Any symbol that isn't associated
	 * with a version is classified as undefined, and a fatal error
	 * condition is indicated.
	 */
	if ((oflags & FLG_OF_VERDEF) && (ofl->ofl_vercnt > VER_NDX_GLOBAL))
		verdesc = FLG_OF_FATAL;

	allow_ldynsym = OFL_ALLOW_LDYNSYM(ofl);

	if (allow_ldynsym) {
		/*
		 * Normally, we disallow symbols with 0 size from appearing
		 * in a dyn[sym|tls]sort section. However, there are some
		 * symbols that serve special purposes that we want to exempt
		 * from this rule. Look them up, and set their
		 * FLG_SY_DYNSORT flag.
		 */
		static const char *special[] = {
			MSG_ORIG(MSG_SYM_INIT_U),	/* _init */
			MSG_ORIG(MSG_SYM_FINI_U),	/* _fini */
			MSG_ORIG(MSG_SYM_START),	/* _start */
			NULL
		};
		int i;

		for (i = 0; special[i] != NULL; i++) {
			/*
			 * Only zero-sized instances need the exemption.  The
			 * symbol is passed through ld_sym_copy() before its
			 * flags are changed.
			 */
			if (((sdp = ld_sym_find(special[i],
			    SYM_NOHASH, NULL, ofl)) != NULL) &&
			    (sdp->sd_sym->st_size == 0)) {
				if (ld_sym_copy(sdp) == S_ERROR)
					return (S_ERROR);
				sdp->sd_flags |= FLG_SY_DYNSORT;
			}
		}
	}

	/*
	 * Collect and validate the globals from the internal symbol table.
	 */
	for (sav = avl_first(&ofl->ofl_symavl); sav;
	    sav = AVL_NEXT(&ofl->ofl_symavl, sav)) {
		Is_desc	*isp;
		/* Set once an UNDEF diagnostic is issued for this symbol. */
		int	undeferr = 0;
		uchar_t	vis;

		sdp = sav->sav_sdp;

		/*
		 * If undefined symbols are allowed, and we're not being
		 * asked to supply guidance, ignore any symbols that are
		 * not needed.
		 */
		if (!(oflags & FLG_OF_NOUNDEF) &&
		    !OFL_GUIDANCE(ofl, FLG_OFG_NO_DEFS) &&
		    (sdp->sd_ref == REF_DYN_SEEN))
			continue;

		/*
		 * If the symbol originates from an external or parent mapfile
		 * reference and hasn't been matched to a reference from a
		 * relocatable object, ignore it.
		 */
		if ((sdp->sd_flags & (FLG_SY_EXTERN | FLG_SY_PARENT)) &&
		    ((sdp->sd_flags & FLG_SY_MAPUSED) == 0)) {
			sdp->sd_flags |= FLG_SY_INVALID;
			continue;
		}

		sym = sdp->sd_sym;
		type = ELF_ST_TYPE(sym->st_info);

		/*
		 * Sanity check TLS.  A defined, non-COMMON TLS symbol of
		 * non-zero size must be backed by an input section that
		 * carries the SHF_TLS flag.
		 */
		if ((type == STT_TLS) && (sym->st_size != 0) &&
		    (sym->st_shndx != SHN_UNDEF) &&
		    (sym->st_shndx != SHN_COMMON)) {
			/*
			 * NOTE: this declaration shadows the loop-scope isp
			 * for the extent of this block only.
			 */
			Is_desc		*isp = sdp->sd_isc;
			Ifl_desc	*ifl = sdp->sd_file;

			if ((isp == NULL) || (isp->is_shdr == NULL) ||
			    ((isp->is_shdr->sh_flags & SHF_TLS) == 0)) {
				ld_eprintf(ofl, ERR_FATAL,
				    MSG_INTL(MSG_SYM_TLS),
				    demangle(sdp->sd_name), ifl->ifl_name);
				continue;
			}
		}

		/*
		 * Apply any visibility reduction that has not yet been
		 * determined for this symbol.
		 */
		if ((sdp->sd_flags & FLG_SY_VISIBLE) == 0)
			ld_sym_adjust_vis(sdp, ofl);

		if ((sdp->sd_flags & FLG_SY_REDUCED) &&
		    (oflags & FLG_OF_PROCRED)) {
			DBG_CALL(Dbg_syms_reduce(ofl, DBG_SYM_REDUCE_GLOBAL,
			    sdp, 0, 0));
		}

		/*
		 * Record any STV_SINGLETON existence.
		 */
		if ((vis = ELF_ST_VISIBILITY(sym->st_other)) == STV_SINGLETON)
			ofl->ofl_dtflags_1 |= DF_1_SINGLETON;

		/*
		 * If building a shared object or executable, and this is a
		 * non-weak UNDEF symbol with reduced visibility (STV_*), then
		 * give a fatal error.
		 */
		if (((oflags & FLG_OF_RELOBJ) == 0) &&
		    (sym->st_shndx == SHN_UNDEF) &&
		    (ELF_ST_BIND(sym->st_info) != STB_WEAK)) {
			if (vis && (vis != STV_SINGLETON)) {
				sym_undef_entry(ofl, sdp, BNDLOCAL,
				    FLG_OF_FATAL, &undef_state);
				continue;
			}
		}

		/*
		 * If this symbol is defined in a non-allocatable section,
		 * reduce it to local symbol.
		 */
		if (((isp = sdp->sd_isc) != 0) && isp->is_shdr &&
		    ((isp->is_shdr->sh_flags & SHF_ALLOC) == 0)) {
			sdp->sd_flags |= (FLG_SY_REDUCED | FLG_SY_HIDDEN);
		}

		/*
		 * If this symbol originated as a SHN_SUNW_IGNORE, it will have
		 * been processed as an SHN_UNDEF.  Return the symbol to its
		 * original index for validation, and propagation to the output
		 * file.
		 */
		if (sdp->sd_flags & FLG_SY_IGNORE)
			sdp->sd_shndx = SHN_SUNW_IGNORE;

		if (undef) {
			/*
			 * If a non-weak reference remains undefined, or if a
			 * mapfile reference is not bound to the relocatable
			 * objects that make up the object being built, we have
			 * a fatal error.
			 *
			 * The exceptions are symbols which are defined to be
			 * found in the parent (FLG_SY_PARENT), which is really
			 * only meaningful for direct binding, or are defined
			 * external (FLG_SY_EXTERN) so as to suppress -zdefs
			 * errors.
			 *
			 * Register symbols are always allowed to be UNDEF.
			 *
			 * Note that we don't include references created via -u
			 * in the same shared object binding test.  This is for
			 * backward compatibility, in that a number of archive
			 * makefile rules used -u to cause archive extraction.
			 * These same rules have been cut and pasted to apply
			 * to shared objects, and thus although the -u reference
			 * is redundant, flagging it as fatal could cause some
			 * build to fail.  Also we have documented the use of
			 * -u as a mechanism to cause binding to weak version
			 * definitions, thus giving users an error condition
			 * would be incorrect.
			 *
			 * The diagnostic is issued at the severity held in
			 * undef, which may be a warning rather than fatal.
			 * Within the test, && binds tighter than ||, so the
			 * register symbol exemption covers both the undefined
			 * reference case and the unbound mapfile reference
			 * case.
			 */
			if (!(sdp->sd_flags & FLG_SY_REGSYM) &&
			    ((sym->st_shndx == SHN_UNDEF) &&
			    ((ELF_ST_BIND(sym->st_info) != STB_WEAK) &&
			    ((sdp->sd_flags &
			    (FLG_SY_PARENT | FLG_SY_EXTERN)) == 0)) ||
			    ((sdp->sd_flags &
			    (FLG_SY_MAPREF | FLG_SY_MAPUSED | FLG_SY_HIDDEN |
			    FLG_SY_PROTECT)) == FLG_SY_MAPREF))) {
				sym_undef_entry(ofl, sdp, UNDEF, undef,
				    &undef_state);
				undeferr = 1;
			}

		} else {
			/*
			 * For building things like shared objects (or anything
			 * -znodefs), undefined symbols are allowed.
			 *
			 * If a mapfile reference remains undefined the user
			 * would probably like a warning at least (they've
			 * usually mis-spelt the reference).  Refer to the above
			 * comments for discussion on -u references, which
			 * are not tested for in the same manner.
			 */
			if ((sdp->sd_flags &
			    (FLG_SY_MAPREF | FLG_SY_MAPUSED)) ==
			    FLG_SY_MAPREF) {
				sym_undef_entry(ofl, sdp, UNDEF, FLG_OF_WARN,
				    &undef_state);
				undeferr = 1;
			}
		}

		/*
		 * If this symbol comes from a dependency mark the dependency
		 * as required (-z ignore can result in unused dependencies
		 * being dropped).  If we need to record dependency versioning
		 * information indicate what version of the needed shared object
		 * this symbol is part of.  Flag the symbol as undefined if it
		 * has not been made available to us.
		 */
		if ((sdp->sd_ref == REF_DYN_NEED) &&
		    (!(sdp->sd_flags & FLG_SY_REFRSD))) {
			sdp->sd_file->ifl_flags |= FLG_IF_DEPREQD;

			/*
			 * Capture that we've bound to a symbol that doesn't
			 * allow being directly bound to.
			 */
			if (sdp->sd_flags & FLG_SY_NDIR)
				ofl->ofl_flags1 |= FLG_OF1_NGLBDIR;

			if (sdp->sd_file->ifl_vercnt) {
				int		vndx;
				Ver_index	*vip;

				/*
				 * NOTE(review): sd_aux is dereferenced without
				 * a NULL test here; presumably it is always
				 * present for a symbol bound to a versioned
				 * dependency -- confirm.
				 */
				vndx = sdp->sd_aux->sa_dverndx;
				vip = &sdp->sd_file->ifl_verndx[vndx];
				if (vip->vi_flags & FLG_VER_AVAIL) {
					vip->vi_flags |= FLG_VER_REFER;
				} else {
					sym_undef_entry(ofl, sdp, NOTAVAIL,
					    FLG_OF_FATAL, &undef_state);
					continue;
				}
			}
		}

		/*
		 * Test that we do not bind to symbol supplied from an implicit
		 * shared object.  If a binding is from a weak reference it can
		 * be ignored.  Nothing is reported if an UNDEF diagnostic has
		 * already been issued for this symbol.
		 */
		if (needed && !undeferr && (sdp->sd_flags & FLG_SY_GLOBREF) &&
		    (sdp->sd_ref == REF_DYN_NEED) &&
		    (sdp->sd_flags & FLG_SY_NOTAVAIL)) {
			sym_undef_entry(ofl, sdp, IMPLICIT, needed,
			    &undef_state);
			if (needed == FLG_OF_FATAL)
				continue;
		}

		/*
		 * Test that a symbol isn't going to be reduced to local scope
		 * which actually wants to bind to a shared object - if so it's
		 * a fatal error.
		 */
		if ((sdp->sd_ref == REF_DYN_NEED) &&
		    (sdp->sd_flags & (FLG_SY_HIDDEN | FLG_SY_PROTECT))) {
			sym_undef_entry(ofl, sdp, BNDLOCAL, FLG_OF_FATAL,
			    &undef_state);
			continue;
		}

		/*
		 * If the output image is to be versioned then all symbol
		 * definitions must be associated with a version.  Remove any
		 * versioning that might be left associated with an undefined
		 * symbol.
		 */
		if (verdesc && (sdp->sd_ref == REF_REL_NEED)) {
			if (sym->st_shndx == SHN_UNDEF) {
				if (sdp->sd_aux && sdp->sd_aux->sa_overndx)
					sdp->sd_aux->sa_overndx = 0;
			} else {
				if (!SYM_IS_HIDDEN(sdp) && sdp->sd_aux &&
				    (sdp->sd_aux->sa_overndx == 0)) {
					sym_undef_entry(ofl, sdp, NOVERSION,
					    verdesc, &undef_state);
					continue;
				}
			}
		}

		/*
		 * If we don't need the symbol there's no need to process it
		 * any further.
		 */
		if (sdp->sd_ref == REF_DYN_SEEN)
			continue;

		/*
		 * Calculate the size and alignment requirements for the global
		 * .bss and .tls sections.  If we're building a relocatable
		 * object only account for scoped COMMON symbols (these will
		 * be converted to .bss references).
		 *
		 * When -z nopartial is in effect, partially initialized
		 * symbols are directed to the special .data section
		 * created for that purpose (ofl->ofl_isparexpn).
		 * Otherwise, partially initialized symbols go to .bss.
		 *
		 * Also refer to make_mvsections() in sunwmove.c
		 *
		 * For a COMMON symbol, st_value is used as the alignment: the
		 * running size is rounded up to it before the symbol's size
		 * is added, and the largest value seen becomes the section
		 * alignment.
		 */
		if ((sym->st_shndx == SHN_COMMON) &&
		    (((oflags & FLG_OF_RELOBJ) == 0) ||
		    (SYM_IS_HIDDEN(sdp) && (oflags & FLG_OF_PROCRED)))) {
			if ((sdp->sd_move == NULL) ||
			    ((sdp->sd_flags & FLG_SY_PAREXPN) == 0)) {
				if (type != STT_TLS) {
					need_bss = TRUE;
					bsssize = (Xword)S_ROUND(bsssize,
					    sym->st_value) + sym->st_size;
					if (sym->st_value > bssalign)
						bssalign = sym->st_value;
				} else {
					need_tlsbss = TRUE;
					tlssize = (Xword)S_ROUND(tlssize,
					    sym->st_value) + sym->st_size;
					if (sym->st_value > tlsalign)
						tlsalign = sym->st_value;
				}
			}
		}

#if defined(_ELF64)
		/*
		 * Calculate the size and alignment requirement for the global
		 * .lbss. TLS or partially initialized symbols do not need to be
		 * considered yet.
		 */
		if ((ld_targ.t_m.m_mach == EM_AMD64) &&
		    (sym->st_shndx == SHN_X86_64_LCOMMON)) {
			need_lbss = TRUE;
			lbsssize = (Xword)S_ROUND(lbsssize, sym->st_value) +
			    sym->st_size;
			if (sym->st_value > lbssalign)
				lbssalign = sym->st_value;
		}
#endif
		/*
		 * If a symbol was referenced via the command line
		 * (ld -u <>, ...), then this counts as a reference against the
		 * symbol. Mark any section that symbol is defined in.
		 */
		if (((isp = sdp->sd_isc) != 0) &&
		    (sdp->sd_flags & FLG_SY_CMDREF)) {
			isp->is_flags |= FLG_IS_SECTREF;
			isp->is_file->ifl_flags |= FLG_IF_FILEREF;
		}

		/*
		 * Update the symbol count and the associated name string size.
		 * Note, a capabilities symbol must remain as visible as a
		 * global symbol.  However, the runtime linker recognizes the
		 * hidden requirement and ensures the symbol isn't made globally
		 * available at runtime.
		 */
		if (SYM_IS_HIDDEN(sdp) && (oflags & FLG_OF_PROCRED)) {
			/*
			 * If any reductions are being processed, keep a count
			 * of eliminated symbols, and if the symbol is being
			 * reduced to local, count its size for the .symtab.
			 */
			if (sdp->sd_flags & FLG_SY_ELIM) {
				ofl->ofl_elimcnt++;
			} else {
				ofl->ofl_scopecnt++;
				/*
				 * A register symbol only contributes a name
				 * string if it actually has a name.
				 */
				if ((((sdp->sd_flags & FLG_SY_REGSYM) == 0) ||
				    sym->st_name) && (st_insert(ofl->ofl_strtab,
				    sdp->sd_name) == -1))
					return (S_ERROR);
				if (allow_ldynsym && sym->st_name &&
				    ldynsym_symtype[type]) {
					ofl->ofl_dynscopecnt++;
					if (st_insert(ofl->ofl_dynstrtab,
					    sdp->sd_name) == -1)
						return (S_ERROR);
					/* Include it in sort section? */
					DYNSORT_COUNT(sdp, sym, type, ++);
				}
			}
		} else {
			ofl->ofl_globcnt++;

			/*
			 * Check to see if this global variable should go into
			 * a sort section. Sort sections require a
			 * .SUNW_ldynsym section, so, don't check unless a
			 * .SUNW_ldynsym is allowed.
			 */
			if (allow_ldynsym)
				DYNSORT_COUNT(sdp, sym, type, ++);

			/*
			 * If global direct bindings are in effect, or this
			 * symbol has bound to a dependency which was specified
			 * as requiring direct bindings, and it hasn't
			 * explicitly been defined as a non-direct binding
			 * symbol, mark it.
			 */
			if (((ofl->ofl_dtflags_1 & DF_1_DIRECT) || (isp &&
			    (isp->is_file->ifl_flags & FLG_IF_DIRECT))) &&
			    ((sdp->sd_flags & FLG_SY_NDIR) == 0))
				sdp->sd_flags |= FLG_SY_DIR;

			/*
			 * Insert the symbol name.  The dynamic string table is
			 * only populated when the output is not a relocatable
			 * object.
			 */
			if (((sdp->sd_flags & FLG_SY_REGSYM) == 0) ||
			    sym->st_name) {
				if (st_insert(ofl->ofl_strtab,
				    sdp->sd_name) == -1)
					return (S_ERROR);

				if (!(ofl->ofl_flags & FLG_OF_RELOBJ) &&
				    (st_insert(ofl->ofl_dynstrtab,
				    sdp->sd_name) == -1))
					return (S_ERROR);
			}

			/*
			 * If this section offers a global symbol - record that
			 * fact.
			 */
			if (isp) {
				isp->is_flags |= FLG_IS_SECTREF;
				isp->is_file->ifl_flags |= FLG_IF_FILEREF;
			}
		}
	}

	/*
	 * Guidance: Use -z defs|nodefs when building shared objects.
	 *
	 * Our caller issues this, unless we mask it out here. So we mask it
	 * out unless we've issued at least one warning or fatal error.
	 */
	if (!((oflags & FLG_OF_SHAROBJ) && OFL_GUIDANCE(ofl, FLG_OFG_NO_DEFS) &&
	    (undef_state & (FLG_OF_FATAL | FLG_OF_WARN))))
		ofl->ofl_guideflags |= FLG_OFG_NO_DEFS;

	/*
	 * If we've encountered a fatal error during symbol validation then
	 * return now.
	 *
	 * The live ofl->ofl_flags is tested here rather than the oflags
	 * snapshot taken on entry, as the snapshot can not reflect a flag set
	 * while this routine was running (presumably by the error reporting
	 * routines called above -- confirm).
	 */
	if (ofl->ofl_flags & FLG_OF_FATAL)
		return (1);

	/*
	 * Now that symbol resolution is completed, scan any register symbols.
	 * From now on, we're only interested in those that contribute to the
	 * output file.
	 */
	if (ofl->ofl_regsyms) {
		int	ndx;

		for (ndx = 0; ndx < ofl->ofl_regsymsno; ndx++) {
			if ((sdp = ofl->ofl_regsyms[ndx]) == NULL)
				continue;
			/*
			 * Drop any register symbol that is not needed from a
			 * relocatable object.
			 */
			if (sdp->sd_ref != REF_REL_NEED) {
				ofl->ofl_regsyms[ndx] = NULL;
				continue;
			}

			ofl->ofl_regsymcnt++;
			if (sdp->sd_sym->st_name == 0)
				sdp->sd_name = MSG_ORIG(MSG_STR_EMPTY);

			if (SYM_IS_HIDDEN(sdp) ||
			    (ELF_ST_BIND(sdp->sd_sym->st_info) == STB_LOCAL))
				ofl->ofl_lregsymcnt++;
		}
	}

	/*
	 * Generate the .bss section now that we know its size and alignment.
	 */
	if (need_bss) {
		if (ld_make_bss(ofl, bsssize, bssalign,
		    ld_targ.t_id.id_bss) == S_ERROR)
			return (S_ERROR);
	}
	if (need_tlsbss) {
		if (ld_make_bss(ofl, tlssize, tlsalign,
		    ld_targ.t_id.id_tlsbss) == S_ERROR)
			return (S_ERROR);
	}
#if defined(_ELF64)
	/*
	 * The .lbss section is only created for amd64, and is not created
	 * for a relocatable object.
	 */
	if ((ld_targ.t_m.m_mach == EM_AMD64) &&
	    need_lbss && !(oflags & FLG_OF_RELOBJ)) {
		if (ld_make_bss(ofl, lbsssize, lbssalign,
		    ld_targ.t_id.id_lbss) == S_ERROR)
			return (S_ERROR);
	}
#endif
	/*
	 * Determine what entry point symbol we need, and if found save its
	 * symbol descriptor so that we can update the ELF header entry with the
	 * symbols value later (see update_oehdr).  Make sure the symbol is
	 * tagged to ensure its update in case -s is in effect.  Use any -e
	 * option first, or the default entry points `_start' and `main'.
	 *
	 * Note that ofl_entry changes meaning here: on entry it is used as
	 * the entry symbol's name, and on success it is overwritten with a
	 * pointer to the matching symbol descriptor.  The default entry
	 * points are probed silently (no diagnostic string is supplied), and
	 * failing to find either is not treated as an error.
	 */
	ret = 0;
	if (ofl->ofl_entry) {
		if ((sdp = ld_sym_find(ofl->ofl_entry, SYM_NOHASH,
		    NULL, ofl)) == NULL) {
			ld_eprintf(ofl, ERR_FATAL, MSG_INTL(MSG_ARG_NOENTRY),
			    ofl->ofl_entry);
			ret++;
		} else if (ensure_sym_local(ofl, sdp,
		    MSG_INTL(MSG_SYM_ENTRY)) != 0) {
			ret++;
		} else {
			ofl->ofl_entry = (void *)sdp;
		}
	} else if (((sdp = ld_sym_find(MSG_ORIG(MSG_SYM_START),
	    SYM_NOHASH, NULL, ofl)) != NULL) && (ensure_sym_local(ofl,
	    sdp, 0) == 0)) {
		ofl->ofl_entry = (void *)sdp;

	} else if (((sdp = ld_sym_find(MSG_ORIG(MSG_SYM_MAIN),
	    SYM_NOHASH, NULL, ofl)) != NULL) && (ensure_sym_local(ofl,
	    sdp, 0) == 0)) {
		ofl->ofl_entry = (void *)sdp;
	}

	/*
	 * If ld -zdtrace=<sym> was given, then validate that the symbol is
	 * defined within the current object being built.
	 */
	if ((sdp = ofl->ofl_dtracesym) != 0)
		ret += ensure_sym_local(ofl, sdp, MSG_ORIG(MSG_STR_DTRACE));

	/*
	 * If any initarray, finiarray or preinitarray functions have been
	 * requested, make sure they are defined within the current object
	 * being built.
	 */
	if (ofl->ofl_initarray) {
		ret += ensure_array_local(ofl, ofl->ofl_initarray,
		    MSG_ORIG(MSG_SYM_INITARRAY));
	}
	if (ofl->ofl_finiarray) {
		ret += ensure_array_local(ofl, ofl->ofl_finiarray,
		    MSG_ORIG(MSG_SYM_FINIARRAY));
	}
	if (ofl->ofl_preiarray) {
		ret += ensure_array_local(ofl, ofl->ofl_preiarray,
		    MSG_ORIG(MSG_SYM_PREINITARRAY));
	}

	/*
	 * All of the above checks are carried out before failing, so that
	 * every offending symbol is reported in a single link-edit.
	 */
	if (ret)
		return (S_ERROR);

	/*
	 * If we're required to record any needed dependencies versioning
	 * information calculate it now that all symbols have been validated.
	 */
	if ((oflags & (FLG_OF_VERNEED | FLG_OF_NOVERSEC)) == FLG_OF_VERNEED)
		return (ld_vers_check_need(ofl));
	else
		return (1);
}
1872
1873 /*
1874 * qsort(3c) comparison function. As an optimization for associating weak
1875 * symbols to their strong counterparts sort global symbols according to their
1876 * section index, address and binding.
1877 */
1878 static int
1879 compare(const void *sdpp1, const void *sdpp2)
1880 {
1881 Sym_desc *sdp1 = *((Sym_desc **)sdpp1);
1882 Sym_desc *sdp2 = *((Sym_desc **)sdpp2);
1883 Sym *sym1, *sym2;
1884 uchar_t bind1, bind2;
1885
1886 /*
1887 * Symbol descriptors may be zero, move these to the front of the
1888 * sorted array.
1889 */
1890 if (sdp1 == NULL)
1891 return (-1);
1892 if (sdp2 == NULL)
1893 return (1);
1894
1895 sym1 = sdp1->sd_sym;
1896 sym2 = sdp2->sd_sym;
1897
1898 /*
1899 * Compare the symbols section index. This is important when sorting
1900 * the symbol tables of relocatable objects. In this case, a symbols
1901 * value is the offset within the associated section, and thus many
1902 * symbols can have the same value, but are effectively different
1903 * addresses.
1904 */
1905 if (sym1->st_shndx > sym2->st_shndx)
1906 return (1);
1907 if (sym1->st_shndx < sym2->st_shndx)
1908 return (-1);
1909
1910 /*
1911 * Compare the symbols value (address).
1912 */
1913 if (sym1->st_value > sym2->st_value)
1914 return (1);
1915 if (sym1->st_value < sym2->st_value)
1916 return (-1);
1917
1918 bind1 = ELF_ST_BIND(sym1->st_info);
1919 bind2 = ELF_ST_BIND(sym2->st_info);
1920
1921 /*
1922 * If two symbols have the same address place the weak symbol before
1923 * any strong counterpart.
1924 */
1925 if (bind1 > bind2)
1926 return (-1);
1927 if (bind1 < bind2)
1928 return (1);
1929
1930 return (0);
1931 }
1932
1933 /*
1934 * Issue a MSG_SYM_BADADDR error from ld_sym_process(). This error
1935 * is issued when a symbol address/size is not contained by the
1936 * target section.
1937 *
1938 * Such objects are at least partially corrupt, and the user would
1939 * be well advised to be skeptical of them, and to ask their compiler
1940 * supplier to fix the problem. However, a distinction needs to be
1941 * made between symbols that reference readonly text, and those that
1942 * access writable data. Other than throwing off profiling results,
1943 * the readonly section case is less serious. We have encountered
1944 * such objects in the field. In order to allow existing objects
1945 * to continue working, we issue a warning rather than a fatal error
1946 * if the symbol is against readonly text. Other cases are fatal.
1947 */
1948 static void
1949 issue_badaddr_msg(Ifl_desc *ifl, Ofl_desc *ofl, Sym_desc *sdp,
1950 Sym *sym, Word shndx)
1951 {
1952 Error err;
1953 const char *msg;
1954
1955 if ((sdp->sd_isc->is_shdr->sh_flags & (SHF_WRITE | SHF_ALLOC)) ==
1956 SHF_ALLOC) {
1957 msg = MSG_INTL(MSG_SYM_BADADDR_ROTXT);
1958 err = ERR_WARNING;
1959 } else {
1960 msg = MSG_INTL(MSG_SYM_BADADDR);
1961 err = ERR_FATAL;
1962 }
1963
1964 ld_eprintf(ofl, err, msg, demangle(sdp->sd_name),
1965 ifl->ifl_name, shndx, sdp->sd_isc->is_name,
1966 EC_XWORD(sdp->sd_isc->is_shdr->sh_size),
1967 EC_XWORD(sym->st_value), EC_XWORD(sym->st_size));
1968 }
1969
/*
 * Global symbols that are candidates for translation to local capability
 * symbols under -z symbolcap, are maintained on a local symbol list.  Once
 * all symbols of a file are processed, this list is traversed to cull any
 * unnecessary weak symbol aliases.
 *
 * Each Cap_pair is one entry of that list.  It associates the original
 * symbol with the new lead symbol (presumably the one created to take its
 * place -- confirm against the code that builds the list), and records the
 * capability group and symbol index involved.
 */
typedef struct {
	Sym_desc	*c_nsdp;	/* new lead symbol */
	Sym_desc	*c_osdp;	/* original symbol */
	Cap_group	*c_group;	/* symbol capability group */
	Word		c_ndx;		/* symbol index */
} Cap_pair;
1982
1983 /*
1984 * Process the symbol table for the specified input file. At this point all
1985 * input sections from this input file have been assigned an input section
1986 * descriptor which is saved in the `ifl_isdesc' array.
1987 *
1988 * - local symbols are saved (as is) if the input file is a relocatable
1989 * object
1990 *
1991 * - global symbols are added to the linker's internal symbol table if they
1992 * are not already present, otherwise a symbol resolution function is
1993 * called upon to resolve the conflict.
1994 */
1995 uintptr_t
1996 ld_sym_process(Is_desc *isc, Ifl_desc *ifl, Ofl_desc *ofl)
1997 {
/*
 * This macro tests the given symbol to see if it is out of
 * range relative to the section it references.
 *
 * entry:
 *	- ifl is a relative object (ET_REL)
 *	_sdp - Symbol descriptor
 *	_sym - Symbol
 *	_type - Symbol type
 *
 * The following are tested:
 *	- Symbol length is non-zero
 *	- Symbol type is a type that references code or data
 *	- Referenced section is not 0 (indicates an UNDEF symbol)
 *	  and is not in the range of special values above SHN_LORESERVE
 *	  (excluding SHN_XINDEX, which is OK).
 *	- We have a valid section header for the target section
 *
 * If the above are all true, and the symbol position is not
 * contained by the target section, this macro evaluates to
 * True (1). Otherwise, False (0).
 *
 * The containment test is written as two comparisons rather than as
 * (st_value + st_size) > sh_size, so that a corrupt symbol whose
 * value and size wrap around when added is still reported as bad.
 *
 * Every argument is parenthesized in the expansion, but each one is
 * evaluated more than once, so arguments must not have side effects.
 */
#define	SYM_LOC_BADADDR(_sdp, _sym, _type) \
	((_sym)->st_size && dynsymsort_symtype[(_type)] && \
	((_sym)->st_shndx != SHN_UNDEF) && \
	(((_sym)->st_shndx < SHN_LORESERVE) || \
	((_sym)->st_shndx == SHN_XINDEX)) && \
	(_sdp)->sd_isc && (_sdp)->sd_isc->is_shdr && \
	(((_sym)->st_value > (_sdp)->sd_isc->is_shdr->sh_size) || \
	((_sym)->st_size > \
	((_sdp)->sd_isc->is_shdr->sh_size - (_sym)->st_value))))
2027
2028 Conv_inv_buf_t inv_buf;
2029 Sym *sym = (Sym *)isc->is_indata->d_buf;
2030 Word *symshndx = NULL;
2031 Shdr *shdr = isc->is_shdr;
2032 Sym_desc *sdp;
2033 size_t strsize;
2034 char *strs;
2035 uchar_t type, bind;
2036 Word ndx, hash, local, total;
2037 uchar_t osabi = ifl->ifl_ehdr->e_ident[EI_OSABI];
2038 Half mach = ifl->ifl_ehdr->e_machine;
2039 Half etype = ifl->ifl_ehdr->e_type;
2040 int etype_rel;
2041 const char *symsecname, *strsecname;
2042 Word symsecndx;
2043 avl_index_t where;
2044 int test_gnu_hidden_bit, weak;
2045 Cap_desc *cdp = NULL;
2046 Alist *cappairs = NULL;
2047
2048 /*
2049 * It's possible that a file may contain more than one symbol table,
2050 * ie. .dynsym and .symtab in a shared library. Only process the first
2051 * table (here, we assume .dynsym comes before .symtab).
2052 */
2053 if (ifl->ifl_symscnt)
2054 return (1);
2055
2056 if (isc->is_symshndx)
2057 symshndx = isc->is_symshndx->is_indata->d_buf;
2058
2059 DBG_CALL(Dbg_syms_process(ofl->ofl_lml, ifl));
2060
2061 symsecndx = isc->is_scnndx;
2062 if (isc->is_name)
2063 symsecname = isc->is_name;
2064 else
2065 symsecname = MSG_ORIG(MSG_STR_EMPTY);
2066
2067 /*
2068 * From the symbol tables section header information determine which
2069 * strtab table is needed to locate the actual symbol names.
2070 */
2071 if (ifl->ifl_flags & FLG_IF_HSTRTAB) {
2072 ndx = shdr->sh_link;
2073 if ((ndx == 0) || (ndx >= ifl->ifl_shnum)) {
2074 ld_eprintf(ofl, ERR_FATAL,
2075 MSG_INTL(MSG_FIL_INVSHLINK), ifl->ifl_name,
2076 EC_WORD(symsecndx), symsecname, EC_XWORD(ndx));
2077 return (S_ERROR);
2078 }
2079 strsize = ifl->ifl_isdesc[ndx]->is_shdr->sh_size;
2080 strs = ifl->ifl_isdesc[ndx]->is_indata->d_buf;
2081 if (ifl->ifl_isdesc[ndx]->is_name)
2082 strsecname = ifl->ifl_isdesc[ndx]->is_name;
2083 else
2084 strsecname = MSG_ORIG(MSG_STR_EMPTY);
2085 } else {
2086 /*
2087 * There is no string table section in this input file
2088 * although there are symbols in this symbol table section.
2089 * This means that these symbols do not have names.
2090 * Currently, only scratch register symbols are allowed
2091 * not to have names.
2092 */
2093 strsize = 0;
2094 strs = (char *)MSG_ORIG(MSG_STR_EMPTY);
2095 strsecname = MSG_ORIG(MSG_STR_EMPTY);
2096 }
2097
2098 /*
2099 * Determine the number of local symbols together with the total
2100 * number we have to process.
2101 */
2102 total = (Word)(shdr->sh_size / shdr->sh_entsize);
2103 local = shdr->sh_info;
2104
2105 /*
2106 * Allocate a symbol table index array and a local symbol array
2107 * (global symbols are processed and added to the ofl->ofl_symbkt[]
2108 * array). If we are dealing with a relocatable object, allocate the
2109 * local symbol descriptors. If this isn't a relocatable object we
2110 * still have to process any shared object locals to determine if any
2111 * register symbols exist. Although these aren't added to the output
2112 * image, they are used as part of symbol resolution.
2113 */
2114 if ((ifl->ifl_oldndx = libld_malloc((size_t)(total *
2115 sizeof (Sym_desc *)))) == NULL)
2116 return (S_ERROR);
2117 etype_rel = (etype == ET_REL);
2118 if (etype_rel && local) {
2119 if ((ifl->ifl_locs =
2120 libld_calloc(sizeof (Sym_desc), local)) == NULL)
2121 return (S_ERROR);
2122 /* LINTED */
2123 ifl->ifl_locscnt = (Word)local;
2124 }
2125 ifl->ifl_symscnt = total;
2126
2127 /*
2128 * If there are local symbols to save add them to the symbol table
2129 * index array.
2130 */
2131 if (local) {
2132 int allow_ldynsym = OFL_ALLOW_LDYNSYM(ofl);
2133 Sym_desc *last_file_sdp = NULL;
2134 int last_file_ndx = 0;
2135
2136 for (sym++, ndx = 1; ndx < local; sym++, ndx++) {
2137 sd_flag_t sdflags = FLG_SY_CLEAN;
2138 Word shndx;
2139 const char *name;
2140 Sym_desc *rsdp;
2141 int shndx_bad = 0;
2142 int symtab_enter = 1;
2143
2144 /*
2145 * Determine and validate the associated section index.
2146 */
2147 if (symshndx && (sym->st_shndx == SHN_XINDEX)) {
2148 shndx = symshndx[ndx];
2149 } else if ((shndx = sym->st_shndx) >= SHN_LORESERVE) {
2150 sdflags |= FLG_SY_SPECSEC;
2151 } else if (shndx > ifl->ifl_shnum) {
2152 /* We need the name before we can issue error */
2153 shndx_bad = 1;
2154 }
2155
2156 /*
2157 * Check if st_name has a valid value or not.
2158 */
2159 if ((name = string(ofl, ifl, sym, strs, strsize, ndx,
2160 shndx, symsecndx, symsecname, strsecname,
2161 &sdflags)) == NULL)
2162 continue;
2163
2164 /*
2165 * Now that we have the name, if the section index
2166 * was bad, report it.
2167 */
2168 if (shndx_bad) {
2169 ld_eprintf(ofl, ERR_WARNING,
2170 MSG_INTL(MSG_SYM_INVSHNDX),
2171 demangle_symname(name, symsecname, ndx),
2172 ifl->ifl_name,
2173 conv_sym_shndx(osabi, mach, sym->st_shndx,
2174 CONV_FMT_DECIMAL, &inv_buf));
2175 continue;
2176 }
2177
2178 /*
2179 * If this local symbol table originates from a shared
2180 * object, then we're only interested in recording
2181 * register symbols. As local symbol descriptors aren't
2182 * allocated for shared objects, one will be allocated
2183 * to associate with the register symbol. This symbol
2184 * won't become part of the output image, but we must
2185 * process it to test for register conflicts.
2186 */
2187 rsdp = sdp = NULL;
2188 if (sdflags & FLG_SY_REGSYM) {
2189 /*
2190 * The presence of FLG_SY_REGSYM means that
2191 * the pointers in ld_targ.t_ms are non-NULL.
2192 */
2193 rsdp = (*ld_targ.t_ms.ms_reg_find)(sym, ofl);
2194 if (rsdp != 0) {
2195 /*
2196 * The fact that another register def-
2197 * inition has been found is fatal.
2198 * Call the verification routine to get
2199 * the error message and move on.
2200 */
2201 (void) (*ld_targ.t_ms.ms_reg_check)
2202 (rsdp, sym, name, ifl, ofl);
2203 continue;
2204 }
2205
2206 if (etype == ET_DYN) {
2207 if ((sdp = libld_calloc(
2208 sizeof (Sym_desc), 1)) == NULL)
2209 return (S_ERROR);
2210 sdp->sd_ref = REF_DYN_SEEN;
2211
2212 /* Will not appear in output object */
2213 symtab_enter = 0;
2214 }
2215 } else if (etype == ET_DYN)
2216 continue;
2217
2218 /*
2219 * Fill in the remaining symbol descriptor information.
2220 */
2221 if (sdp == NULL) {
2222 sdp = &(ifl->ifl_locs[ndx]);
2223 sdp->sd_ref = REF_REL_NEED;
2224 sdp->sd_symndx = ndx;
2225 }
2226 if (rsdp == NULL) {
2227 sdp->sd_name = name;
2228 sdp->sd_sym = sym;
2229 sdp->sd_shndx = shndx;
2230 sdp->sd_flags = sdflags;
2231 sdp->sd_file = ifl;
2232 ifl->ifl_oldndx[ndx] = sdp;
2233 }
2234
2235 DBG_CALL(Dbg_syms_entry(ofl->ofl_lml, ndx, sdp));
2236
2237 /*
2238 * Reclassify any SHN_SUNW_IGNORE symbols to SHN_UNDEF
2239 * so as to simplify future processing.
2240 */
2241 if (sym->st_shndx == SHN_SUNW_IGNORE) {
2242 sdp->sd_shndx = shndx = SHN_UNDEF;
2243 sdp->sd_flags |= (FLG_SY_IGNORE | FLG_SY_ELIM);
2244 }
2245
2246 /*
2247 * Process any register symbols.
2248 */
2249 if (sdp->sd_flags & FLG_SY_REGSYM) {
2250 /*
2251 * Add a diagnostic to indicate we've caught a
2252 * register symbol, as this can be useful if a
2253 * register conflict is later discovered.
2254 */
2255 DBG_CALL(Dbg_syms_entered(ofl, sym, sdp));
2256
2257 /*
2258 * If this register symbol hasn't already been
2259 * recorded, enter it now.
2260 *
2261 * The presence of FLG_SY_REGSYM means that
2262 * the pointers in ld_targ.t_ms are non-NULL.
2263 */
2264 if ((rsdp == NULL) &&
2265 ((*ld_targ.t_ms.ms_reg_enter)(sdp, ofl) ==
2266 0))
2267 return (S_ERROR);
2268 }
2269
2270 /*
2271 * Assign an input section.
2272 */
2273 if ((sym->st_shndx != SHN_UNDEF) &&
2274 ((sdp->sd_flags & FLG_SY_SPECSEC) == 0))
2275 sdp->sd_isc = ifl->ifl_isdesc[shndx];
2276
2277 /*
2278 * If this symbol falls within the range of a section
2279 * being discarded, then discard the symbol itself.
2280 * There is no reason to keep this local symbol.
2281 */
2282 if (sdp->sd_isc &&
2283 (sdp->sd_isc->is_flags & FLG_IS_DISCARD)) {
2284 sdp->sd_flags |= FLG_SY_ISDISC;
2285 DBG_CALL(Dbg_syms_discarded(ofl->ofl_lml, sdp));
2286 continue;
2287 }
2288
2289 /*
2290 * Skip any section symbols as new versions of these
2291 * will be created.
2292 */
2293 if ((type = ELF_ST_TYPE(sym->st_info)) == STT_SECTION) {
2294 if (sym->st_shndx == SHN_UNDEF) {
2295 ld_eprintf(ofl, ERR_WARNING,
2296 MSG_INTL(MSG_SYM_INVSHNDX),
2297 demangle_symname(name, symsecname,
2298 ndx), ifl->ifl_name,
2299 conv_sym_shndx(osabi, mach,
2300 sym->st_shndx, CONV_FMT_DECIMAL,
2301 &inv_buf));
2302 }
2303 continue;
2304 }
2305
2306 /*
2307 * For a relocatable object, if this symbol is defined
2308 * and has non-zero length and references an address
2309 * within an associated section, then check its extents
2310 * to make sure the section boundaries encompass it.
2311 * If they don't, the ELF file is corrupt.
2312 */
2313 if (etype_rel) {
2314 if (SYM_LOC_BADADDR(sdp, sym, type)) {
2315 issue_badaddr_msg(ifl, ofl, sdp,
2316 sym, shndx);
2317 if (ofl->ofl_flags & FLG_OF_FATAL)
2318 continue;
2319 }
2320
2321 /*
2322 * We have observed relocatable objects
2323 * containing identical adjacent STT_FILE
2324 * symbols. Discard any other than the first,
2325 * as they are all equivalent and the extras
2326 * do not add information.
2327 *
2328 * For the purpose of this test, we assume
2329 * that only the symbol type and the string
2330 * table offset (st_name) matter.
2331 */
2332 if (type == STT_FILE) {
2333 int toss = (last_file_sdp != NULL) &&
2334 ((ndx - 1) == last_file_ndx) &&
2335 (sym->st_name ==
2336 last_file_sdp->sd_sym->st_name);
2337
2338 last_file_sdp = sdp;
2339 last_file_ndx = ndx;
2340 if (toss) {
2341 sdp->sd_flags |= FLG_SY_INVALID;
2342 DBG_CALL(Dbg_syms_dup_discarded(
2343 ofl->ofl_lml, ndx, sdp));
2344 continue;
2345 }
2346 }
2347 }
2348
2349
2350 /*
2351 * Sanity check for TLS
2352 */
2353 if ((sym->st_size != 0) && ((type == STT_TLS) &&
2354 (sym->st_shndx != SHN_COMMON))) {
2355 Is_desc *isp = sdp->sd_isc;
2356
2357 if ((isp == NULL) || (isp->is_shdr == NULL) ||
2358 ((isp->is_shdr->sh_flags & SHF_TLS) == 0)) {
2359 ld_eprintf(ofl, ERR_FATAL,
2360 MSG_INTL(MSG_SYM_TLS),
2361 demangle(sdp->sd_name),
2362 ifl->ifl_name);
2363 continue;
2364 }
2365 }
2366
2367 /*
2368 * Carry out some basic sanity checks (these are just
2369 * some of the erroneous symbol entries we've come
2370 * across, there's probably a lot more). The symbol
2371 * will not be carried forward to the output file, which
2372 * won't be a problem unless a relocation is required
2373 * against it.
2374 */
2375 if (((sdp->sd_flags & FLG_SY_SPECSEC) &&
2376 ((sym->st_shndx == SHN_COMMON)) ||
2377 ((type == STT_FILE) &&
2378 (sym->st_shndx != SHN_ABS))) ||
2379 (sdp->sd_isc && (sdp->sd_isc->is_osdesc == NULL))) {
2380 ld_eprintf(ofl, ERR_WARNING,
2381 MSG_INTL(MSG_SYM_INVSHNDX),
2382 demangle_symname(name, symsecname, ndx),
2383 ifl->ifl_name,
2384 conv_sym_shndx(osabi, mach, sym->st_shndx,
2385 CONV_FMT_DECIMAL, &inv_buf));
2386 sdp->sd_isc = NULL;
2387 sdp->sd_flags |= FLG_SY_INVALID;
2388 continue;
2389 }
2390
2391 /*
2392 * As these local symbols will become part of the output
2393 * image, record their number and name string size.
2394 * Globals are counted after all input file processing
2395 * (and hence symbol resolution) is complete during
2396 * sym_validate().
2397 */
2398 if (!(ofl->ofl_flags & FLG_OF_REDLSYM) &&
2399 symtab_enter) {
2400 ofl->ofl_locscnt++;
2401
2402 if ((((sdp->sd_flags & FLG_SY_REGSYM) == 0) ||
2403 sym->st_name) && (st_insert(ofl->ofl_strtab,
2404 sdp->sd_name) == -1))
2405 return (S_ERROR);
2406
2407 if (allow_ldynsym && sym->st_name &&
2408 ldynsym_symtype[type]) {
2409 ofl->ofl_dynlocscnt++;
2410 if (st_insert(ofl->ofl_dynstrtab,
2411 sdp->sd_name) == -1)
2412 return (S_ERROR);
2413 /* Include it in sort section? */
2414 DYNSORT_COUNT(sdp, sym, type, ++);
2415 }
2416 }
2417 }
2418 }
2419
2420 /*
2421 * The GNU ld interprets the top bit of the 16-bit Versym value
2422 * (0x8000) as the "hidden" bit. If this bit is set, the linker
2423 * is supposed to act as if that symbol does not exist. The Solaris
2424 * linker does not support this mechanism, or the model of interface
2425 * evolution that it allows, but we honor it in GNU ld produced
2426 * objects in order to interoperate with them.
2427 *
2428 * Determine if we should honor the GNU hidden bit for this file.
2429 */
2430 test_gnu_hidden_bit = ((ifl->ifl_flags & FLG_IF_GNUVER) != 0) &&
2431 (ifl->ifl_versym != NULL);
2432
2433 /*
2434 * Determine whether object capabilities for this file are being
2435 * converted into symbol capabilities. If so, global function symbols,
2436 * and initialized global data symbols, need special translation and
2437 * processing.
2438 */
2439 if ((etype == ET_REL) && (ifl->ifl_flags & FLG_IF_OTOSCAP))
2440 cdp = ifl->ifl_caps;
2441
2442 /*
2443 * Now scan the global symbols entering them in the internal symbol
2444 * table or resolving them as necessary.
2445 */
2446 sym = (Sym *)isc->is_indata->d_buf;
2447 sym += local;
2448 weak = 0;
2449 /* LINTED */
2450 for (ndx = (int)local; ndx < total; sym++, ndx++) {
2451 const char *name;
2452 sd_flag_t sdflags = 0;
2453 Word shndx;
2454 int shndx_bad = 0;
2455 Sym *nsym = sym;
2456 Cap_pair *cpp = NULL;
2457 uchar_t ntype;
2458
2459 /*
2460 * Determine and validate the associated section index.
2461 */
2462 if (symshndx && (nsym->st_shndx == SHN_XINDEX)) {
2463 shndx = symshndx[ndx];
2464 } else if ((shndx = nsym->st_shndx) >= SHN_LORESERVE) {
2465 sdflags |= FLG_SY_SPECSEC;
2466 } else if (shndx > ifl->ifl_shnum) {
2467 /* We need the name before we can issue error */
2468 shndx_bad = 1;
2469 }
2470
2471 /*
2472 * Check if st_name has a valid value or not.
2473 */
2474 if ((name = string(ofl, ifl, nsym, strs, strsize, ndx, shndx,
2475 symsecndx, symsecname, strsecname, &sdflags)) == NULL)
2476 continue;
2477
2478 /*
2479 * Now that we have the name, report an erroneous section index.
2480 */
2481 if (shndx_bad) {
2482 ld_eprintf(ofl, ERR_WARNING, MSG_INTL(MSG_SYM_INVSHNDX),
2483 demangle_symname(name, symsecname, ndx),
2484 ifl->ifl_name,
2485 conv_sym_shndx(osabi, mach, nsym->st_shndx,
2486 CONV_FMT_DECIMAL, &inv_buf));
2487 continue;
2488 }
2489
2490 /*
2491 * Test for the GNU hidden bit, and ignore symbols that
2492 * have it set.
2493 */
2494 if (test_gnu_hidden_bit &&
2495 ((ifl->ifl_versym[ndx] & 0x8000) != 0))
2496 continue;
2497
2498 /*
2499 * The linker itself will generate symbols for _end, _etext,
2500 * _edata, _DYNAMIC and _PROCEDURE_LINKAGE_TABLE_, so don't
2501 * bother entering these symbols from shared objects. This
2502 * results in some wasted resolution processing, which is hard
2503 * to feel, but if nothing else, pollutes diagnostic relocation
2504 * output.
2505 */
2506 if (name[0] && (etype == ET_DYN) && (nsym->st_size == 0) &&
2507 (ELF_ST_TYPE(nsym->st_info) == STT_OBJECT) &&
2508 (name[0] == '_') && ((name[1] == 'e') ||
2509 (name[1] == 'D') || (name[1] == 'P')) &&
2510 ((strcmp(name, MSG_ORIG(MSG_SYM_ETEXT_U)) == 0) ||
2511 (strcmp(name, MSG_ORIG(MSG_SYM_EDATA_U)) == 0) ||
2512 (strcmp(name, MSG_ORIG(MSG_SYM_END_U)) == 0) ||
2513 (strcmp(name, MSG_ORIG(MSG_SYM_DYNAMIC_U)) == 0) ||
2514 (strcmp(name, MSG_ORIG(MSG_SYM_PLKTBL_U)) == 0))) {
2515 ifl->ifl_oldndx[ndx] = 0;
2516 continue;
2517 }
2518
2519 /*
2520 * The '-z wrap=XXX' option emulates the GNU ld --wrap=XXX
2521 * option. When XXX is the symbol to be wrapped:
2522 *
2523 * - An undefined reference to XXX is converted to __wrap_XXX
2524 * - An undefined reference to __real_XXX is converted to XXX
2525 *
2526 * The idea is that the user can supply a wrapper function
2527 * __wrap_XXX that does some work, and then uses the name
2528 * __real_XXX to pass the call on to the real function. The
2529 * wrapper objects are linked with the original unmodified
2530 * objects to produce a wrapped version of the output object.
2531 */
2532 if (ofl->ofl_wrap && name[0] && (shndx == SHN_UNDEF)) {
2533 WrapSymNode wsn, *wsnp;
2534
2535 /*
2536 * If this is the __real_XXX form, advance the
2537 * pointer to reference the wrapped name.
2538 */
2539 wsn.wsn_name = name;
2540 if ((*name == '_') &&
2541 (strncmp(name, MSG_ORIG(MSG_STR_UU_REAL_U),
2542 MSG_STR_UU_REAL_U_SIZE) == 0))
2543 wsn.wsn_name += MSG_STR_UU_REAL_U_SIZE;
2544
2545 /*
2546 * Is this symbol in the wrap AVL tree? If so, map
2547 * XXX to __wrap_XXX, and __real_XXX to XXX. Note that
2548 * wsn.wsn_name will equal the current value of name
2549 * if the __real_ prefix is not present.
2550 */
2551 if ((wsnp = avl_find(ofl->ofl_wrap, &wsn, 0)) != NULL) {
2552 const char *old_name = name;
2553
2554 name = (wsn.wsn_name == name) ?
2555 wsnp->wsn_wrapname : wsn.wsn_name;
2556 DBG_CALL(Dbg_syms_wrap(ofl->ofl_lml, ndx,
2557 old_name, name));
2558 }
2559 }
2560
2561 /*
2562 * Determine and validate the symbols binding.
2563 */
2564 bind = ELF_ST_BIND(nsym->st_info);
2565 if ((bind != STB_GLOBAL) && (bind != STB_WEAK)) {
2566 ld_eprintf(ofl, ERR_WARNING, MSG_INTL(MSG_SYM_NONGLOB),
2567 demangle_symname(name, symsecname, ndx),
2568 ifl->ifl_name,
2569 conv_sym_info_bind(bind, 0, &inv_buf));
2570 continue;
2571 }
2572 if (bind == STB_WEAK)
2573 weak++;
2574
2575 /*
2576 * If this symbol falls within the range of a section being
2577 * discarded, then discard the symbol itself.
2578 */
2579 if (((sdflags & FLG_SY_SPECSEC) == 0) &&
2580 (nsym->st_shndx != SHN_UNDEF)) {
2581 Is_desc *isp;
2582
2583 if (shndx >= ifl->ifl_shnum) {
2584 /*
2585 * Carry out some basic sanity checks.
2586 * The symbol will not be carried forward to
2587 * the output file, which won't be a problem
2588 * unless a relocation is required against it.
2589 */
2590 ld_eprintf(ofl, ERR_WARNING,
2591 MSG_INTL(MSG_SYM_INVSHNDX),
2592 demangle_symname(name, symsecname, ndx),
2593 ifl->ifl_name,
2594 conv_sym_shndx(osabi, mach, nsym->st_shndx,
2595 CONV_FMT_DECIMAL, &inv_buf));
2596 continue;
2597 }
2598
2599 isp = ifl->ifl_isdesc[shndx];
2600 if (isp && (isp->is_flags & FLG_IS_DISCARD)) {
2601 if ((sdp =
2602 libld_calloc(sizeof (Sym_desc), 1)) == NULL)
2603 return (S_ERROR);
2604
2605 /*
2606 * Create a dummy symbol entry so that if we
2607 * find any references to this discarded symbol
2608 * we can compensate.
2609 */
2610 sdp->sd_name = name;
2611 sdp->sd_sym = nsym;
2612 sdp->sd_file = ifl;
2613 sdp->sd_isc = isp;
2614 sdp->sd_flags = FLG_SY_ISDISC;
2615 ifl->ifl_oldndx[ndx] = sdp;
2616
2617 DBG_CALL(Dbg_syms_discarded(ofl->ofl_lml, sdp));
2618 continue;
2619 }
2620 }
2621
2622 /*
2623 * If object capabilities for this file are being converted
2624 * into symbol capabilities, then:
2625 *
2626 * - Any global function, or initialized global data symbol
2627 * definitions (ie., those that are not associated with
2628 * special symbol types, ie., ABS, COMMON, etc.), and which
2629 * have not been reduced to locals, are converted to symbol
2630 * references (UNDEF). This ensures that any reference to
2631 * the original symbol, for example from a relocation, get
2632 * associated to a capabilities family lead symbol, ie., a
2633 * generic instance.
2634 *
2635 * - For each global function, or object symbol definition,
2636 * a new local symbol is created. The function or object
2637 * is renamed using the capabilities CA_SUNW_ID definition
2638 * (which might have been fabricated for this purpose -
2639 * see get_cap_group()). The new symbol name is:
2640 *
2641 * <original name>%<capability group identifier>
2642 *
2643 * This symbol is associated to the same location, and
2644 * becomes a capabilities family member.
2645 */
2646 /* LINTED */
2647 hash = (Word)elf_hash(name);
2648
2649 ntype = ELF_ST_TYPE(nsym->st_info);
2650 if (cdp && (nsym->st_shndx != SHN_UNDEF) &&
2651 ((sdflags & FLG_SY_SPECSEC) == 0) &&
2652 ((ntype == STT_FUNC) || (ntype == STT_OBJECT))) {
2653 /*
2654 * Determine this symbol's visibility. If a mapfile has
2655 * indicated this symbol should be local, then there's
2656 * no point in transforming this global symbol to a
2657 * capabilities symbol. Otherwise, create a symbol
2658 * capability pair descriptor to record this symbol as
2659 * a candidate for translation.
2660 */
2661 if (sym_cap_vis(name, hash, sym, ofl) &&
2662 ((cpp = alist_append(&cappairs, NULL,
2663 sizeof (Cap_pair), AL_CNT_CAP_PAIRS)) == NULL))
2664 return (S_ERROR);
2665 }
2666
2667 if (cpp) {
2668 Sym *rsym;
2669
2670 DBG_CALL(Dbg_syms_cap_convert(ofl, ndx, name, nsym));
2671
2672 /*
2673 * Allocate a new symbol descriptor to represent the
2674 * transformed global symbol. The descriptor points
2675 * to the original symbol information (which might
2676 * indicate a global or weak visibility). The symbol
2677 * information will be transformed into a local symbol
2678 * later, after any weak aliases are culled.
2679 */
2680 if ((cpp->c_osdp =
2681 libld_malloc(sizeof (Sym_desc))) == NULL)
2682 return (S_ERROR);
2683
2684 cpp->c_osdp->sd_name = name;
2685 cpp->c_osdp->sd_sym = nsym;
2686 cpp->c_osdp->sd_shndx = shndx;
2687 cpp->c_osdp->sd_file = ifl;
2688 cpp->c_osdp->sd_isc = ifl->ifl_isdesc[shndx];
2689 cpp->c_osdp->sd_ref = REF_REL_NEED;
2690
2691 /*
2692 * Save the capabilities group this symbol belongs to,
2693 * and the original symbol index.
2694 */
2695 cpp->c_group = cdp->ca_groups->apl_data[0];
2696 cpp->c_ndx = ndx;
2697
2698 /*
2699 * Replace the original symbol definition with a symbol
2700 * reference. Make sure this reference isn't left as a
2701 * weak.
2702 */
2703 if ((rsym = libld_malloc(sizeof (Sym))) == NULL)
2704 return (S_ERROR);
2705
2706 *rsym = *nsym;
2707
2708 rsym->st_info = ELF_ST_INFO(STB_GLOBAL, ntype);
2709 rsym->st_shndx = shndx = SHN_UNDEF;
2710 rsym->st_value = 0;
2711 rsym->st_size = 0;
2712
2713 sdflags |= FLG_SY_CAP;
2714
2715 nsym = rsym;
2716 }
2717
2718 /*
2719 * If the symbol does not already exist in the internal symbol
2720 * table add it, otherwise resolve the conflict. If the symbol
2721 * from this file is kept, retain its symbol table index for
2722 * possible use in associating a global alias.
2723 */
2724 if ((sdp = ld_sym_find(name, hash, &where, ofl)) == NULL) {
2725 DBG_CALL(Dbg_syms_global(ofl->ofl_lml, ndx, name));
2726 if ((sdp = ld_sym_enter(name, nsym, hash, ifl, ofl, ndx,
2727 shndx, sdflags, &where)) == (Sym_desc *)S_ERROR)
2728 return (S_ERROR);
2729
2730 } else if (ld_sym_resolve(sdp, nsym, ifl, ofl, ndx, shndx,
2731 sdflags) == S_ERROR)
2732 return (S_ERROR);
2733
2734 /*
2735 * Now that we have a symbol descriptor, retain the descriptor
2736 * for later use by symbol capabilities processing.
2737 */
2738 if (cpp)
2739 cpp->c_nsdp = sdp;
2740
2741 /*
2742 * After we've compared a defined symbol in one shared
2743 * object, flag the symbol so we don't compare it again.
2744 */
2745 if ((etype == ET_DYN) && (nsym->st_shndx != SHN_UNDEF) &&
2746 ((sdp->sd_flags & FLG_SY_SOFOUND) == 0))
2747 sdp->sd_flags |= FLG_SY_SOFOUND;
2748
2749 /*
2750 * If the symbol is accepted from this file retain the symbol
2751 * index for possible use in aliasing.
2752 */
2753 if (sdp->sd_file == ifl)
2754 sdp->sd_symndx = ndx;
2755
2756 ifl->ifl_oldndx[ndx] = sdp;
2757
2758 /*
2759 * If we've accepted a register symbol, continue to validate
2760 * it.
2761 */
2762 if (sdp->sd_flags & FLG_SY_REGSYM) {
2763 Sym_desc *rsdp;
2764
2765 /*
2766 * The presence of FLG_SY_REGSYM means that
2767 * the pointers in ld_targ.t_ms are non-NULL.
2768 */
2769 rsdp = (*ld_targ.t_ms.ms_reg_find)(sdp->sd_sym, ofl);
2770 if (rsdp == NULL) {
2771 if ((*ld_targ.t_ms.ms_reg_enter)(sdp, ofl) == 0)
2772 return (S_ERROR);
2773 } else if (rsdp != sdp) {
2774 (void) (*ld_targ.t_ms.ms_reg_check)(rsdp,
2775 sdp->sd_sym, sdp->sd_name, ifl, ofl);
2776 }
2777 }
2778
2779 /*
2780 * For a relocatable object, if this symbol is defined
2781 * and has non-zero length and references an address
2782 * within an associated section, then check its extents
2783 * to make sure the section boundaries encompass it.
2784 * If they don't, the ELF file is corrupt. Note that this
2785 * global symbol may have come from another file to satisfy
2786 * an UNDEF symbol of the same name from this one. In that
2787 * case, we don't check it, because it was already checked
2788 * as part of its own file.
2789 */
2790 if (etype_rel && (sdp->sd_file == ifl)) {
2791 Sym *tsym = sdp->sd_sym;
2792
2793 if (SYM_LOC_BADADDR(sdp, tsym,
2794 ELF_ST_TYPE(tsym->st_info))) {
2795 issue_badaddr_msg(ifl, ofl, sdp,
2796 tsym, tsym->st_shndx);
2797 continue;
2798 }
2799 }
2800 }
2801 DBG_CALL(Dbg_util_nl(ofl->ofl_lml, DBG_NL_STD));
2802
2803 /*
2804 * Associate weak (alias) symbols to their non-weak counterparts by
2805 * scanning the global symbols one more time.
2806 *
2807 * This association is needed when processing the symbols from a shared
2808 * object dependency when a weak definition satisfies a reference:
2809 *
2810 * - When building a dynamic executable, if a referenced symbol is a
2811 * data item, the symbol data is copied to the executables address
2812 * space. In this copy-relocation case, we must also reassociate
2813 * the alias symbol with its new location in the executable.
2814 *
2815 * - If the referenced symbol is a function then we may need to
2816 * promote the symbols binding from undefined weak to undefined,
2817 * otherwise the run-time linker will not generate the correct
2818 * relocation error should the symbol not be found.
2819 *
2820 * Weak alias association is also required when a local dynsym table
2821 * is being created. This table should only contain one instance of a
2822 * symbol that is associated to a given address.
2823 *
2824 * The true association between a weak/strong symbol pair is that both
2825 * symbol entries are identical, thus first we create a sorted symbol
2826 * list keyed off of the symbols section index and value. If the symbol
2827 * belongs to the same section and has the same value, then the chances
2828 * are that the rest of the symbols data is the same. This list is then
2829 * scanned for weak symbols, and if one is found then any strong
2830 * association will exist in the entries that follow. Thus we just have
2831 * to scan one (typically a single alias) or more (in the uncommon
2832 * instance of multiple weak to strong associations) entries to
2833 * determine if a match exists.
2834 */
2835 if (weak && (OFL_ALLOW_LDYNSYM(ofl) || (etype == ET_DYN)) &&
2836 (total > local)) {
2837 static Sym_desc **sort;
2838 static size_t osize = 0;
2839 size_t nsize = (total - local) * sizeof (Sym_desc *);
2840
2841 /*
2842 * As we might be processing many input files, and many symbols,
2843 * try and reuse a static sort buffer. Note, presently we're
2844 * playing the game of never freeing any buffers as there's a
2845 * belief this wastes time.
2846 */
2847 if ((osize == 0) || (nsize > osize)) {
2848 if ((sort = libld_malloc(nsize)) == NULL)
2849 return (S_ERROR);
2850 osize = nsize;
2851 }
2852 (void) memcpy((void *)sort, &ifl->ifl_oldndx[local], nsize);
2853
2854 qsort(sort, (total - local), sizeof (Sym_desc *), compare);
2855
2856 for (ndx = 0; ndx < (total - local); ndx++) {
2857 Sym_desc *wsdp = sort[ndx];
2858 Sym *wsym;
2859 int sndx;
2860
2861 /*
2862 * Ignore any empty symbol descriptor, or the case where
2863 * the symbol has been resolved to a different file.
2864 */
2865 if ((wsdp == NULL) || (wsdp->sd_file != ifl))
2866 continue;
2867
2868 wsym = wsdp->sd_sym;
2869
2870 if ((wsym->st_shndx == SHN_UNDEF) ||
2871 (wsdp->sd_flags & FLG_SY_SPECSEC) ||
2872 (ELF_ST_BIND(wsym->st_info) != STB_WEAK))
2873 continue;
2874
2875 /*
2876 * We have a weak symbol, if it has a strong alias it
2877 * will have been sorted to one of the following sort
2878 * table entries. Note that we could have multiple weak
2879 * symbols aliased to one strong (if this occurs then
2880 * the strong symbol only maintains one alias back to
2881 * the last weak).
2882 */
2883 for (sndx = ndx + 1; sndx < (total - local); sndx++) {
2884 Sym_desc *ssdp = sort[sndx];
2885 Sym *ssym;
2886 sd_flag_t w_dynbits, s_dynbits;
2887
2888 /*
2889 * Ignore any empty symbol descriptor, or the
2890 * case where the symbol has been resolved to a
2891 * different file.
2892 */
2893 if ((ssdp == NULL) || (ssdp->sd_file != ifl))
2894 continue;
2895
2896 ssym = ssdp->sd_sym;
2897
2898 if (ssym->st_shndx == SHN_UNDEF)
2899 continue;
2900
2901 if ((ssym->st_shndx != wsym->st_shndx) ||
2902 (ssym->st_value != wsym->st_value))
2903 break;
2904
2905 if ((ssym->st_size != wsym->st_size) ||
2906 (ssdp->sd_flags & FLG_SY_SPECSEC) ||
2907 (ELF_ST_BIND(ssym->st_info) == STB_WEAK))
2908 continue;
2909
2910 /*
2911 * If a sharable object, set link fields so
2912 * that they reference each other.
2913 */
2914 if (etype == ET_DYN) {
2915 ssdp->sd_aux->sa_linkndx =
2916 (Word)wsdp->sd_symndx;
2917 wsdp->sd_aux->sa_linkndx =
2918 (Word)ssdp->sd_symndx;
2919 }
2920
2921 /*
2922 * Determine which of these two symbols go into
2923 * the sort section. If a mapfile has made
2924 * explicit settings of the FLG_SY_*DYNSORT
2925 * flags for both symbols, then we do what they
2926 * say. If one has the DYNSORT flags set, we
2927 * set the NODYNSORT bit in the other. And if
2928 * neither has an explicit setting, then we
2929 * favor the weak symbol because they usually
2930 * lack the leading underscore.
2931 */
2932 w_dynbits = wsdp->sd_flags &
2933 (FLG_SY_DYNSORT | FLG_SY_NODYNSORT);
2934 s_dynbits = ssdp->sd_flags &
2935 (FLG_SY_DYNSORT | FLG_SY_NODYNSORT);
2936 if (!(w_dynbits && s_dynbits)) {
2937 if (s_dynbits) {
2938 if (s_dynbits == FLG_SY_DYNSORT)
2939 wsdp->sd_flags |=
2940 FLG_SY_NODYNSORT;
2941 } else if (w_dynbits !=
2942 FLG_SY_NODYNSORT) {
2943 ssdp->sd_flags |=
2944 FLG_SY_NODYNSORT;
2945 }
2946 }
2947 break;
2948 }
2949 }
2950 }
2951
2952 /*
2953 * Having processed all symbols, under -z symbolcap, reprocess any
2954 * symbols that are being translated from global to locals. The symbol
2955 * pair that has been collected defines the original symbol (c_osdp),
2956 * which will become a local, and the new symbol (c_nsdp), which will
2957 * become a reference (UNDEF) for the original.
2958 *
2959 * Scan these symbol pairs looking for weak symbols, which have non-weak
2960 * aliases. There is no need to translate both of these symbols to
2961 * locals, only the global is necessary.
2962 */
2963 if (cappairs) {
2964 Aliste idx1;
2965 Cap_pair *cpp1;
2966
2967 for (ALIST_TRAVERSE(cappairs, idx1, cpp1)) {
2968 Sym_desc *sdp1 = cpp1->c_osdp;
2969 Sym *sym1 = sdp1->sd_sym;
2970 uchar_t bind1 = ELF_ST_BIND(sym1->st_info);
2971 Aliste idx2;
2972 Cap_pair *cpp2;
2973
2974 /*
2975 * If this symbol isn't weak, its capability member is
2976 * retained for the creation of a local symbol.
2977 */
2978 if (bind1 != STB_WEAK)
2979 continue;
2980
2981 /*
2982 * If this is a weak symbol, traverse the capabilities
2983 * list again to determine if a corresponding non-weak
2984 * symbol exists.
2985 */
2986 for (ALIST_TRAVERSE(cappairs, idx2, cpp2)) {
2987 Sym_desc *sdp2 = cpp2->c_osdp;
2988 Sym *sym2 = sdp2->sd_sym;
2989 uchar_t bind2 =
2990 ELF_ST_BIND(sym2->st_info);
2991
2992 if ((cpp1 == cpp2) ||
2993 (cpp1->c_group != cpp2->c_group) ||
2994 (sym1->st_value != sym2->st_value) ||
2995 (bind2 == STB_WEAK))
2996 continue;
2997
2998 /*
2999 * The weak symbol (sym1) has a non-weak (sym2)
3000 * counterpart. There's no point in translating
3001 * both of these equivalent symbols to locals.
3002 * Add this symbol capability alias to the
3003 * capabilities family information, and remove
3004 * the weak symbol.
3005 */
3006 if (ld_cap_add_family(ofl, cpp2->c_nsdp,
3007 cpp1->c_nsdp, NULL, NULL) == S_ERROR)
3008 return (S_ERROR);
3009
3010 free((void *)cpp1->c_osdp);
3011 (void) alist_delete(cappairs, &idx1);
3012 }
3013 }
3014
3015 DBG_CALL(Dbg_util_nl(ofl->ofl_lml, DBG_NL_STD));
3016
3017 /*
3018 * The capability pairs information now represents all the
3019 * global symbols that need transforming to locals. These
3020 * local symbols are renamed using their group identifiers.
3021 */
3022 for (ALIST_TRAVERSE(cappairs, idx1, cpp1)) {
3023 Sym_desc *osdp = cpp1->c_osdp;
3024 Objcapset *capset;
3025 size_t nsize, tsize;
3026 const char *oname;
3027 char *cname, *idstr;
3028 Sym *csym;
3029
3030 /*
3031 * If the local symbol has not yet been translated
3032 * convert it to a local symbol with a name.
3033 */
3034 if ((osdp->sd_flags & FLG_SY_CAP) != 0)
3035 continue;
3036
3037 /*
3038 * As we're converting object capabilities to symbol
3039 * capabilities, obtain the capabilities set for this
3040 * object, so as to retrieve the CA_SUNW_ID value.
3041 */
3042 capset = &cpp1->c_group->cg_set;
3043
3044 /*
3045 * Create a new name from the existing symbol and the
3046 * capabilities group identifier. Note, the delimiter
3047 * between the symbol name and identifier name is hard-
3048 * coded here (%), so that we establish a convention
3049 * for transformed symbol names.
3050 */
3051 oname = osdp->sd_name;
3052
3053 idstr = capset->oc_id.cs_str;
3054 nsize = strlen(oname);
3055 tsize = nsize + 1 + strlen(idstr) + 1;
3056 if ((cname = libld_malloc(tsize)) == 0)
3057 return (S_ERROR);
3058
3059 (void) strcpy(cname, oname);
3060 cname[nsize++] = '%';
3061 (void) strcpy(&cname[nsize], idstr);
3062
3063 /*
3064 * Allocate a new symbol table entry, transform this
3065 * symbol to a local, and assign the new name.
3066 */
3067 if ((csym = libld_malloc(sizeof (Sym))) == NULL)
3068 return (S_ERROR);
3069
3070 *csym = *osdp->sd_sym;
3071 csym->st_info = ELF_ST_INFO(STB_LOCAL,
3072 ELF_ST_TYPE(osdp->sd_sym->st_info));
3073
3074 osdp->sd_name = cname;
3075 osdp->sd_sym = csym;
3076 osdp->sd_flags = FLG_SY_CAP;
3077
3078 /*
3079 * Keep track of this new local symbol. As -z symbolcap
3080 * can only be used to create a relocatable object, a
3081 * dynamic symbol table can't exist. Ensure there is
3082 * space reserved in the string table.
3083 */
3084 ofl->ofl_caploclcnt++;
3085 if (st_insert(ofl->ofl_strtab, cname) == -1)
3086 return (S_ERROR);
3087
3088 DBG_CALL(Dbg_syms_cap_local(ofl, cpp1->c_ndx,
3089 cname, csym, osdp));
3090
3091 /*
3092 * Establish this capability pair as a family.
3093 */
3094 if (ld_cap_add_family(ofl, cpp1->c_nsdp, osdp,
3095 cpp1->c_group, &ifl->ifl_caps->ca_syms) == S_ERROR)
3096 return (S_ERROR);
3097 }
3098 }
3099
3100 return (1);
3101
3102 #undef SYM_LOC_BADADDR
3103 }
3104
3105 /*
3106 * Add an undefined symbol to the symbol table. The reference originates from
3107 * the location identified by the message id (mid). These references can
3108 * originate from command line options such as -e, -u, -initarray, etc.
3109 * (identified with MSG_INTL(MSG_STR_COMMAND)), or from internally generated
3110 * TLS relocation references (identified with MSG_INTL(MSG_STR_TLSREL)).
3111 */
3112 Sym_desc *
3113 ld_sym_add_u(const char *name, Ofl_desc *ofl, Msg mid)
3114 {
3115 Sym *sym;
3116 Ifl_desc *ifl = NULL, *_ifl;
3117 Sym_desc *sdp;
3118 Word hash;
3119 Aliste idx;
3120 avl_index_t where;
3121 const char *reference = MSG_INTL(mid);
3122
3123 /*
3124 * As an optimization, determine whether we've already generated this
3125 * reference. If the symbol doesn't already exist we'll create it.
3126 * Or if the symbol does exist from a different source, we'll resolve
3127 * the conflict.
3128 */
3129 /* LINTED */
3130 hash = (Word)elf_hash(name);
3131 if ((sdp = ld_sym_find(name, hash, &where, ofl)) != NULL) {
3132 if ((sdp->sd_sym->st_shndx == SHN_UNDEF) &&
3133 (sdp->sd_file->ifl_name == reference))
3134 return (sdp);
3135 }
3136
3137 /*
3138 * Determine whether a pseudo input file descriptor exists to represent
3139 * the command line, as any global symbol needs an input file descriptor
3140 * during any symbol resolution (refer to map_ifl() which provides a
3141 * similar method for adding symbols from mapfiles).
3142 */
3143 for (APLIST_TRAVERSE(ofl->ofl_objs, idx, _ifl))
3144 if (strcmp(_ifl->ifl_name, reference) == 0) {
3145 ifl = _ifl;
3146 break;
3147 }
3148
3149 /*
3150 * If no descriptor exists create one.
3151 */
3152 if (ifl == NULL) {
3153 if ((ifl = libld_calloc(sizeof (Ifl_desc), 1)) == NULL)
3154 return ((Sym_desc *)S_ERROR);
3155 ifl->ifl_name = reference;
3156 ifl->ifl_flags = FLG_IF_NEEDED | FLG_IF_FILEREF;
3157 if ((ifl->ifl_ehdr = libld_calloc(sizeof (Ehdr), 1)) == NULL)
3158 return ((Sym_desc *)S_ERROR);
3159 ifl->ifl_ehdr->e_type = ET_REL;
3160
3161 if (aplist_append(&ofl->ofl_objs, ifl, AL_CNT_OFL_OBJS) == NULL)
3162 return ((Sym_desc *)S_ERROR);
3163 }
3164
3165 /*
3166 * Allocate a symbol structure and add it to the global symbol table.
3167 */
3168 if ((sym = libld_calloc(sizeof (Sym), 1)) == NULL)
3169 return ((Sym_desc *)S_ERROR);
3170 sym->st_info = ELF_ST_INFO(STB_GLOBAL, STT_NOTYPE);
3171 sym->st_shndx = SHN_UNDEF;
3172
3173 DBG_CALL(Dbg_syms_process(ofl->ofl_lml, ifl));
3174 if (sdp == NULL) {
3175 DBG_CALL(Dbg_syms_global(ofl->ofl_lml, 0, name));
3176 if ((sdp = ld_sym_enter(name, sym, hash, ifl, ofl, 0, SHN_UNDEF,
3177 0, &where)) == (Sym_desc *)S_ERROR)
3178 return ((Sym_desc *)S_ERROR);
3179 } else if (ld_sym_resolve(sdp, sym, ifl, ofl, 0,
3180 SHN_UNDEF, 0) == S_ERROR)
3181 return ((Sym_desc *)S_ERROR);
3182
3183 sdp->sd_flags &= ~FLG_SY_CLEAN;
3184 sdp->sd_flags |= FLG_SY_CMDREF;
3185
3186 return (sdp);
3187 }
3188
3189 /*
3190 * STT_SECTION symbols have their st_name field set to NULL, and consequently
3191 * have no name. Generate a name suitable for diagnostic use for such a symbol
3192 * and store it in the input section descriptor. The resulting name will be
3193 * of the form:
3194 *
3195 * "XXX (section)"
3196 *
3197 * where XXX is the name of the section.
3198 *
3199 * entry:
3200 * isc - Input section associated with the symbol.
3201 * fmt - NULL, or format string to use.
3202 *
3203 * exit:
3204 * Sets isp->is_sym_name to the allocated string. Returns the
3205 * string pointer, or NULL on allocation failure.
3206 */
3207 const char *
3208 ld_stt_section_sym_name(Is_desc *isp)
3209 {
3210 const char *fmt;
3211 char *str;
3212 size_t len;
3213
3214 if ((isp == NULL) || (isp->is_name == NULL))
3215 return (NULL);
3216
3217 if (isp->is_sym_name == NULL) {
3218 fmt = (isp->is_flags & FLG_IS_GNSTRMRG) ?
3219 MSG_INTL(MSG_STR_SECTION_MSTR) : MSG_INTL(MSG_STR_SECTION);
3220
3221 len = strlen(fmt) + strlen(isp->is_name) + 1;
3222
3223 if ((str = libld_malloc(len)) == NULL)
3224 return (NULL);
3225 (void) snprintf(str, len, fmt, isp->is_name);
3226 isp->is_sym_name = str;
3227 }
3228
3229 return (isp->is_sym_name);
3230 }