dl-hash.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367
  1. /* vi: set sw=4 ts=4: */
  2. /*
  3. * Program to load an ELF binary on a linux system, and run it
  4. * after resolving ELF shared library symbols
  5. *
  6. * Copyright (C) 2004 by Joakim Tjernlund <joakim.tjernlund@lumentis.se>
  7. * Copyright (C) 2000-2006 by Erik Andersen <andersen@codepoet.org>
  8. * Copyright (c) 1994-2000 Eric Youngdale, Peter MacDonald,
  9. * David Engel, Hongjiu Lu and Mitch D'Souza
  10. *
  11. * Redistribution and use in source and binary forms, with or without
  12. * modification, are permitted provided that the following conditions
  13. * are met:
  14. * 1. Redistributions of source code must retain the above copyright
  15. * notice, this list of conditions and the following disclaimer.
  16. * 2. The name of the above contributors may not be
  17. * used to endorse or promote products derived from this software
  18. * without specific prior written permission.
  19. *
  20. * THIS SOFTWARE IS PROVIDED BY THE CONTRIBUTORS ``AS IS'' AND
  21. * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  22. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  23. * ARE DISCLAIMED. IN NO EVENT SHALL THE CONTRIBUTORS BE LIABLE
  24. * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  25. * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  26. * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  27. * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  28. * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  29. * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  30. * SUCH DAMAGE.
  31. */
  32. /* Various symbol table handling functions, including symbol lookup */
  33. /*
  34. * This is the start of the linked list that describes all of the files present
  35. * in the system with pointers to all of the symbol, string, and hash tables,
  36. * as well as all of the other good stuff in the binary.
  37. */
  38. struct elf_resolve *_dl_loaded_modules = NULL;
  39. /*
  40. * This is the list of modules that are loaded when the image is first
  41. * started. As we add more via dlopen, they get added into other
  42. * chains.
  43. */
  44. struct dyn_elf *_dl_symbol_tables = NULL;
  45. /*
  46. * This is the list of modules that are loaded via dlopen. We may need
  47. * to search these for RTLD_GLOBAL files.
  48. */
  49. struct dyn_elf *_dl_handles = NULL;
  50. #ifdef __LDSO_GNU_HASH_SUPPORT__
  51. /* This is the new hash function that is used by the ELF linker to generate the
  52. * GNU hash table that each executable and library will have if --hash-style=[gnu,both]
  53. * is passed to the linker. We need it to decode the GNU hash table. */
  54. static __inline__ Elf_Symndx _dl_gnu_hash (const unsigned char *name)
  55. {
  56. unsigned long h = 5381;
  57. unsigned char c;
  58. for (c = *name; c != '\0'; c = *++name)
  59. h = h * 33 + c;
  60. return h & 0xffffffff;
  61. }
  62. #endif
  63. /* This is the hash function that is used by the ELF linker to generate the
  64. * hash table that each executable and library is required to have. We need
  65. * it to decode the hash table. */
  66. static __inline__ Elf_Symndx _dl_elf_hash(const unsigned char *name)
  67. {
  68. unsigned long hash=0;
  69. unsigned long tmp;
  70. while (*name) {
  71. hash = (hash << 4) + *name++;
  72. tmp = hash & 0xf0000000;
  73. /* The algorithm specified in the ELF ABI is as follows:
  74. if (tmp != 0)
  75. hash ^= tmp >> 24;
  76. hash &= ~tmp;
  77. But the following is equivalent and a lot
  78. faster, especially on modern processors. */
  79. hash ^= tmp;
  80. hash ^= tmp >> 24;
  81. }
  82. return hash;
  83. }
  84. /*
  85. * We call this function when we have just read an ELF library or executable.
  86. * We add the relevant info to the symbol chain, so that we can resolve all
  87. * externals properly.
  88. */
  89. struct elf_resolve *_dl_add_elf_hash_table(const char *libname,
  90. DL_LOADADDR_TYPE loadaddr, unsigned long *dynamic_info, unsigned long dynamic_addr,
  91. attribute_unused unsigned long dynamic_size)
  92. {
  93. Elf_Symndx *hash_addr;
  94. struct elf_resolve *tpnt;
  95. int i;
  96. if (!_dl_loaded_modules) {
  97. tpnt = _dl_loaded_modules = (struct elf_resolve *) _dl_malloc(sizeof(struct elf_resolve));
  98. _dl_memset(tpnt, 0, sizeof(struct elf_resolve));
  99. } else {
  100. tpnt = _dl_loaded_modules;
  101. while (tpnt->next)
  102. tpnt = tpnt->next;
  103. tpnt->next = (struct elf_resolve *) _dl_malloc(sizeof(struct elf_resolve));
  104. _dl_memset(tpnt->next, 0, sizeof(struct elf_resolve));
  105. tpnt->next->prev = tpnt;
  106. tpnt = tpnt->next;
  107. }
  108. tpnt->next = NULL;
  109. tpnt->init_flag = 0;
  110. tpnt->libname = _dl_strdup(libname);
  111. tpnt->dynamic_addr = (ElfW(Dyn) *)dynamic_addr;
  112. tpnt->libtype = loaded_file;
  113. #ifdef __LDSO_GNU_HASH_SUPPORT__
  114. if (dynamic_info[DT_GNU_HASH_IDX] != 0) {
  115. Elf32_Word *hash32 = (Elf_Symndx*)dynamic_info[DT_GNU_HASH_IDX];
  116. tpnt->nbucket = *hash32++;
  117. Elf32_Word symbias = *hash32++;
  118. Elf32_Word bitmask_nwords = *hash32++;
  119. /* Must be a power of two. */
  120. _dl_assert ((bitmask_nwords & (bitmask_nwords - 1)) == 0);
  121. tpnt->l_gnu_bitmask_idxbits = bitmask_nwords - 1;
  122. tpnt->l_gnu_shift = *hash32++;
  123. tpnt->l_gnu_bitmask = (ElfW(Addr) *) hash32;
  124. hash32 += __ELF_NATIVE_CLASS / 32 * bitmask_nwords;
  125. tpnt->l_gnu_buckets = hash32;
  126. hash32 += tpnt->nbucket;
  127. tpnt->l_gnu_chain_zero = hash32 - symbias;
  128. } else
  129. /* Fall using old SysV hash table if GNU hash is not present */
  130. #endif
  131. if (dynamic_info[DT_HASH] != 0) {
  132. hash_addr = (Elf_Symndx*)dynamic_info[DT_HASH];
  133. tpnt->nbucket = *hash_addr++;
  134. tpnt->nchain = *hash_addr++;
  135. tpnt->elf_buckets = hash_addr;
  136. hash_addr += tpnt->nbucket;
  137. tpnt->chains = hash_addr;
  138. }
  139. tpnt->loadaddr = loadaddr;
  140. tpnt->mapaddr = DL_RELOC_ADDR(loadaddr, 0);
  141. for (i = 0; i < DYNAMIC_SIZE; i++)
  142. tpnt->dynamic_info[i] = dynamic_info[i];
  143. return tpnt;
  144. }
  145. /* Routine to check whether the symbol matches. */
  146. static __attribute_noinline__ const ElfW(Sym) *
  147. check_match (const ElfW(Sym) *sym, char *strtab, const char* undef_name, int type_class)
  148. {
  149. if (type_class & (sym->st_shndx == SHN_UNDEF))
  150. /* undefined symbol itself */
  151. return NULL;
  152. if (sym->st_value == 0)
  153. /* No value */
  154. return NULL;
  155. if (ELF_ST_TYPE(sym->st_info) > STT_FUNC
  156. && ELF_ST_TYPE(sym->st_info) != STT_COMMON)
  157. /* Ignore all but STT_NOTYPE, STT_OBJECT, STT_FUNC
  158. * and STT_COMMON entries since these are no
  159. * code/data definitions
  160. */
  161. return NULL;
  162. if (_dl_strcmp(strtab + sym->st_name, undef_name) != 0)
  163. return NULL;
  164. /* This is the matching symbol */
  165. return sym;
  166. }
  167. #ifdef __LDSO_GNU_HASH_SUPPORT__
  168. static __always_inline const ElfW(Sym) *
  169. _dl_lookup_gnu_hash(struct elf_resolve *tpnt, ElfW(Sym) *symtab, unsigned long hash,
  170. const char* undef_name, int type_class)
  171. {
  172. Elf_Symndx symidx;
  173. const ElfW(Sym) *sym;
  174. char *strtab;
  175. const ElfW(Addr) *bitmask = tpnt->l_gnu_bitmask;
  176. ElfW(Addr) bitmask_word = bitmask[(hash / __ELF_NATIVE_CLASS) & tpnt->l_gnu_bitmask_idxbits];
  177. unsigned int hashbit1 = hash & (__ELF_NATIVE_CLASS - 1);
  178. unsigned int hashbit2 = ((hash >> tpnt->l_gnu_shift) & (__ELF_NATIVE_CLASS - 1));
  179. _dl_assert (bitmask != NULL);
  180. if (unlikely((bitmask_word >> hashbit1) & (bitmask_word >> hashbit2) & 1)) {
  181. unsigned long rem;
  182. Elf32_Word bucket;
  183. do_rem (rem, hash, tpnt->nbucket);
  184. bucket = tpnt->l_gnu_buckets[rem];
  185. if (bucket != 0) {
  186. const Elf32_Word *hasharr = &tpnt->l_gnu_chain_zero[bucket];
  187. do {
  188. if (((*hasharr ^ hash) >> 1) == 0) {
  189. symidx = hasharr - tpnt->l_gnu_chain_zero;
  190. strtab = (char *) (tpnt->dynamic_info[DT_STRTAB]);
  191. sym = check_match (&symtab[symidx], strtab, undef_name, type_class);
  192. if (sym != NULL)
  193. return sym;
  194. }
  195. } while ((*hasharr++ & 1u) == 0);
  196. }
  197. }
  198. /* No symbol found. */
  199. return NULL;
  200. }
  201. #endif
  202. static __always_inline const ElfW(Sym) *
  203. _dl_lookup_sysv_hash(struct elf_resolve *tpnt, ElfW(Sym) *symtab, unsigned long hash, const char* undef_name, int type_class)
  204. {
  205. unsigned long hn;
  206. char *strtab;
  207. const ElfW(Sym) *sym;
  208. Elf_Symndx symidx;
  209. /* Avoid calling .urem here. */
  210. do_rem(hn, hash, tpnt->nbucket);
  211. strtab = (char *) (tpnt->dynamic_info[DT_STRTAB]);
  212. _dl_assert(tpnt->elf_buckets != NULL);
  213. for (symidx = tpnt->elf_buckets[hn]; symidx != STN_UNDEF; symidx = tpnt->chains[symidx]) {
  214. sym = check_match (&symtab[symidx], strtab, undef_name, type_class);
  215. if (sym != NULL)
  216. /* At this point the symbol is that we are looking for */
  217. return sym;
  218. }
  219. /* No symbol found into the current module*/
  220. return NULL;
  221. }
  222. /*
  223. * This function resolves externals, and this is either called when we process
  224. * relocations or when we call an entry in the PLT table for the first time.
  225. */
  226. char *_dl_lookup_hash(const char *name, struct dyn_elf *rpnt,
  227. struct elf_resolve *mytpnt, int type_class
  228. #ifdef __FDPIC__
  229. , struct elf_resolve **tpntp
  230. #endif
  231. )
  232. {
  233. struct elf_resolve *tpnt = NULL;
  234. ElfW(Sym) *symtab;
  235. unsigned long elf_hash_number = 0xffffffff;
  236. const ElfW(Sym) *sym = NULL;
  237. const ElfW(Sym) *weak_sym = 0;
  238. struct elf_resolve *weak_tpnt = 0;
  239. #ifdef __LDSO_GNU_HASH_SUPPORT__
  240. unsigned long gnu_hash_number = _dl_gnu_hash((const unsigned char *)name);
  241. #endif
  242. for (; rpnt; rpnt = rpnt->next) {
  243. tpnt = rpnt->dyn;
  244. if (!(tpnt->rtld_flags & RTLD_GLOBAL) && mytpnt) {
  245. if (mytpnt == tpnt)
  246. ;
  247. else {
  248. struct init_fini_list *tmp;
  249. for (tmp = mytpnt->rtld_local; tmp; tmp = tmp->next) {
  250. if (tmp->tpnt == tpnt)
  251. break;
  252. }
  253. if (!tmp)
  254. continue;
  255. }
  256. }
  257. /* Don't search the executable when resolving a copy reloc. */
  258. if ((type_class & ELF_RTYPE_CLASS_COPY) && tpnt->libtype == elf_executable)
  259. continue;
  260. /* If the hash table is empty there is nothing to do here. */
  261. if (tpnt->nbucket == 0)
  262. continue;
  263. symtab = (ElfW(Sym) *) (intptr_t) (tpnt->dynamic_info[DT_SYMTAB]);
  264. #ifdef __LDSO_GNU_HASH_SUPPORT__
  265. /* Prefer GNU hash style, if any */
  266. if (tpnt->l_gnu_bitmask) {
  267. sym = _dl_lookup_gnu_hash(tpnt, symtab, gnu_hash_number, name, type_class);
  268. if (sym != NULL)
  269. /* If sym has been found, do not search further */
  270. break;
  271. } else {
  272. #endif
  273. /* Use the old SysV-style hash table */
  274. /* Calculate the old sysv hash number only once */
  275. if (elf_hash_number == 0xffffffff)
  276. elf_hash_number = _dl_elf_hash((const unsigned char *)name);
  277. sym = _dl_lookup_sysv_hash(tpnt, symtab, elf_hash_number, name, type_class);
  278. if (sym != NULL)
  279. break;
  280. #ifdef __LDSO_GNU_HASH_SUPPORT__
  281. }
  282. #endif
  283. } /* end of for (; rpnt; rpnt = rpnt->next) { */
  284. if (sym) {
  285. /* At this point we have found the requested symbol, do binding */
  286. switch (ELF_ST_BIND(sym->st_info)) {
  287. case STB_WEAK:
  288. #if 0
  289. /* Perhaps we should support old style weak symbol handling
  290. * per what glibc does when you export LD_DYNAMIC_WEAK */
  291. if (!weak_sym) {
  292. weak_tpnt = tpnt;
  293. weak_sym = sym;
  294. }
  295. break;
  296. #endif
  297. case STB_GLOBAL:
  298. #ifdef __FDPIC__
  299. if (tpntp)
  300. *tpntp = tpnt;
  301. #endif
  302. return (char *) DL_FIND_HASH_VALUE (tpnt, type_class, sym);
  303. default: /* Local symbols not handled here */
  304. break;
  305. }
  306. }
  307. if (weak_sym) {
  308. #ifdef __FDPIC__
  309. if (tpntp)
  310. *tpntp = weak_tpnt;
  311. #endif
  312. return (char *) DL_FIND_HASH_VALUE (weak_tpnt, type_class, weak_sym);
  313. }
  314. #ifdef __FDPIC__
  315. if (tpntp)
  316. *tpntp = NULL;
  317. #endif
  318. return NULL;
  319. }