reintroduce hardening against partially-replaced allocator
[musl] / ldso / dynlink.c
1 #define _GNU_SOURCE
2 #include <stdio.h>
3 #include <stdlib.h>
4 #include <stdarg.h>
5 #include <stddef.h>
6 #include <string.h>
7 #include <unistd.h>
8 #include <stdint.h>
9 #include <elf.h>
10 #include <sys/mman.h>
11 #include <limits.h>
12 #include <fcntl.h>
13 #include <sys/stat.h>
14 #include <errno.h>
15 #include <link.h>
16 #include <setjmp.h>
17 #include <pthread.h>
18 #include <ctype.h>
19 #include <dlfcn.h>
20 #include "pthread_impl.h"
21 #include "libc.h"
22 #include "dynlink.h"
23
/* Diagnostic reporter taking a printf-style format string; it is
 * forward-declared here because it is used before its definition. */
static void error(const char *, ...);

/* For powers of two a and b, evaluates to the larger of the two. */
#define MAXP2(a,b) (-((-(a)) & (-(b))))
/* Round x up to the next multiple of y, where y is a power of two. */
#define ALIGN(x,y) (((x)+(y)-1) & -(y))
28
/* Debugger-facing state block; the address of the single instance is
 * exported through _dl_debug_addr.
 * NOTE(review): the field layout presumably mirrors the r_debug
 * rendezvous structure from <link.h> -- confirm before reordering. */
struct debug {
	int ver;
	void *head;
	void (*bp)(void);
	int state;
	void *base;
};
36
/* Argument record for a dynamically resolved TLS descriptor. do_relocs
 * stores the defining object's tls_id in args[0] and the symbol's TLS
 * value plus addend in args[1]; records are chained per object through
 * next (list head: dso->td_index). */
struct td_index {
	size_t args[2];
	struct td_index *next;
};
41
/* Per-object linker state. */
struct dso {
	/* Address-translation data consulted by laddr(): a segment load map
	 * on FDPIC, otherwise a single load base. The member not placed
	 * here is declared near the end of the struct, so both names exist
	 * in either configuration. */
#if DL_FDPIC
	struct fdpic_loadmap *loadmap;
#else
	unsigned char *base;
#endif
	char *name;
	size_t *dynv;		/* dynamic section; map_library sets it from PT_DYNAMIC's vaddr */
	struct dso *next, *prev;

	/* Program header table: location, entry count, entry size. */
	Phdr *phdr;
	int phnum;
	size_t phentsize;
	/* Tables read by the symbol lookup functions. */
	Sym *syms;		/* symbol table */
	Elf_Symndx *hashtab;	/* SysV hash table (used when ghashtab is null) */
	uint32_t *ghashtab;	/* GNU hash table, preferred by find_sym */
	int16_t *versym;	/* optional; entries < 0 are skipped by lookups */
	char *strings;		/* string table indexed by st_name */
	/* syms_next: next object in the search chain walked by find_sym.
	 * lazy_next: next object on the lazy_head list. */
	struct dso *syms_next, *lazy_next;
	/* Deferred relocations, three words each (offset, info, addend);
	 * lazy_cnt is the number of entries currently stored. */
	size_t *lazy, lazy_cnt;
	/* Mapping released by unmap_library when no load map is in use. */
	unsigned char *map;
	size_t map_len;
	dev_t dev;
	ino_t ino;
	char relocated;
	char constructed;
	char kernel_mapped;
	struct dso **deps, *needed_by;
	char *rpath_orig, *rpath;
	struct tls_module tls;
	size_t tls_id;
	/* Page-truncated bounds taken from PT_GNU_RELRO by map_library. */
	size_t relro_start, relro_end;
	void **new_dtv;
	unsigned char *new_tls;
	volatile int new_dtv_idx, new_tls_idx;
	struct td_index *td_index;	/* TLSDESC argument records allocated by do_relocs */
	struct dso *fini_next;
	char *shortname;
#if DL_FDPIC
	unsigned char *base;
#else
	struct fdpic_loadmap *loadmap;
#endif
	/* Function descriptor table, indexed like syms (see REL_FUNCDESC),
	 * and the GOT pointer stored into descriptors for this object. */
	struct funcdesc {
		void *addr;
		size_t *got;
	} *funcdescs;
	size_t *got;
	char buf[];
};
92
/* Result of a symbol lookup: the matching symbol and the object that
 * defines it. find_sym returns both members null when nothing matched. */
struct symdef {
	Sym *sym;
	struct dso *dso;
};
97
/* Routines defined outside this file. */
int __init_tp(void *);
void __init_libc(char **, char *);
void *__copy_tls(unsigned char *);

__attribute__((__visibility__("hidden")))
const char *__libc_get_version(void);

/* The leading char forces pt to the first suitably aligned offset, so
 * offsetof(struct builtin_tls, pt) equals the alignment of
 * struct pthread; MIN_TLS_ALIGN captures that value. */
static struct builtin_tls {
	char c;
	struct pthread pt;
	void *space[16];
} builtin_tls[1];
#define MIN_TLS_ALIGN offsetof(struct builtin_tls, pt)

#define ADDEND_LIMIT 4096
/* saved_addends holds the inline addends of ldso's own REL table;
 * apply_addends_to identifies the table they belong to (see do_relocs). */
static size_t *saved_addends, *apply_addends_to;

static struct dso ldso;
/* head: first object of the dso list and default start of symbol search.
 * lazy_head: list of objects that still have deferred relocations. */
static struct dso *head, *tail, *fini_head, *syms_tail, *lazy_head;
static char *env_path, *sys_path;
static unsigned long long gencnt;
/* When nonzero, relocation failures longjmp to *rtld_fail instead of
 * merely being reported (see do_relocs). */
static int runtime;
static int ldd_mode;
static int ldso_fail;
static int noload;
static jmp_buf *rtld_fail;
static pthread_rwlock_t lock;
static struct debug debug;
static struct tls_module *tls_tail;
static size_t tls_cnt, tls_offset, tls_align = MIN_TLS_ALIGN;
/* TLSDESC relocations against modules with tls_id >= static_tls_cnt are
 * resolved dynamically at runtime (see do_relocs). */
static size_t static_tls_cnt;
static pthread_mutex_t init_fini_lock = { ._m_type = PTHREAD_MUTEX_RECURSIVE };
static struct fdpic_loadmap *app_loadmap;
static struct fdpic_dummy_loadmap app_dummy_loadmap;
static struct dso *const nodeps_dummy;

struct debug *_dl_debug_addr = &debug;

/* NOTE(review): defined outside this view; presumably nonzero when the
 * application provides its own malloc -- confirm against the allocator. */
__attribute__((__visibility__("hidden")))
extern int __malloc_replaced;

/* Null-valued array start markers; the matching *_end symbols are weak
 * aliases of them (see the weak_alias lines below). */
__attribute__((__visibility__("hidden")))
void (*const __init_array_start)(void)=0, (*const __fini_array_start)(void)=0;

__attribute__((__visibility__("hidden")))
extern void (*const __init_array_end)(void), (*const __fini_array_end)(void);

weak_alias(__init_array_start, __init_array_end);
weak_alias(__fini_array_start, __fini_array_end);
147
/* File-local string comparison with strcmp semantics: returns the
 * difference of the first mismatching bytes, taken as unsigned char,
 * or 0 when the strings are equal. The macro below redirects every
 * later strcmp() use in this file to it. */
static int dl_strcmp(const char *l, const char *r)
{
	while (*l && *l == *r) {
		l++;
		r++;
	}
	return *(const unsigned char *)l - *(const unsigned char *)r;
}
#define strcmp(l,r) dl_strcmp(l,r)
154
/* Compute load address for a virtual address in a given dso.
 *
 * With FDPIC each segment may be loaded at an independent address, so
 * the load map is searched for the segment containing v; objects
 * without a load map, and all non-FDPIC targets, use a single base.
 * laddr_pg accepts any address within the page-rounded extent of a
 * segment. fpaddr yields a callable function pointer for v. */
#if DL_FDPIC
static void *laddr(const struct dso *p, size_t v)
{
	size_t seg = 0;
	if (!p->loadmap)
		return p->base + v;
	/* Relies on unsigned wraparound: a v below the segment start
	 * yields a huge difference and is rejected by the same test. */
	while (v - p->loadmap->segs[seg].p_vaddr >= p->loadmap->segs[seg].p_memsz)
		seg++;
	return (void *)(v - p->loadmap->segs[seg].p_vaddr + p->loadmap->segs[seg].addr);
}
static void *laddr_pg(const struct dso *p, size_t v)
{
	size_t seg = 0;
	size_t pgsz = PAGE_SIZE;
	if (!p->loadmap)
		return p->base + v;
	for (;;) {
		/* Page-rounded [lo, hi) extent of the candidate segment. */
		size_t lo = p->loadmap->segs[seg].p_vaddr;
		size_t hi = lo + p->loadmap->segs[seg].p_memsz;
		lo &= -pgsz;
		hi = (hi + pgsz-1) & -pgsz;
		if (v-lo < hi-lo)
			break;
		seg++;
	}
	return (void *)(v - p->loadmap->segs[seg].p_vaddr + p->loadmap->segs[seg].addr);
}
#define fpaddr(p, v) ((void (*)())&(struct funcdesc){ \
	laddr(p, v), (p)->got })
#else
#define laddr(p, v) (void *)((p)->base + (v))
#define laddr_pg(p, v) laddr(p, v)
#define fpaddr(p, v) ((void (*)())laddr(p, v))
#endif
186
/* Decode a zero-terminated vector of (tag, value) pairs into a table.
 *
 * v   - input pairs; the list ends at the first pair whose tag is 0.
 * a   - output table of cnt entries. a[tag] receives the value of every
 *       tag in [1, cnt); a[0] becomes a bitmask with bit `tag` set for
 *       each such tag that fits in an unsigned long.
 * cnt - number of entries in a.
 *
 * Tags outside [1, cnt) are ignored. Tags that are in range but not
 * representable in the a[0] bitmask are still stored in a[tag]; only
 * the mask bit is omitted, since shifting by the type width or more is
 * undefined. cnt == 0 writes nothing. */
static void decode_vec(size_t *v, size_t *a, size_t cnt)
{
	size_t i;
	for (i=0; i<cnt; i++) a[i] = 0;
	/* v[0] is nonzero inside the loop, so v[0]<cnt selects exactly
	 * the tags in [1, cnt) and stays false when cnt is 0. */
	for (; v[0]; v+=2) if (v[0]<cnt) {
		if (v[0] < 8*sizeof(long))
			a[0] |= 1UL<<v[0];
		a[v[0]] = v[1];
	}
}
196
/* Look up key in a zero-terminated vector of (tag, value) pairs.
 * On a match stores the paired value in *r and returns 1; returns 0,
 * leaving *r untouched, when the terminator is reached first. The key
 * is compared before the terminator test, so key 0 matches the
 * terminating pair itself. */
static int search_vec(size_t *v, size_t *r, size_t key)
{
	while (v[0] != key) {
		if (v[0] == 0)
			return 0;
		v += 2;
	}
	*r = v[1];
	return 1;
}
204
/* SysV ELF symbol hash of the NUL-terminated string s0.
 * The result is confined to the low 28 bits. */
static uint32_t sysv_hash(const char *s0)
{
	uint_fast32_t acc = 0;
	for (const unsigned char *p = (const void *)s0; *p; p++) {
		acc = (acc << 4) + *p;
		/* Fold bits 28..31 back into bits 4..7. */
		acc ^= (acc >> 24) & 0xf0;
	}
	return acc & 0xfffffff;
}
215
/* GNU-style symbol hash of the NUL-terminated string s0: starts at 5381
 * and computes h = h*33 + byte for each byte, truncated to 32 bits on
 * return. */
static uint32_t gnu_hash(const char *s0)
{
	const unsigned char *p = (const void *)s0;
	uint_fast32_t acc = 5381;
	while (*p) {
		acc = acc*33 + *p;
		p++;
	}
	return acc;
}
224
225 static Sym *sysv_lookup(const char *s, uint32_t h, struct dso *dso)
226 {
227         size_t i;
228         Sym *syms = dso->syms;
229         Elf_Symndx *hashtab = dso->hashtab;
230         char *strings = dso->strings;
231         for (i=hashtab[2+h%hashtab[0]]; i; i=hashtab[2+hashtab[0]+i]) {
232                 if ((!dso->versym || dso->versym[i] >= 0)
233                     && (!strcmp(s, strings+syms[i].st_name)))
234                         return syms+i;
235         }
236         return 0;
237 }
238
239 static Sym *gnu_lookup(uint32_t h1, uint32_t *hashtab, struct dso *dso, const char *s)
240 {
241         uint32_t nbuckets = hashtab[0];
242         uint32_t *buckets = hashtab + 4 + hashtab[2]*(sizeof(size_t)/4);
243         uint32_t i = buckets[h1 % nbuckets];
244
245         if (!i) return 0;
246
247         uint32_t *hashval = buckets + nbuckets + (i - hashtab[1]);
248
249         for (h1 |= 1; ; i++) {
250                 uint32_t h2 = *hashval++;
251                 if ((h1 == (h2|1)) && (!dso->versym || dso->versym[i] >= 0)
252                     && !strcmp(s, dso->strings + dso->syms[i].st_name))
253                         return dso->syms+i;
254                 if (h2 & 1) break;
255         }
256
257         return 0;
258 }
259
260 static Sym *gnu_lookup_filtered(uint32_t h1, uint32_t *hashtab, struct dso *dso, const char *s, uint32_t fofs, size_t fmask)
261 {
262         const size_t *bloomwords = (const void *)(hashtab+4);
263         size_t f = bloomwords[fofs & (hashtab[2]-1)];
264         if (!(f & fmask)) return 0;
265
266         f >>= (h1 >> hashtab[3]) % (8 * sizeof f);
267         if (!(f & 1)) return 0;
268
269         return gnu_lookup(h1, hashtab, dso, s);
270 }
271
272 #define OK_TYPES (1<<STT_NOTYPE | 1<<STT_OBJECT | 1<<STT_FUNC | 1<<STT_COMMON | 1<<STT_TLS)
273 #define OK_BINDS (1<<STB_GLOBAL | 1<<STB_WEAK | 1<<STB_GNU_UNIQUE)
274
275 #ifndef ARCH_SYM_REJECT_UND
276 #define ARCH_SYM_REJECT_UND(s) 0
277 #endif
278
279 static struct symdef find_sym(struct dso *dso, const char *s, int need_def)
280 {
281         uint32_t h = 0, gh = gnu_hash(s), gho = gh / (8*sizeof(size_t)), *ght;
282         size_t ghm = 1ul << gh % (8*sizeof(size_t));
283         struct symdef def = {0};
284         for (; dso; dso=dso->syms_next) {
285                 Sym *sym;
286                 if ((ght = dso->ghashtab)) {
287                         sym = gnu_lookup_filtered(gh, ght, dso, s, gho, ghm);
288                 } else {
289                         if (!h) h = sysv_hash(s);
290                         sym = sysv_lookup(s, h, dso);
291                 }
292                 if (!sym) continue;
293                 if (!sym->st_shndx)
294                         if (need_def || (sym->st_info&0xf) == STT_TLS
295                             || ARCH_SYM_REJECT_UND(sym))
296                                 continue;
297                 if (!sym->st_value)
298                         if ((sym->st_info&0xf) != STT_TLS)
299                                 continue;
300                 if (!(1<<(sym->st_info&0xf) & OK_TYPES)) continue;
301                 if (!(1<<(sym->st_info>>4) & OK_BINDS)) continue;
302                 def.sym = sym;
303                 def.dso = dso;
304                 break;
305         }
306         return def;
307 }
308
309 __attribute__((__visibility__("hidden")))
310 ptrdiff_t __tlsdesc_static(), __tlsdesc_dynamic();
311
312 static void do_relocs(struct dso *dso, size_t *rel, size_t rel_size, size_t stride)
313 {
314         unsigned char *base = dso->base;
315         Sym *syms = dso->syms;
316         char *strings = dso->strings;
317         Sym *sym;
318         const char *name;
319         void *ctx;
320         int type;
321         int sym_index;
322         struct symdef def;
323         size_t *reloc_addr;
324         size_t sym_val;
325         size_t tls_val;
326         size_t addend;
327         int skip_relative = 0, reuse_addends = 0, save_slot = 0;
328
329         if (dso == &ldso) {
330                 /* Only ldso's REL table needs addend saving/reuse. */
331                 if (rel == apply_addends_to)
332                         reuse_addends = 1;
333                 skip_relative = 1;
334         }
335
336         for (; rel_size; rel+=stride, rel_size-=stride*sizeof(size_t)) {
337                 if (skip_relative && IS_RELATIVE(rel[1], dso->syms)) continue;
338                 type = R_TYPE(rel[1]);
339                 if (type == REL_NONE) continue;
340                 reloc_addr = laddr(dso, rel[0]);
341
342                 if (stride > 2) {
343                         addend = rel[2];
344                 } else if (type==REL_GOT || type==REL_PLT|| type==REL_COPY) {
345                         addend = 0;
346                 } else if (reuse_addends) {
347                         /* Save original addend in stage 2 where the dso
348                          * chain consists of just ldso; otherwise read back
349                          * saved addend since the inline one was clobbered. */
350                         if (head==&ldso)
351                                 saved_addends[save_slot] = *reloc_addr;
352                         addend = saved_addends[save_slot++];
353                 } else {
354                         addend = *reloc_addr;
355                 }
356
357                 sym_index = R_SYM(rel[1]);
358                 if (sym_index) {
359                         sym = syms + sym_index;
360                         name = strings + sym->st_name;
361                         ctx = type==REL_COPY ? head->syms_next : head;
362                         def = (sym->st_info&0xf) == STT_SECTION
363                                 ? (struct symdef){ .dso = dso, .sym = sym }
364                                 : find_sym(ctx, name, type==REL_PLT);
365                         if (!def.sym && (sym->st_shndx != SHN_UNDEF
366                             || sym->st_info>>4 != STB_WEAK)) {
367                                 if (dso->lazy && (type==REL_PLT || type==REL_GOT)) {
368                                         dso->lazy[3*dso->lazy_cnt+0] = rel[0];
369                                         dso->lazy[3*dso->lazy_cnt+1] = rel[1];
370                                         dso->lazy[3*dso->lazy_cnt+2] = addend;
371                                         dso->lazy_cnt++;
372                                         continue;
373                                 }
374                                 error("Error relocating %s: %s: symbol not found",
375                                         dso->name, name);
376                                 if (runtime) longjmp(*rtld_fail, 1);
377                                 continue;
378                         }
379                 } else {
380                         sym = 0;
381                         def.sym = 0;
382                         def.dso = dso;
383                 }
384
385                 sym_val = def.sym ? (size_t)laddr(def.dso, def.sym->st_value) : 0;
386                 tls_val = def.sym ? def.sym->st_value : 0;
387
388                 switch(type) {
389                 case REL_NONE:
390                         break;
391                 case REL_OFFSET:
392                         addend -= (size_t)reloc_addr;
393                 case REL_SYMBOLIC:
394                 case REL_GOT:
395                 case REL_PLT:
396                         *reloc_addr = sym_val + addend;
397                         break;
398                 case REL_RELATIVE:
399                         *reloc_addr = (size_t)base + addend;
400                         break;
401                 case REL_SYM_OR_REL:
402                         if (sym) *reloc_addr = sym_val + addend;
403                         else *reloc_addr = (size_t)base + addend;
404                         break;
405                 case REL_COPY:
406                         memcpy(reloc_addr, (void *)sym_val, sym->st_size);
407                         break;
408                 case REL_OFFSET32:
409                         *(uint32_t *)reloc_addr = sym_val + addend
410                                 - (size_t)reloc_addr;
411                         break;
412                 case REL_FUNCDESC:
413                         *reloc_addr = def.sym ? (size_t)(def.dso->funcdescs
414                                 + (def.sym - def.dso->syms)) : 0;
415                         break;
416                 case REL_FUNCDESC_VAL:
417                         if ((sym->st_info&0xf) == STT_SECTION) *reloc_addr += sym_val;
418                         else *reloc_addr = sym_val;
419                         reloc_addr[1] = def.sym ? (size_t)def.dso->got : 0;
420                         break;
421                 case REL_DTPMOD:
422                         *reloc_addr = def.dso->tls_id;
423                         break;
424                 case REL_DTPOFF:
425                         *reloc_addr = tls_val + addend - DTP_OFFSET;
426                         break;
427 #ifdef TLS_ABOVE_TP
428                 case REL_TPOFF:
429                         *reloc_addr = tls_val + def.dso->tls.offset + TPOFF_K + addend;
430                         break;
431 #else
432                 case REL_TPOFF:
433                         *reloc_addr = tls_val - def.dso->tls.offset + addend;
434                         break;
435                 case REL_TPOFF_NEG:
436                         *reloc_addr = def.dso->tls.offset - tls_val + addend;
437                         break;
438 #endif
439                 case REL_TLSDESC:
440                         if (stride<3) addend = reloc_addr[1];
441                         if (runtime && def.dso->tls_id >= static_tls_cnt) {
442                                 struct td_index *new = malloc(sizeof *new);
443                                 if (!new) {
444                                         error(
445                                         "Error relocating %s: cannot allocate TLSDESC for %s",
446                                         dso->name, sym ? name : "(local)" );
447                                         longjmp(*rtld_fail, 1);
448                                 }
449                                 new->next = dso->td_index;
450                                 dso->td_index = new;
451                                 new->args[0] = def.dso->tls_id;
452                                 new->args[1] = tls_val + addend;
453                                 reloc_addr[0] = (size_t)__tlsdesc_dynamic;
454                                 reloc_addr[1] = (size_t)new;
455                         } else {
456                                 reloc_addr[0] = (size_t)__tlsdesc_static;
457 #ifdef TLS_ABOVE_TP
458                                 reloc_addr[1] = tls_val + def.dso->tls.offset
459                                         + TPOFF_K + addend;
460 #else
461                                 reloc_addr[1] = tls_val - def.dso->tls.offset
462                                         + addend;
463 #endif
464                         }
465                         break;
466                 default:
467                         error("Error relocating %s: unsupported relocation type %d",
468                                 dso->name, type);
469                         if (runtime) longjmp(*rtld_fail, 1);
470                         continue;
471                 }
472         }
473 }
474
475 static void redo_lazy_relocs()
476 {
477         struct dso *p = lazy_head, *next;
478         lazy_head = 0;
479         for (; p; p=next) {
480                 next = p->lazy_next;
481                 size_t size = p->lazy_cnt*3*sizeof(size_t);
482                 p->lazy_cnt = 0;
483                 do_relocs(p, p->lazy, size, 3);
484                 if (p->lazy_cnt) {
485                         p->lazy_next = lazy_head;
486                         lazy_head = p;
487                 } else {
488                         free(p->lazy);
489                         p->lazy = 0;
490                         p->lazy_next = 0;
491                 }
492         }
493 }
494
495 /* A huge hack: to make up for the wastefulness of shared libraries
496  * needing at least a page of dirty memory even if they have no global
497  * data, we reclaim the gaps at the beginning and end of writable maps
498  * and "donate" them to the heap. */
499
500 static void reclaim(struct dso *dso, size_t start, size_t end)
501 {
502         void __malloc_donate(char *, char *);
503         if (start >= dso->relro_start && start < dso->relro_end) start = dso->relro_end;
504         if (end   >= dso->relro_start && end   < dso->relro_end) end = dso->relro_start;
505         if (start >= end) return;
506         char *base = laddr_pg(dso, start);
507         __malloc_donate(base, base+(end-start));
508 }
509
510 static void reclaim_gaps(struct dso *dso)
511 {
512         Phdr *ph = dso->phdr;
513         size_t phcnt = dso->phnum;
514
515         for (; phcnt--; ph=(void *)((char *)ph+dso->phentsize)) {
516                 if (ph->p_type!=PT_LOAD) continue;
517                 if ((ph->p_flags&(PF_R|PF_W))!=(PF_R|PF_W)) continue;
518                 reclaim(dso, ph->p_vaddr & -PAGE_SIZE, ph->p_vaddr);
519                 reclaim(dso, ph->p_vaddr+ph->p_memsz,
520                         ph->p_vaddr+ph->p_memsz+PAGE_SIZE-1 & -PAGE_SIZE);
521         }
522 }
523
524 static void *mmap_fixed(void *p, size_t n, int prot, int flags, int fd, off_t off)
525 {
526         static int no_map_fixed;
527         char *q;
528         if (!no_map_fixed) {
529                 q = mmap(p, n, prot, flags|MAP_FIXED, fd, off);
530                 if (!DL_NOMMU_SUPPORT || q != MAP_FAILED || errno != EINVAL)
531                         return q;
532                 no_map_fixed = 1;
533         }
534         /* Fallbacks for MAP_FIXED failure on NOMMU kernels. */
535         if (flags & MAP_ANONYMOUS) {
536                 memset(p, 0, n);
537                 return p;
538         }
539         ssize_t r;
540         if (lseek(fd, off, SEEK_SET) < 0) return MAP_FAILED;
541         for (q=p; n; q+=r, off+=r, n-=r) {
542                 r = read(fd, q, n);
543                 if (r < 0 && errno != EINTR) return MAP_FAILED;
544                 if (!r) {
545                         memset(q, 0, n);
546                         break;
547                 }
548         }
549         return p;
550 }
551
552 static void unmap_library(struct dso *dso)
553 {
554         if (dso->loadmap) {
555                 size_t i;
556                 for (i=0; i<dso->loadmap->nsegs; i++) {
557                         if (!dso->loadmap->segs[i].p_memsz)
558                                 continue;
559                         munmap((void *)dso->loadmap->segs[i].addr,
560                                 dso->loadmap->segs[i].p_memsz);
561                 }
562                 free(dso->loadmap);
563         } else if (dso->map && dso->map_len) {
564                 munmap(dso->map, dso->map_len);
565         }
566 }
567
568 static void *map_library(int fd, struct dso *dso)
569 {
570         Ehdr buf[(896+sizeof(Ehdr))/sizeof(Ehdr)];
571         void *allocated_buf=0;
572         size_t phsize;
573         size_t addr_min=SIZE_MAX, addr_max=0, map_len;
574         size_t this_min, this_max;
575         size_t nsegs = 0;
576         off_t off_start;
577         Ehdr *eh;
578         Phdr *ph, *ph0;
579         unsigned prot;
580         unsigned char *map=MAP_FAILED, *base;
581         size_t dyn=0;
582         size_t tls_image=0;
583         size_t i;
584
585         ssize_t l = read(fd, buf, sizeof buf);
586         eh = buf;
587         if (l<0) return 0;
588         if (l<sizeof *eh || (eh->e_type != ET_DYN && eh->e_type != ET_EXEC))
589                 goto noexec;
590         phsize = eh->e_phentsize * eh->e_phnum;
591         if (phsize > sizeof buf - sizeof *eh) {
592                 allocated_buf = malloc(phsize);
593                 if (!allocated_buf) return 0;
594                 l = pread(fd, allocated_buf, phsize, eh->e_phoff);
595                 if (l < 0) goto error;
596                 if (l != phsize) goto noexec;
597                 ph = ph0 = allocated_buf;
598         } else if (eh->e_phoff + phsize > l) {
599                 l = pread(fd, buf+1, phsize, eh->e_phoff);
600                 if (l < 0) goto error;
601                 if (l != phsize) goto noexec;
602                 ph = ph0 = (void *)(buf + 1);
603         } else {
604                 ph = ph0 = (void *)((char *)buf + eh->e_phoff);
605         }
606         for (i=eh->e_phnum; i; i--, ph=(void *)((char *)ph+eh->e_phentsize)) {
607                 if (ph->p_type == PT_DYNAMIC) {
608                         dyn = ph->p_vaddr;
609                 } else if (ph->p_type == PT_TLS) {
610                         tls_image = ph->p_vaddr;
611                         dso->tls.align = ph->p_align;
612                         dso->tls.len = ph->p_filesz;
613                         dso->tls.size = ph->p_memsz;
614                 } else if (ph->p_type == PT_GNU_RELRO) {
615                         dso->relro_start = ph->p_vaddr & -PAGE_SIZE;
616                         dso->relro_end = (ph->p_vaddr + ph->p_memsz) & -PAGE_SIZE;
617                 }
618                 if (ph->p_type != PT_LOAD) continue;
619                 nsegs++;
620                 if (ph->p_vaddr < addr_min) {
621                         addr_min = ph->p_vaddr;
622                         off_start = ph->p_offset;
623                         prot = (((ph->p_flags&PF_R) ? PROT_READ : 0) |
624                                 ((ph->p_flags&PF_W) ? PROT_WRITE: 0) |
625                                 ((ph->p_flags&PF_X) ? PROT_EXEC : 0));
626                 }
627                 if (ph->p_vaddr+ph->p_memsz > addr_max) {
628                         addr_max = ph->p_vaddr+ph->p_memsz;
629                 }
630         }
631         if (!dyn) goto noexec;
632         if (DL_FDPIC && !(eh->e_flags & FDPIC_CONSTDISP_FLAG)) {
633                 dso->loadmap = calloc(1, sizeof *dso->loadmap
634                         + nsegs * sizeof *dso->loadmap->segs);
635                 if (!dso->loadmap) goto error;
636                 dso->loadmap->nsegs = nsegs;
637                 for (ph=ph0, i=0; i<nsegs; ph=(void *)((char *)ph+eh->e_phentsize)) {
638                         if (ph->p_type != PT_LOAD) continue;
639                         prot = (((ph->p_flags&PF_R) ? PROT_READ : 0) |
640                                 ((ph->p_flags&PF_W) ? PROT_WRITE: 0) |
641                                 ((ph->p_flags&PF_X) ? PROT_EXEC : 0));
642                         map = mmap(0, ph->p_memsz + (ph->p_vaddr & PAGE_SIZE-1),
643                                 prot, MAP_PRIVATE,
644                                 fd, ph->p_offset & -PAGE_SIZE);
645                         if (map == MAP_FAILED) {
646                                 unmap_library(dso);
647                                 goto error;
648                         }
649                         dso->loadmap->segs[i].addr = (size_t)map +
650                                 (ph->p_vaddr & PAGE_SIZE-1);
651                         dso->loadmap->segs[i].p_vaddr = ph->p_vaddr;
652                         dso->loadmap->segs[i].p_memsz = ph->p_memsz;
653                         i++;
654                         if (prot & PROT_WRITE) {
655                                 size_t brk = (ph->p_vaddr & PAGE_SIZE-1)
656                                         + ph->p_filesz;
657                                 size_t pgbrk = brk + PAGE_SIZE-1 & -PAGE_SIZE;
658                                 size_t pgend = brk + ph->p_memsz - ph->p_filesz
659                                         + PAGE_SIZE-1 & -PAGE_SIZE;
660                                 if (pgend > pgbrk && mmap_fixed(map+pgbrk,
661                                         pgend-pgbrk, prot,
662                                         MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS,
663                                         -1, off_start) == MAP_FAILED)
664                                         goto error;
665                                 memset(map + brk, 0, pgbrk-brk);
666                         }
667                 }
668                 map = (void *)dso->loadmap->segs[0].addr;
669                 map_len = 0;
670                 goto done_mapping;
671         }
672         addr_max += PAGE_SIZE-1;
673         addr_max &= -PAGE_SIZE;
674         addr_min &= -PAGE_SIZE;
675         off_start &= -PAGE_SIZE;
676         map_len = addr_max - addr_min + off_start;
677         /* The first time, we map too much, possibly even more than
678          * the length of the file. This is okay because we will not
679          * use the invalid part; we just need to reserve the right
680          * amount of virtual address space to map over later. */
681         map = DL_NOMMU_SUPPORT
682                 ? mmap((void *)addr_min, map_len, PROT_READ|PROT_WRITE|PROT_EXEC,
683                         MAP_PRIVATE|MAP_ANONYMOUS, -1, 0)
684                 : mmap((void *)addr_min, map_len, prot,
685                         MAP_PRIVATE, fd, off_start);
686         if (map==MAP_FAILED) goto error;
687         dso->map = map;
688         dso->map_len = map_len;
689         /* If the loaded file is not relocatable and the requested address is
690          * not available, then the load operation must fail. */
691         if (eh->e_type != ET_DYN && addr_min && map!=(void *)addr_min) {
692                 errno = EBUSY;
693                 goto error;
694         }
695         base = map - addr_min;
696         dso->phdr = 0;
697         dso->phnum = 0;
698         for (ph=ph0, i=eh->e_phnum; i; i--, ph=(void *)((char *)ph+eh->e_phentsize)) {
699                 if (ph->p_type != PT_LOAD) continue;
700                 /* Check if the programs headers are in this load segment, and
701                  * if so, record the address for use by dl_iterate_phdr. */
702                 if (!dso->phdr && eh->e_phoff >= ph->p_offset
703                     && eh->e_phoff+phsize <= ph->p_offset+ph->p_filesz) {
704                         dso->phdr = (void *)(base + ph->p_vaddr
705                                 + (eh->e_phoff-ph->p_offset));
706                         dso->phnum = eh->e_phnum;
707                         dso->phentsize = eh->e_phentsize;
708                 }
709                 /* Reuse the existing mapping for the lowest-address LOAD */
710                 if ((ph->p_vaddr & -PAGE_SIZE) == addr_min && !DL_NOMMU_SUPPORT)
711                         continue;
712                 this_min = ph->p_vaddr & -PAGE_SIZE;
713                 this_max = ph->p_vaddr+ph->p_memsz+PAGE_SIZE-1 & -PAGE_SIZE;
714                 off_start = ph->p_offset & -PAGE_SIZE;
715                 prot = (((ph->p_flags&PF_R) ? PROT_READ : 0) |
716                         ((ph->p_flags&PF_W) ? PROT_WRITE: 0) |
717                         ((ph->p_flags&PF_X) ? PROT_EXEC : 0));
718                 if (mmap_fixed(base+this_min, this_max-this_min, prot, MAP_PRIVATE|MAP_FIXED, fd, off_start) == MAP_FAILED)
719                         goto error;
720                 if (ph->p_memsz > ph->p_filesz) {
721                         size_t brk = (size_t)base+ph->p_vaddr+ph->p_filesz;
722                         size_t pgbrk = brk+PAGE_SIZE-1 & -PAGE_SIZE;
723                         memset((void *)brk, 0, pgbrk-brk & PAGE_SIZE-1);
724                         if (pgbrk-(size_t)base < this_max && mmap_fixed((void *)pgbrk, (size_t)base+this_max-pgbrk, prot, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) == MAP_FAILED)
725                                 goto error;
726                 }
727         }
728         for (i=0; ((size_t *)(base+dyn))[i]; i+=2)
729                 if (((size_t *)(base+dyn))[i]==DT_TEXTREL) {
730                         if (mprotect(map, map_len, PROT_READ|PROT_WRITE|PROT_EXEC)
731                             && errno != ENOSYS)
732                                 goto error;
733                         break;
734                 }
735 done_mapping:
736         dso->base = base;
737         dso->dynv = laddr(dso, dyn);
738         if (dso->tls.size) dso->tls.image = laddr(dso, tls_image);
739         free(allocated_buf);
740         return map;
741 noexec:
742         errno = ENOEXEC;
743 error:
744         if (map!=MAP_FAILED) unmap_library(dso);
745         free(allocated_buf);
746         return 0;
747 }
748
/* Search a list of directories for a file called name.
 *
 * s is a list of directory names separated by ':' or newline characters.
 * Each non-empty element is combined with name as "dir/name" in buf
 * (capacity buf_size) and opened read-only with close-on-exec set.
 * Candidates that do not fit in buf are skipped.
 *
 * Returns the open file descriptor on success, -1 when the list is
 * exhausted (or an element is too long to be passed as a precision),
 * and -2 when open fails for a reason other than ENOENT, ENOTDIR,
 * EACCES or ENAMETOOLONG. */
static int path_open(const char *name, const char *s, char *buf, size_t buf_size)
{
        for (;;) {
                size_t len;
                int fd;

                /* Step over separators, then measure the next element. */
                s += strspn(s, ":\n");
                len = strcspn(s, ":\n");

                /* A zero length wraps around to SIZE_MAX, so this one
                 * test also detects the end of the list. */
                if (len-1 >= INT_MAX) return -1;

                if (snprintf(buf, buf_size, "%.*s/%s", (int)len, s, name) < buf_size) {
                        fd = open(buf, O_RDONLY|O_CLOEXEC);
                        if (fd >= 0) return fd;
                        if (errno != ENOENT && errno != ENOTDIR
                            && errno != EACCES && errno != ENAMETOOLONG) {
                                /* Any negative value but -1 will inhibit
                                 * further path search. */
                                return -2;
                        }
                }
                s += len;
        }
}
774
775 static int fixup_rpath(struct dso *p, char *buf, size_t buf_size)
776 {
777         size_t n, l;
778         const char *s, *t, *origin;
779         char *d;
780         if (p->rpath || !p->rpath_orig) return 0;
781         if (!strchr(p->rpath_orig, '$')) {
782                 p->rpath = p->rpath_orig;
783                 return 0;
784         }
785         n = 0;
786         s = p->rpath_orig;
787         while ((t=strchr(s, '$'))) {
788                 if (strncmp(t, "$ORIGIN", 7) && strncmp(t, "${ORIGIN}", 9))
789                         return 0;
790                 s = t+1;
791                 n++;
792         }
793         if (n > SSIZE_MAX/PATH_MAX) return 0;
794
795         if (p->kernel_mapped) {
796                 /* $ORIGIN searches cannot be performed for the main program
797                  * when it is suid/sgid/AT_SECURE. This is because the
798                  * pathname is under the control of the caller of execve.
799                  * For libraries, however, $ORIGIN can be processed safely
800                  * since the library's pathname came from a trusted source
801                  * (either system paths or a call to dlopen). */
802                 if (libc.secure)
803                         return 0;
804                 l = readlink("/proc/self/exe", buf, buf_size);
805                 if (l == -1) switch (errno) {
806                 case ENOENT:
807                 case ENOTDIR:
808                 case EACCES:
809                         break;
810                 default:
811                         return -1;
812                 }
813                 if (l >= buf_size)
814                         return 0;
815                 buf[l] = 0;
816                 origin = buf;
817         } else {
818                 origin = p->name;
819         }
820         t = strrchr(origin, '/');
821         if (t) {
822                 l = t-origin;
823         } else {
824                 /* Normally p->name will always be an absolute or relative
825                  * pathname containing at least one '/' character, but in the
826                  * case where ldso was invoked as a command to execute a
827                  * program in the working directory, app.name may not. Fix. */
828                 origin = ".";
829                 l = 1;
830         }
831         /* Disallow non-absolute origins for suid/sgid/AT_SECURE. */
832         if (libc.secure && *origin != '/')
833                 return 0;
834         p->rpath = malloc(strlen(p->rpath_orig) + n*l + 1);
835         if (!p->rpath) return -1;
836
837         d = p->rpath;
838         s = p->rpath_orig;
839         while ((t=strchr(s, '$'))) {
840                 memcpy(d, s, t-s);
841                 d += t-s;
842                 memcpy(d, origin, l);
843                 d += l;
844                 /* It was determined previously that the '$' is followed
845                  * either by "ORIGIN" or "{ORIGIN}". */
846                 s = t + 7 + 2*(t[1]=='{');
847         }
848         strcpy(d, s);
849         return 0;
850 }
851
852 static void decode_dyn(struct dso *p)
853 {
854         size_t dyn[DYN_CNT];
855         decode_vec(p->dynv, dyn, DYN_CNT);
856         p->syms = laddr(p, dyn[DT_SYMTAB]);
857         p->strings = laddr(p, dyn[DT_STRTAB]);
858         if (dyn[0]&(1<<DT_HASH))
859                 p->hashtab = laddr(p, dyn[DT_HASH]);
860         if (dyn[0]&(1<<DT_RPATH))
861                 p->rpath_orig = p->strings + dyn[DT_RPATH];
862         if (dyn[0]&(1<<DT_RUNPATH))
863                 p->rpath_orig = p->strings + dyn[DT_RUNPATH];
864         if (dyn[0]&(1<<DT_PLTGOT))
865                 p->got = laddr(p, dyn[DT_PLTGOT]);
866         if (search_vec(p->dynv, dyn, DT_GNU_HASH))
867                 p->ghashtab = laddr(p, *dyn);
868         if (search_vec(p->dynv, dyn, DT_VERSYM))
869                 p->versym = laddr(p, *dyn);
870 }
871
872 static size_t count_syms(struct dso *p)
873 {
874         if (p->hashtab) return p->hashtab[1];
875
876         size_t nsym, i;
877         uint32_t *buckets = p->ghashtab + 4 + (p->ghashtab[2]*sizeof(size_t)/4);
878         uint32_t *hashval;
879         for (i = nsym = 0; i < p->ghashtab[0]; i++) {
880                 if (buckets[i] > nsym)
881                         nsym = buckets[i];
882         }
883         if (nsym) {
884                 hashval = buckets + p->ghashtab[0] + (nsym - p->ghashtab[1]);
885                 do nsym++;
886                 while (!(*hashval++ & 1));
887         }
888         return nsym;
889 }
890
891 static void *dl_mmap(size_t n)
892 {
893         void *p;
894         int prot = PROT_READ|PROT_WRITE, flags = MAP_ANONYMOUS|MAP_PRIVATE;
895 #ifdef SYS_mmap2
896         p = (void *)__syscall(SYS_mmap2, 0, n, prot, flags, -1, 0);
897 #else
898         p = (void *)__syscall(SYS_mmap, 0, n, prot, flags, -1, 0);
899 #endif
900         return p == MAP_FAILED ? 0 : p;
901 }
902
903 static void makefuncdescs(struct dso *p)
904 {
905         static int self_done;
906         size_t nsym = count_syms(p);
907         size_t i, size = nsym * sizeof(*p->funcdescs);
908
909         if (!self_done) {
910                 p->funcdescs = dl_mmap(size);
911                 self_done = 1;
912         } else {
913                 p->funcdescs = malloc(size);
914         }
915         if (!p->funcdescs) {
916                 if (!runtime) a_crash();
917                 error("Error allocating function descriptors for %s", p->name);
918                 longjmp(*rtld_fail, 1);
919         }
920         for (i=0; i<nsym; i++) {
921                 if ((p->syms[i].st_info&0xf)==STT_FUNC && p->syms[i].st_shndx) {
922                         p->funcdescs[i].addr = laddr(p, p->syms[i].st_value);
923                         p->funcdescs[i].got = p->got;
924                 } else {
925                         p->funcdescs[i].addr = 0;
926                         p->funcdescs[i].got = 0;
927                 }
928         }
929 }
930
/* Locate, map and register the shared library called name.
 *
 * name is either a pathname (it contains a '/') or a bare library name
 * that is searched for. needed_by is the object whose dependency is being
 * resolved (0 when there is none); it is recorded in the new dso and its
 * needed_by chain supplies the rpaths used by the search.
 *
 * Returns the dso for the library -- an existing entry when the short
 * name or the file's device/inode pair matches one already in the list --
 * or 0 on failure. Requests for one of the reserved libc component names,
 * or for ldso.name itself, resolve to &ldso without loading anything. */
931 static struct dso *load_library(const char *name, struct dso *needed_by)
932 {
933         char buf[2*NAME_MAX+2];
934         const char *pathname;
935         unsigned char *map;
936         struct dso *p, temp_dso = {0};
937         int fd;
938         struct stat st;
939         size_t alloc_size;
940         int n_th = 0;
941         int is_self = 0;
942
943         if (!*name) {
944                 errno = EINVAL;
945                 return 0;
946         }
947
948         /* Catch and block attempts to reload the implementation itself */
949         if (name[0]=='l' && name[1]=='i' && name[2]=='b') {
950                 static const char reserved[] =
951                         "c.pthread.rt.m.dl.util.xnet.";
952                 const char *rp, *next;
                     /* Each reserved entry is compared including its trailing
                      * '.', so "libc." matches but "libcfoo" does not. */
953                 for (rp=reserved; *rp; rp=next) {
954                         next = strchr(rp, '.') + 1;
955                         if (strncmp(name+3, rp, next-rp) == 0)
956                                 break;
957                 }
958                 if (*rp) {
959                         if (ldd_mode) {
960                                 /* Track which names have been resolved
961                                  * and only report each one once. */
962                                 static unsigned reported;
963                                 unsigned mask = 1U<<(rp-reserved);
964                                 if (!(reported & mask)) {
965                                         reported |= mask;
966                                         dprintf(1, "\t%s => %s (%p)\n",
967                                                 name, ldso.name,
968                                                 ldso.base);
969                                 }
970                         }
971                         is_self = 1;
972                 }
973         }
974         if (!strcmp(name, ldso.name)) is_self = 1;
975         if (is_self) {
                     /* Link ldso into the dso list the first time it is
                      * requested. */
976                 if (!ldso.prev) {
977                         tail->next = &ldso;
978                         ldso.prev = tail;
979                         tail = &ldso;
980                 }
981                 return &ldso;
982         }
983         if (strchr(name, '/')) {
984                 pathname = name;
985                 fd = open(name, O_RDONLY|O_CLOEXEC);
986         } else {
987                 /* Search for the name to see if it's already loaded */
988                 for (p=head->next; p; p=p->next) {
989                         if (p->shortname && !strcmp(p->shortname, name)) {
990                                 return p;
991                         }
992                 }
993                 if (strlen(name) > NAME_MAX) return 0;
                     /* Search order: env_path, then the rpath of needed_by and
                      * of each object further up its needed_by chain, then the
                      * system path. fd stays -1 while nothing has been found;
                      * any other negative value stops the search. */
994                 fd = -1;
995                 if (env_path) fd = path_open(name, env_path, buf, sizeof buf);
996                 for (p=needed_by; fd == -1 && p; p=p->needed_by) {
997                         if (fixup_rpath(p, buf, sizeof buf) < 0)
998                                 fd = -2; /* Inhibit further search. */
999                         if (p->rpath)
1000                                 fd = path_open(name, p->rpath, buf, sizeof buf);
1001                 }
1002                 if (fd == -1) {
1003                         if (!sys_path) {
1004                                 char *prefix = 0;
1005                                 size_t prefix_len;
1006                                 if (ldso.name[0]=='/') {
1007                                         char *s, *t, *z;
                                              /* After the loop t is the last '/'
                                               * and z the one before it, so the
                                               * prefix is ldso.name with its last
                                               * two path components removed. */
1008                                         for (s=t=z=ldso.name; *s; s++)
1009                                                 if (*s=='/') z=t, t=s;
1010                                         prefix_len = z-ldso.name;
1011                                         if (prefix_len < PATH_MAX)
1012                                                 prefix = ldso.name;
1013                                 }
1014                                 if (!prefix) {
1015                                         prefix = "";
1016                                         prefix_len = 0;
1017                                 }
1018                                 char etc_ldso_path[prefix_len + 1
1019                                         + sizeof "/etc/ld-musl-" LDSO_ARCH ".path"];
1020                                 snprintf(etc_ldso_path, sizeof etc_ldso_path,
1021                                         "%.*s/etc/ld-musl-" LDSO_ARCH ".path",
1022                                         (int)prefix_len, prefix);
1023                                 FILE *f = fopen(etc_ldso_path, "rbe");
1024                                 if (f) {
                                      /* Read up to the first null byte or EOF as
                                       * the search path; an empty result or a read
                                       * error yields an empty path. */
1025                                         if (getdelim(&sys_path, (size_t[1]){0}, 0, f) <= 0) {
1026                                                 free(sys_path);
1027                                                 sys_path = "";
1028                                         }
1029                                         fclose(f);
1030                                 } else if (errno != ENOENT) {
1031                                         sys_path = "";
1032                                 }
1033                         }
                             /* Only a missing path file falls back to the
                              * built-in default directories. */
1034                         if (!sys_path) sys_path = "/lib:/usr/local/lib:/usr/lib";
1035                         fd = path_open(name, sys_path, buf, sizeof buf);
1036                 }
1037                 pathname = buf;
1038         }
1039         if (fd < 0) return 0;
1040         if (fstat(fd, &st) < 0) {
1041                 close(fd);
1042                 return 0;
1043         }
             /* The same file may already be loaded under another name. */
1044         for (p=head->next; p; p=p->next) {
1045                 if (p->dev == st.st_dev && p->ino == st.st_ino) {
1046                         /* If this library was previously loaded with a
1047                          * pathname but a search found the same inode,
1048                          * setup its shortname so it can be found by name. */
1049                         if (!p->shortname && pathname != name)
1050                                 p->shortname = strrchr(p->name, '/')+1;
1051                         close(fd);
1052                         return p;
1053                 }
1054         }
             /* With noload set nothing new is mapped, so the lookup fails here. */
1055         map = noload ? 0 : map_library(fd, &temp_dso);
1056         close(fd);
1057         if (!map) return 0;
1058
1059         /* Avoid the danger of getting two versions of libc mapped into the
1060          * same process when an absolute pathname was used. The symbols
1061          * checked are chosen to catch both musl and glibc, and to avoid
1062          * false positives from interposition-hack libraries. */
1063         decode_dyn(&temp_dso);
1064         if (find_sym(&temp_dso, "__libc_start_main", 1).sym &&
1065             find_sym(&temp_dso, "stdin", 1).sym) {
1066                 unmap_library(&temp_dso);
1067                 return load_library("libc.so", needed_by);
1068         }
1069         /* Past this point, if we haven't reached runtime yet, ldso has
1070          * committed either to use the mapped library or to abort execution.
1071          * Unmapping is not possible, so we can safely reclaim gaps. */
1072         if (!runtime) reclaim_gaps(&temp_dso);
1073
1074         /* Allocate storage for the new DSO. When there is TLS, this
1075          * storage must include a reservation for all pre-existing
1076          * threads to obtain copies of both the new TLS, and an
1077          * extended DTV capable of storing an additional slot for
1078          * the newly-loaded DSO. */
1079         alloc_size = sizeof *p + strlen(pathname) + 1;
1080         if (runtime && temp_dso.tls.image) {
1081                 size_t per_th = temp_dso.tls.size + temp_dso.tls.align
1082                         + sizeof(void *) * (tls_cnt+3);
1083                 n_th = libc.threads_minus_1 + 1;
                     /* On overflow request SIZE_MAX bytes; the calloc failure
                      * path below then handles it. */
1084                 if (n_th > SSIZE_MAX / per_th) alloc_size = SIZE_MAX;
1085                 else alloc_size += n_th * per_th;
1086         }
1087         p = calloc(1, alloc_size);
1088         if (!p) {
1089                 unmap_library(&temp_dso);
1090                 return 0;
1091         }
1092         memcpy(p, &temp_dso, sizeof temp_dso);
1093         p->dev = st.st_dev;
1094         p->ino = st.st_ino;
1095         p->needed_by = needed_by;
1096         p->name = p->buf;
1097         strcpy(p->name, pathname);
1098         /* Add a shortname only if name arg was not an explicit pathname. */
1099         if (pathname != name) p->shortname = strrchr(p->name, '/')+1;
1100         if (p->tls.image) {
1101                 p->tls_id = ++tls_cnt;
1102                 tls_align = MAXP2(tls_align, p->tls.align);
1103 #ifdef TLS_ABOVE_TP
1104                 p->tls.offset = tls_offset + ( (tls_align-1) &
1105                         -(tls_offset + (uintptr_t)p->tls.image) );
1106                 tls_offset += p->tls.size;
1107 #else
1108                 tls_offset += p->tls.size + p->tls.align - 1;
1109                 tls_offset -= (tls_offset + (uintptr_t)p->tls.image)
1110                         & (p->tls.align-1);
1111                 p->tls.offset = tls_offset;
1112 #endif
                     /* The per-thread DTV and TLS reservations live in the same
                      * allocation, after the pathname string: new_dtv is the
                      * first size_t-aligned address past the string's
                      * terminator, and new_tls follows n_th DTVs of tls_cnt+1
                      * slots each. */
1113                 p->new_dtv = (void *)(-sizeof(size_t) &
1114                         (uintptr_t)(p->name+strlen(p->name)+sizeof(size_t)));
1115                 p->new_tls = (void *)(p->new_dtv + n_th*(tls_cnt+1));
1116                 if (tls_tail) tls_tail->next = &p->tls;
1117                 else libc.tls_head = &p->tls;
1118                 tls_tail = &p->tls;
1119         }
1120
             /* Append the new dso to the global list. */
1121         tail->next = p;
1122         p->prev = tail;
1123         tail = p;
1124
1125         if (DL_FDPIC) makefuncdescs(p);
1126
1127         if (ldd_mode) dprintf(1, "\t%s => %s (%p)\n", name, pathname, p->base);
1128
1129         return p;
1130 }
1131
1132 static void load_deps(struct dso *p)
1133 {
1134         size_t i, ndeps=0;
1135         struct dso ***deps = &p->deps, **tmp, *dep;
1136         for (; p; p=p->next) {
1137                 for (i=0; p->dynv[i]; i+=2) {
1138                         if (p->dynv[i] != DT_NEEDED) continue;
1139                         dep = load_library(p->strings + p->dynv[i+1], p);
1140                         if (!dep) {
1141                                 error("Error loading shared library %s: %m (needed by %s)",
1142                                         p->strings + p->dynv[i+1], p->name);
1143                                 if (runtime) longjmp(*rtld_fail, 1);
1144                                 continue;
1145                         }
1146                         if (runtime) {
1147                                 tmp = realloc(*deps, sizeof(*tmp)*(ndeps+2));
1148                                 if (!tmp) longjmp(*rtld_fail, 1);
1149                                 tmp[ndeps++] = dep;
1150                                 tmp[ndeps] = 0;
1151                                 *deps = tmp;
1152                         }
1153                 }
1154         }
1155         if (!*deps) *deps = (struct dso **)&nodeps_dummy;
1156 }
1157
/* Load each library named in s, a list whose entries are separated by
 * whitespace and/or ':' characters.
 *
 * The string is modified temporarily: each entry is null-terminated in
 * place for the load_library call and the overwritten byte is restored
 * afterwards. Results of load_library are ignored. */
static void load_preload(char *s)
{
        char *end = s;

        while (*end) {
                int saved;

                /* Skip leading separators. */
                while (*s && (isspace(*s) || *s==':')) s++;

                /* Find the end of this entry. */
                end = s;
                while (*end && !isspace(*end) && *end!=':') end++;

                saved = *end;
                *end = 0;
                load_library(s, 0);
                *end = saved;

                s = end;
        }
}
1171
1172 static void add_syms(struct dso *p)
1173 {
1174         if (!p->syms_next && syms_tail != p) {
1175                 syms_tail->syms_next = p;
1176                 syms_tail = p;
1177         }
1178 }
1179
1180 static void revert_syms(struct dso *old_tail)
1181 {
1182         struct dso *p, *next;
1183         /* Chop off the tail of the list of dsos that participate in
1184          * the global symbol table, reverting them to RTLD_LOCAL. */
1185         for (p=old_tail; p; p=next) {
1186                 next = p->syms_next;
1187                 p->syms_next = 0;
1188         }
1189         syms_tail = old_tail;
1190 }
1191
1192 static void do_mips_relocs(struct dso *p, size_t *got)
1193 {
1194         size_t i, j, rel[2];
1195         unsigned char *base = p->base;
1196         i=0; search_vec(p->dynv, &i, DT_MIPS_LOCAL_GOTNO);
1197         if (p==&ldso) {
1198                 got += i;
1199         } else {
1200                 while (i--) *got++ += (size_t)base;
1201         }
1202         j=0; search_vec(p->dynv, &j, DT_MIPS_GOTSYM);
1203         i=0; search_vec(p->dynv, &i, DT_MIPS_SYMTABNO);
1204         Sym *sym = p->syms + j;
1205         rel[0] = (unsigned char *)got - base;
1206         for (i-=j; i; i--, sym++, rel[0]+=sizeof(size_t)) {
1207                 rel[1] = R_INFO(sym-p->syms, R_MIPS_JUMP_SLOT);
1208                 do_relocs(p, rel, sizeof rel, 2);
1209         }
1210 }
1211
1212 static void reloc_all(struct dso *p)
1213 {
1214         size_t dyn[DYN_CNT];
1215         for (; p; p=p->next) {
1216                 if (p->relocated) continue;
1217                 decode_vec(p->dynv, dyn, DYN_CNT);
1218                 if (NEED_MIPS_GOT_RELOCS)
1219                         do_mips_relocs(p, laddr(p, dyn[DT_PLTGOT]));
1220                 do_relocs(p, laddr(p, dyn[DT_JMPREL]), dyn[DT_PLTRELSZ],
1221                         2+(dyn[DT_PLTREL]==DT_RELA));
1222                 do_relocs(p, laddr(p, dyn[DT_REL]), dyn[DT_RELSZ], 2);
1223                 do_relocs(p, laddr(p, dyn[DT_RELA]), dyn[DT_RELASZ], 3);
1224
1225                 if (head != &ldso && p->relro_start != p->relro_end &&
1226                     mprotect(laddr(p, p->relro_start), p->relro_end-p->relro_start, PROT_READ)
1227                     && errno != ENOSYS) {
1228                         error("Error relocating %s: RELRO protection failed: %m",
1229                                 p->name);
1230                         if (runtime) longjmp(*rtld_fail, 1);
1231                 }
1232
1233                 p->relocated = 1;
1234         }
1235 }
1236
1237 static void kernel_mapped_dso(struct dso *p)
1238 {
1239         size_t min_addr = -1, max_addr = 0, cnt;
1240         Phdr *ph = p->phdr;
1241         for (cnt = p->phnum; cnt--; ph = (void *)((char *)ph + p->phentsize)) {
1242                 if (ph->p_type == PT_DYNAMIC) {
1243                         p->dynv = laddr(p, ph->p_vaddr);
1244                 } else if (ph->p_type == PT_GNU_RELRO) {
1245                         p->relro_start = ph->p_vaddr & -PAGE_SIZE;
1246                         p->relro_end = (ph->p_vaddr + ph->p_memsz) & -PAGE_SIZE;
1247                 }
1248                 if (ph->p_type != PT_LOAD) continue;
1249                 if (ph->p_vaddr < min_addr)
1250                         min_addr = ph->p_vaddr;
1251                 if (ph->p_vaddr+ph->p_memsz > max_addr)
1252                         max_addr = ph->p_vaddr+ph->p_memsz;
1253         }
1254         min_addr &= -PAGE_SIZE;
1255         max_addr = (max_addr + PAGE_SIZE-1) & -PAGE_SIZE;
1256         p->map = p->base + min_addr;
1257         p->map_len = max_addr - min_addr;
1258         p->kernel_mapped = 1;
1259 }
1260
1261 void __libc_exit_fini()
1262 {
1263         struct dso *p;
1264         size_t dyn[DYN_CNT];
1265         for (p=fini_head; p; p=p->fini_next) {
1266                 if (!p->constructed) continue;
1267                 decode_vec(p->dynv, dyn, DYN_CNT);
1268                 if (dyn[0] & (1<<DT_FINI_ARRAY)) {
1269                         size_t n = dyn[DT_FINI_ARRAYSZ]/sizeof(size_t);
1270                         size_t *fn = (size_t *)laddr(p, dyn[DT_FINI_ARRAY])+n;
1271                         while (n--) ((void (*)(void))*--fn)();
1272                 }
1273 #ifndef NO_LEGACY_INITFINI
1274                 if ((dyn[0] & (1<<DT_FINI)) && dyn[DT_FINI])
1275                         fpaddr(p, dyn[DT_FINI])();
1276 #endif
1277         }
1278 }
1279
1280 static void do_init_fini(struct dso *p)
1281 {
1282         size_t dyn[DYN_CNT];
1283         int need_locking = libc.threads_minus_1;
1284         /* Allow recursive calls that arise when a library calls
1285          * dlopen from one of its constructors, but block any
1286          * other threads until all ctors have finished. */
1287         if (need_locking) pthread_mutex_lock(&init_fini_lock);
1288         for (; p; p=p->prev) {
1289                 if (p->constructed) continue;
1290                 p->constructed = 1;
1291                 decode_vec(p->dynv, dyn, DYN_CNT);
1292                 if (dyn[0] & ((1<<DT_FINI) | (1<<DT_FINI_ARRAY))) {
1293                         p->fini_next = fini_head;
1294                         fini_head = p;
1295                 }
1296 #ifndef NO_LEGACY_INITFINI
1297                 if ((dyn[0] & (1<<DT_INIT)) && dyn[DT_INIT])
1298                         fpaddr(p, dyn[DT_INIT])();
1299 #endif
1300                 if (dyn[0] & (1<<DT_INIT_ARRAY)) {
1301                         size_t n = dyn[DT_INIT_ARRAYSZ]/sizeof(size_t);
1302                         size_t *fn = laddr(p, dyn[DT_INIT_ARRAY]);
1303                         while (n--) ((void (*)(void))*fn++)();
1304                 }
1305                 if (!need_locking && libc.threads_minus_1) {
1306                         need_locking = 1;
1307                         pthread_mutex_lock(&init_fini_lock);
1308                 }
1309         }
1310         if (need_locking) pthread_mutex_unlock(&init_fini_lock);
1311 }
1312
1313 void __libc_start_init(void)
1314 {
1315         do_init_fini(tail);
1316 }
1317
/* Deliberately empty function, exported through the weak alias
 * _dl_debug_state.
 * NOTE(review): presumably this is the hook a debugger places a
 * breakpoint on to observe changes to the dso list -- confirm against
 * the code that fills in struct debug. */
static void dl_debug_state(void)
{
        /* Nothing to do. */
}

weak_alias(dl_debug_state, _dl_debug_state);
1323
/* Empty definition of __init_tls for this file; auxv is ignored.
 * NOTE(review): presumably TLS is set up by the dynamic linker's own
 * startup path instead -- confirm. */
void __init_tls(size_t *auxv)
{
        (void)auxv;
}
1327
/* Return the address for the TLS reference v in the calling thread, where
 * v[0] is the module's tls_id and v[1] the offset within its TLS block.
 *
 * If the thread's DTV already covers v[0], the stored pointer is used
 * directly. Otherwise the thread switches to a larger DTV taken from the
 * new_dtv area of the requested dso, and a TLS block is carved out of
 * new_tls for every dso up to the requested one that this thread has no
 * block for yet. Signals are blocked for the duration of the call. */
1328 __attribute__((__visibility__("hidden")))
1329 void *__tls_get_new(tls_mod_off_t *v)
1330 {
1331         pthread_t self = __pthread_self();
1332
1333         /* Block signals to make accessing new TLS async-signal-safe */
1334         sigset_t set;
1335         __block_all_sigs(&set);
             /* dtv[0] holds the number of module slots in this thread's DTV. */
1336         if (v[0]<=(size_t)self->dtv[0]) {
1337                 __restore_sigs(&set);
1338                 return (char *)self->dtv[v[0]]+v[1]+DTP_OFFSET;
1339         }
1340
1341         /* This is safe without any locks held because, if the caller
1342          * is able to request the Nth entry of the DTV, the DSO list
1343          * must be valid at least that far out and it was synchronized
1344          * at program startup or by an already-completed call to dlopen. */
1345         struct dso *p;
1346         for (p=head; p->tls_id != v[0]; p=p->next);
1347
1348         /* Get new DTV space from new DSO if needed */
             /* Always true here because of the early return above. Each
              * thread claims its own (v[0]+1)-slot DTV by atomically
              * incrementing new_dtv_idx. */
1349         if (v[0] > (size_t)self->dtv[0]) {
1350                 void **newdtv = p->new_dtv +
1351                         (v[0]+1)*a_fetch_add(&p->new_dtv_idx,1);
1352                 memcpy(newdtv, self->dtv,
1353                         ((size_t)self->dtv[0]+1) * sizeof(void *));
1354                 newdtv[0] = (void *)v[0];
1355                 self->dtv = self->dtv_copy = newdtv;
1356         }
1357
1358         /* Get new TLS memory from all new DSOs up to the requested one */
1359         unsigned char *mem;
1360         for (p=head; ; p=p->next) {
1361                 if (!p->tls_id || self->dtv[p->tls_id]) continue;
                     /* Claim the next size+align chunk of this dso's
                      * reservation, then advance mem so that it has the same
                      * alignment remainder as the TLS image. */
1362                 mem = p->new_tls + (p->tls.size + p->tls.align)
1363                         * a_fetch_add(&p->new_tls_idx,1);
1364                 mem += ((uintptr_t)p->tls.image - (uintptr_t)mem)
1365                         & (p->tls.align-1);
1366                 self->dtv[p->tls_id] = mem;
1367                 memcpy(mem, p->tls.image, p->tls.len);
1368                 if (p->tls_id == v[0]) break;
1369         }
1370         __restore_sigs(&set);
1371         return mem + v[1] + DTP_OFFSET;
1372 }
1373
1374 static void update_tls_size()
1375 {
1376         libc.tls_cnt = tls_cnt;
1377         libc.tls_align = tls_align;
1378         libc.tls_size = ALIGN(
1379                 (1+tls_cnt) * sizeof(void *) +
1380                 tls_offset +
1381                 sizeof(struct pthread) +
1382                 tls_align * 2,
1383         tls_align);
1384 }
1385
1386 /* Stage 1 of the dynamic linker is defined in dlstart.c. It calls the
1387  * following stage 2 and stage 3 functions via primitive symbolic lookup
1388  * since it does not have access to their addresses to begin with. */
1389
1390 /* Stage 2 of the dynamic linker is called after relative relocations 
1391  * have been processed. It can make function calls to static functions
1392  * and access string literals and static data, but cannot use extern
1393  * symbols. Its job is to perform symbolic relocations on the dynamic
1394  * linker itself, but some of the relocations performed may need to be
1395  * replaced later due to copy relocations in the main program. */
1396
/* Stage 2 entry point.
 *
 * base is the load address of the dynamic linker; it is used as
 * ldso.base except on FDPIC, where the base is derived from the loadmaps
 * found just below sp. sp is the initial stack pointer (sp[0] is argc)
 * and is passed on unchanged to stage 3.
 *
 * This function does not return to continue its own work: its last
 * action is to call __dls3, while the addends array is still live on
 * this stack frame. */
1397 __attribute__((__visibility__("hidden")))
1398 void __dls2(unsigned char *base, size_t *sp)
1399 {
1400         if (DL_FDPIC) {
1401                 void *p1 = (void *)sp[-2];
1402                 void *p2 = (void *)sp[-1];
1403                 if (!p1) {
1404                         size_t *auxv, aux[AUX_CNT];
                             /* Skip argc, argv[] and its terminator, then
                              * envp[] and its terminator, to reach auxv. */
1405                         for (auxv=sp+1+*sp+1; *auxv; auxv++); auxv++;
1406                         decode_vec(auxv, aux, AUX_CNT);
1407                         if (aux[AT_BASE]) ldso.base = (void *)aux[AT_BASE];
1408                         else ldso.base = (void *)(aux[AT_PHDR] & -4096);
1409                 }
                     /* With two loadmaps, p1 belongs to the application and p2
                      * to ldso; with only one, it is ldso's. */
1410                 app_loadmap = p2 ? p1 : 0;
1411                 ldso.loadmap = p2 ? p2 : p1;
1412                 ldso.base = laddr(&ldso, 0);
1413         } else {
1414                 ldso.base = base;
1415         }
1416         Ehdr *ehdr = (void *)ldso.base;
1417         ldso.name = ldso.shortname = "libc.so";
1418         ldso.phnum = ehdr->e_phnum;
1419         ldso.phdr = laddr(&ldso, ehdr->e_phoff);
1420         ldso.phentsize = ehdr->e_phentsize;
1421         kernel_mapped_dso(&ldso);
1422         decode_dyn(&ldso);
1423
1424         if (DL_FDPIC) makefuncdescs(&ldso);
1425
1426         /* Prepare storage to save clobbered REL addends so they
1427          * can be reused in stage 3. There should be very few. If
1428          * something goes wrong and there are a huge number, abort
1429          * instead of risking stack overflow. */
1430         size_t dyn[DYN_CNT];
1431         decode_vec(ldso.dynv, dyn, DYN_CNT);
1432         size_t *rel = laddr(&ldso, dyn[DT_REL]);
1433         size_t rel_size = dyn[DT_RELSZ];
1434         size_t symbolic_rel_cnt = 0;
1435         apply_addends_to = rel;
             /* Each REL entry is two words; count the non-relative ones. */
1436         for (; rel_size; rel+=2, rel_size-=2*sizeof(size_t))
1437                 if (!IS_RELATIVE(rel[1], ldso.syms)) symbolic_rel_cnt++;
1438         if (symbolic_rel_cnt >= ADDEND_LIMIT) a_crash();
1439         size_t addends[symbolic_rel_cnt+1];
1440         saved_addends = addends;
1441
1442         head = &ldso;
1443         reloc_all(&ldso);
1444
             /* Clear the flag so that ldso is relocated again later. */
1445         ldso.relocated = 0;
1446
1447         /* Call dynamic linker stage-3, __dls3, looking it up
1448          * symbolically as a barrier against moving the address
1449          * load across the above relocation processing. */
1450         struct symdef dls3_def = find_sym(&ldso, "__dls3", 0);
1451         if (DL_FDPIC) ((stage3_func)&ldso.funcdescs[dls3_def.sym-ldso.syms])(sp);
1452         else ((stage3_func)laddr(&ldso, dls3_def.sym->st_value))(sp);
1453 }
1454
1455 /* Stage 3 of the dynamic linker is called with the dynamic linker/libc
1456  * fully functional. Its job is to load (if not already loaded) and
1457  * process dependencies and relocations for the main application and
1458  * transfer control to its entry point. */
1459
1460 _Noreturn void __dls3(size_t *sp)
1461 {
1462         static struct dso app, vdso;
1463         size_t aux[AUX_CNT], *auxv;
1464         size_t i;
1465         char *env_preload=0;
1466         char *replace_argv0=0;
1467         size_t vdso_base;
1468         int argc = *sp;
1469         char **argv = (void *)(sp+1);
1470         char **argv_orig = argv;
1471         char **envp = argv+argc+1;
1472
1473         /* Find aux vector just past environ[] and use it to initialize
1474          * global data that may be needed before we can make syscalls. */
1475         __environ = envp;
1476         for (i=argc+1; argv[i]; i++);
1477         libc.auxv = auxv = (void *)(argv+i+1);
1478         decode_vec(auxv, aux, AUX_CNT);
1479         __hwcap = aux[AT_HWCAP];
1480         libc.page_size = aux[AT_PAGESZ];
1481         libc.secure = ((aux[0]&0x7800)!=0x7800 || aux[AT_UID]!=aux[AT_EUID]
1482                 || aux[AT_GID]!=aux[AT_EGID] || aux[AT_SECURE]);
1483
1484         /* Setup early thread pointer in builtin_tls for ldso/libc itself to
1485          * use during dynamic linking. If possible it will also serve as the
1486          * thread pointer at runtime. */
1487         libc.tls_size = sizeof builtin_tls;
1488         libc.tls_align = tls_align;
1489         if (__init_tp(__copy_tls((void *)builtin_tls)) < 0) {
1490                 a_crash();
1491         }
1492
1493         /* Only trust user/env if kernel says we're not suid/sgid */
1494         if (!libc.secure) {
1495                 env_path = getenv("LD_LIBRARY_PATH");
1496                 env_preload = getenv("LD_PRELOAD");
1497         }
1498
1499         /* If the main program was already loaded by the kernel,
1500          * AT_PHDR will point to some location other than the dynamic
1501          * linker's program headers. */
1502         if (aux[AT_PHDR] != (size_t)ldso.phdr) {
1503                 size_t interp_off = 0;
1504                 size_t tls_image = 0;
1505                 /* Find load address of the main program, via AT_PHDR vs PT_PHDR. */
1506                 Phdr *phdr = app.phdr = (void *)aux[AT_PHDR];
1507                 app.phnum = aux[AT_PHNUM];
1508                 app.phentsize = aux[AT_PHENT];
1509                 for (i=aux[AT_PHNUM]; i; i--, phdr=(void *)((char *)phdr + aux[AT_PHENT])) {
1510                         if (phdr->p_type == PT_PHDR)
1511                                 app.base = (void *)(aux[AT_PHDR] - phdr->p_vaddr);
1512                         else if (phdr->p_type == PT_INTERP)
1513                                 interp_off = (size_t)phdr->p_vaddr;
1514                         else if (phdr->p_type == PT_TLS) {
1515                                 tls_image = phdr->p_vaddr;
1516                                 app.tls.len = phdr->p_filesz;
1517                                 app.tls.size = phdr->p_memsz;
1518                                 app.tls.align = phdr->p_align;
1519                         }
1520                 }
1521                 if (DL_FDPIC) app.loadmap = app_loadmap;
1522                 if (app.tls.size) app.tls.image = laddr(&app, tls_image);
1523                 if (interp_off) ldso.name = laddr(&app, interp_off);
1524                 if ((aux[0] & (1UL<<AT_EXECFN))
1525                     && strncmp((char *)aux[AT_EXECFN], "/proc/", 6))
1526                         app.name = (char *)aux[AT_EXECFN];
1527                 else
1528                         app.name = argv[0];
1529                 kernel_mapped_dso(&app);
1530         } else {
1531                 int fd;
1532                 char *ldname = argv[0];
1533                 size_t l = strlen(ldname);
1534                 if (l >= 3 && !strcmp(ldname+l-3, "ldd")) ldd_mode = 1;
1535                 argv++;
1536                 while (argv[0] && argv[0][0]=='-' && argv[0][1]=='-') {
1537                         char *opt = argv[0]+2;
1538                         *argv++ = (void *)-1;
1539                         if (!*opt) {
1540                                 break;
1541                         } else if (!memcmp(opt, "list", 5)) {
1542                                 ldd_mode = 1;
1543                         } else if (!memcmp(opt, "library-path", 12)) {
1544                                 if (opt[12]=='=') env_path = opt+13;
1545                                 else if (opt[12]) *argv = 0;
1546                                 else if (*argv) env_path = *argv++;
1547                         } else if (!memcmp(opt, "preload", 7)) {
1548                                 if (opt[7]=='=') env_preload = opt+8;
1549                                 else if (opt[7]) *argv = 0;
1550                                 else if (*argv) env_preload = *argv++;
1551                         } else if (!memcmp(opt, "argv0", 5)) {
1552                                 if (opt[5]=='=') replace_argv0 = opt+6;
1553                                 else if (opt[5]) *argv = 0;
1554                                 else if (*argv) replace_argv0 = *argv++;
1555                         } else {
1556                                 argv[0] = 0;
1557                         }
1558                 }
1559                 argv[-1] = (void *)(argc - (argv-argv_orig));
1560                 if (!argv[0]) {
1561                         dprintf(2, "musl libc (" LDSO_ARCH ")\n"
1562                                 "Version %s\n"
1563                                 "Dynamic Program Loader\n"
1564                                 "Usage: %s [options] [--] pathname%s\n",
1565                                 __libc_get_version(), ldname,
1566                                 ldd_mode ? "" : " [args]");
1567                         _exit(1);
1568                 }
1569                 fd = open(argv[0], O_RDONLY);
1570                 if (fd < 0) {
1571                         dprintf(2, "%s: cannot load %s: %s\n", ldname, argv[0], strerror(errno));
1572                         _exit(1);
1573                 }
1574                 Ehdr *ehdr = (void *)map_library(fd, &app);
1575                 if (!ehdr) {
1576                         dprintf(2, "%s: %s: Not a valid dynamic program\n", ldname, argv[0]);
1577                         _exit(1);
1578                 }
1579                 close(fd);
1580                 ldso.name = ldname;
1581                 app.name = argv[0];
1582                 aux[AT_ENTRY] = (size_t)laddr(&app, ehdr->e_entry);
1583                 /* Find the name that would have been used for the dynamic
1584                  * linker had ldd not taken its place. */
1585                 if (ldd_mode) {
1586                         for (i=0; i<app.phnum; i++) {
1587                                 if (app.phdr[i].p_type == PT_INTERP)
1588                                         ldso.name = laddr(&app, app.phdr[i].p_vaddr);
1589                         }
1590                         dprintf(1, "\t%s (%p)\n", ldso.name, ldso.base);
1591                 }
1592         }
1593         if (app.tls.size) {
1594                 libc.tls_head = tls_tail = &app.tls;
1595                 app.tls_id = tls_cnt = 1;
1596 #ifdef TLS_ABOVE_TP
1597                 app.tls.offset = 0;
1598                 tls_offset = app.tls.size
1599                         + ( -((uintptr_t)app.tls.image + app.tls.size)
1600                         & (app.tls.align-1) );
1601 #else
1602                 tls_offset = app.tls.offset = app.tls.size
1603                         + ( -((uintptr_t)app.tls.image + app.tls.size)
1604                         & (app.tls.align-1) );
1605 #endif
1606                 tls_align = MAXP2(tls_align, app.tls.align);
1607         }
1608         decode_dyn(&app);
1609         if (DL_FDPIC) {
1610                 makefuncdescs(&app);
1611                 if (!app.loadmap) {
1612                         app.loadmap = (void *)&app_dummy_loadmap;
1613                         app.loadmap->nsegs = 1;
1614                         app.loadmap->segs[0].addr = (size_t)app.map;
1615                         app.loadmap->segs[0].p_vaddr = (size_t)app.map
1616                                 - (size_t)app.base;
1617                         app.loadmap->segs[0].p_memsz = app.map_len;
1618                 }
1619                 argv[-3] = (void *)app.loadmap;
1620         }
1621
1622         /* Initial dso chain consists only of the app. */
1623         head = tail = syms_tail = &app;
1624
1625         /* Donate unused parts of app and library mapping to malloc */
1626         reclaim_gaps(&app);
1627         reclaim_gaps(&ldso);
1628
1629         /* Load preload/needed libraries, add symbols to global namespace. */
1630         if (env_preload) load_preload(env_preload);
1631         load_deps(&app);
1632         for (struct dso *p=head; p; p=p->next)
1633                 add_syms(p);
1634
1635         /* Attach to vdso, if provided by the kernel, last so that it does
1636          * not become part of the global namespace.  */
1637         if (search_vec(auxv, &vdso_base, AT_SYSINFO_EHDR) && vdso_base) {
1638                 Ehdr *ehdr = (void *)vdso_base;
1639                 Phdr *phdr = vdso.phdr = (void *)(vdso_base + ehdr->e_phoff);
1640                 vdso.phnum = ehdr->e_phnum;
1641                 vdso.phentsize = ehdr->e_phentsize;
1642                 for (i=ehdr->e_phnum; i; i--, phdr=(void *)((char *)phdr + ehdr->e_phentsize)) {
1643                         if (phdr->p_type == PT_DYNAMIC)
1644                                 vdso.dynv = (void *)(vdso_base + phdr->p_offset);
1645                         if (phdr->p_type == PT_LOAD)
1646                                 vdso.base = (void *)(vdso_base - phdr->p_vaddr + phdr->p_offset);
1647                 }
1648                 vdso.name = "";
1649                 vdso.shortname = "linux-gate.so.1";
1650                 vdso.relocated = 1;
1651                 decode_dyn(&vdso);
1652                 vdso.prev = tail;
1653                 tail->next = &vdso;
1654                 tail = &vdso;
1655         }
1656
1657         for (i=0; app.dynv[i]; i+=2) {
1658                 if (!DT_DEBUG_INDIRECT && app.dynv[i]==DT_DEBUG)
1659                         app.dynv[i+1] = (size_t)&debug;
1660                 if (DT_DEBUG_INDIRECT && app.dynv[i]==DT_DEBUG_INDIRECT) {
1661                         size_t *ptr = (size_t *) app.dynv[i+1];
1662                         *ptr = (size_t)&debug;
1663                 }
1664         }
1665
1666         /* The main program must be relocated LAST since it may contain
1667          * copy relocations which depend on libraries' relocations. */
1668         reloc_all(app.next);
1669         reloc_all(&app);
1670
1671         update_tls_size();
1672         if (libc.tls_size > sizeof builtin_tls || tls_align > MIN_TLS_ALIGN) {
1673                 void *initial_tls = calloc(libc.tls_size, 1);
1674                 if (!initial_tls) {
1675                         dprintf(2, "%s: Error getting %zu bytes thread-local storage: %m\n",
1676                                 argv[0], libc.tls_size);
1677                         _exit(127);
1678                 }
1679                 if (__init_tp(__copy_tls(initial_tls)) < 0) {
1680                         a_crash();
1681                 }
1682         } else {
1683                 size_t tmp_tls_size = libc.tls_size;
1684                 pthread_t self = __pthread_self();
1685                 /* Temporarily set the tls size to the full size of
1686                  * builtin_tls so that __copy_tls will use the same layout
1687                  * as it did before. Then check, just to be safe. */
1688                 libc.tls_size = sizeof builtin_tls;
1689                 if (__copy_tls((void*)builtin_tls) != self) a_crash();
1690                 libc.tls_size = tmp_tls_size;
1691         }
1692         static_tls_cnt = tls_cnt;
1693
1694         if (ldso_fail) _exit(127);
1695         if (ldd_mode) _exit(0);
1696
1697         /* Determine if malloc was interposed by a replacement implementation
1698          * so that calloc and the memalign family can harden against the
1699          * possibility of incomplete replacement. */
1700         if (find_sym(head, "malloc", 1).dso != &ldso)
1701                 __malloc_replaced = 1;
1702
1703         /* Switch to runtime mode: any further failures in the dynamic
1704          * linker are a reportable failure rather than a fatal startup
1705          * error. */
1706         runtime = 1;
1707
1708         debug.ver = 1;
1709         debug.bp = dl_debug_state;
1710         debug.head = head;
1711         debug.base = ldso.base;
1712         debug.state = 0;
1713         _dl_debug_state();
1714
1715         if (replace_argv0) argv[0] = replace_argv0;
1716
1717         errno = 0;
1718
1719         CRTJMP((void *)aux[AT_ENTRY], argv-1);
1720         for(;;);
1721 }
1722
1723 static void prepare_lazy(struct dso *p)
1724 {
1725         size_t dyn[DYN_CNT], n, flags1=0;
1726         decode_vec(p->dynv, dyn, DYN_CNT);
1727         search_vec(p->dynv, &flags1, DT_FLAGS_1);
1728         if (dyn[DT_BIND_NOW] || (dyn[DT_FLAGS] & DF_BIND_NOW) || (flags1 & DF_1_NOW))
1729                 return;
1730         n = dyn[DT_RELSZ]/2 + dyn[DT_RELASZ]/3 + dyn[DT_PLTRELSZ]/2 + 1;
1731         if (NEED_MIPS_GOT_RELOCS) {
1732                 size_t j=0; search_vec(p->dynv, &j, DT_MIPS_GOTSYM);
1733                 size_t i=0; search_vec(p->dynv, &i, DT_MIPS_SYMTABNO);
1734                 n += i-j;
1735         }
1736         p->lazy = calloc(n, 3*sizeof(size_t));
1737         if (!p->lazy) {
1738                 error("Error preparing lazy relocation for %s: %m", p->name);
1739                 longjmp(*rtld_fail, 1);
1740         }
1741         p->lazy_next = lazy_head;
1742         lazy_head = p;
1743 }
1744
1745 void *dlopen(const char *file, int mode)
1746 {
1747         struct dso *volatile p, *orig_tail, *orig_syms_tail, *orig_lazy_head, *next;
1748         struct tls_module *orig_tls_tail;
1749         size_t orig_tls_cnt, orig_tls_offset, orig_tls_align;
1750         size_t i;
1751         int cs;
1752         jmp_buf jb;
1753
1754         if (!file) return head;
1755
1756         pthread_setcancelstate(PTHREAD_CANCEL_DISABLE, &cs);
1757         pthread_rwlock_wrlock(&lock);
1758         __inhibit_ptc();
1759
1760         p = 0;
1761         orig_tls_tail = tls_tail;
1762         orig_tls_cnt = tls_cnt;
1763         orig_tls_offset = tls_offset;
1764         orig_tls_align = tls_align;
1765         orig_lazy_head = lazy_head;
1766         orig_syms_tail = syms_tail;
1767         orig_tail = tail;
1768         noload = mode & RTLD_NOLOAD;
1769
1770         rtld_fail = &jb;
1771         if (setjmp(*rtld_fail)) {
1772                 /* Clean up anything new that was (partially) loaded */
1773                 revert_syms(orig_syms_tail);
1774                 for (p=orig_tail->next; p; p=next) {
1775                         next = p->next;
1776                         while (p->td_index) {
1777                                 void *tmp = p->td_index->next;
1778                                 free(p->td_index);
1779                                 p->td_index = tmp;
1780                         }
1781                         free(p->funcdescs);
1782                         if (p->rpath != p->rpath_orig)
1783                                 free(p->rpath);
1784                         if (p->deps != &nodeps_dummy)
1785                                 free(p->deps);
1786                         unmap_library(p);
1787                         free(p);
1788                 }
1789                 if (!orig_tls_tail) libc.tls_head = 0;
1790                 tls_tail = orig_tls_tail;
1791                 if (tls_tail) tls_tail->next = 0;
1792                 tls_cnt = orig_tls_cnt;
1793                 tls_offset = orig_tls_offset;
1794                 tls_align = orig_tls_align;
1795                 lazy_head = orig_lazy_head;
1796                 tail = orig_tail;
1797                 tail->next = 0;
1798                 p = 0;
1799                 goto end;
1800         } else p = load_library(file, head);
1801
1802         if (!p) {
1803                 error(noload ?
1804                         "Library %s is not already loaded" :
1805                         "Error loading shared library %s: %m",
1806                         file);
1807                 goto end;
1808         }
1809
1810         /* First load handling */
1811         int first_load = !p->deps;
1812         if (first_load) {
1813                 load_deps(p);
1814                 if (!p->relocated && (mode & RTLD_LAZY)) {
1815                         prepare_lazy(p);
1816                         for (i=0; p->deps[i]; i++)
1817                                 if (!p->deps[i]->relocated)
1818                                         prepare_lazy(p->deps[i]);
1819                 }
1820         }
1821         if (first_load || (mode & RTLD_GLOBAL)) {
1822                 /* Make new symbols global, at least temporarily, so we can do
1823                  * relocations. If not RTLD_GLOBAL, this is reverted below. */
1824                 add_syms(p);
1825                 for (i=0; p->deps[i]; i++)
1826                         add_syms(p->deps[i]);
1827         }
1828         if (first_load) {
1829                 reloc_all(p);
1830         }
1831
1832         /* If RTLD_GLOBAL was not specified, undo any new additions
1833          * to the global symbol table. This is a nop if the library was
1834          * previously loaded and already global. */
1835         if (!(mode & RTLD_GLOBAL))
1836                 revert_syms(orig_syms_tail);
1837
1838         /* Processing of deferred lazy relocations must not happen until
1839          * the new libraries are committed; otherwise we could end up with
1840          * relocations resolved to symbol definitions that get removed. */
1841         redo_lazy_relocs();
1842
1843         update_tls_size();
1844         _dl_debug_state();
1845         orig_tail = tail;
1846 end:
1847         __release_ptc();
1848         if (p) gencnt++;
1849         pthread_rwlock_unlock(&lock);
1850         if (p) do_init_fini(orig_tail);
1851         pthread_setcancelstate(cs, 0);
1852         return p;
1853 }
1854
1855 __attribute__((__visibility__("hidden")))
1856 int __dl_invalid_handle(void *h)
1857 {
1858         struct dso *p;
1859         for (p=head; p; p=p->next) if (h==p) return 0;
1860         error("Invalid library handle %p", (void *)h);
1861         return 1;
1862 }
1863
1864 static void *addr2dso(size_t a)
1865 {
1866         struct dso *p;
1867         size_t i;
1868         if (DL_FDPIC) for (p=head; p; p=p->next) {
1869                 i = count_syms(p);
1870                 if (a-(size_t)p->funcdescs < i*sizeof(*p->funcdescs))
1871                         return p;
1872         }
1873         for (p=head; p; p=p->next) {
1874                 if (DL_FDPIC && p->loadmap) {
1875                         for (i=0; i<p->loadmap->nsegs; i++) {
1876                                 if (a-p->loadmap->segs[i].p_vaddr
1877                                     < p->loadmap->segs[i].p_memsz)
1878                                         return p;
1879                         }
1880                 } else {
1881                         if (a-(size_t)p->map < p->map_len)
1882                                 return p;
1883                 }
1884         }
1885         return 0;
1886 }
1887
1888 void *__tls_get_addr(tls_mod_off_t *);
1889
1890 static void *do_dlsym(struct dso *p, const char *s, void *ra)
1891 {
1892         size_t i;
1893         uint32_t h = 0, gh = 0, *ght;
1894         Sym *sym;
1895         if (p == head || p == RTLD_DEFAULT || p == RTLD_NEXT) {
1896                 if (p == RTLD_DEFAULT) {
1897                         p = head;
1898                 } else if (p == RTLD_NEXT) {
1899                         p = addr2dso((size_t)ra);
1900                         if (!p) p=head;
1901                         p = p->next;
1902                 }
1903                 struct symdef def = find_sym(p, s, 0);
1904                 if (!def.sym) goto failed;
1905                 if ((def.sym->st_info&0xf) == STT_TLS)
1906                         return __tls_get_addr((tls_mod_off_t []){def.dso->tls_id, def.sym->st_value});
1907                 if (DL_FDPIC && (def.sym->st_info&0xf) == STT_FUNC)
1908                         return def.dso->funcdescs + (def.sym - def.dso->syms);
1909                 return laddr(def.dso, def.sym->st_value);
1910         }
1911         if (__dl_invalid_handle(p))
1912                 return 0;
1913         if ((ght = p->ghashtab)) {
1914                 gh = gnu_hash(s);
1915                 sym = gnu_lookup(gh, ght, p, s);
1916         } else {
1917                 h = sysv_hash(s);
1918                 sym = sysv_lookup(s, h, p);
1919         }
1920         if (sym && (sym->st_info&0xf) == STT_TLS)
1921                 return __tls_get_addr((tls_mod_off_t []){p->tls_id, sym->st_value});
1922         if (DL_FDPIC && sym && sym->st_shndx && (sym->st_info&0xf) == STT_FUNC)
1923                 return p->funcdescs + (sym - p->syms);
1924         if (sym && sym->st_value && (1<<(sym->st_info&0xf) & OK_TYPES))
1925                 return laddr(p, sym->st_value);
1926         for (i=0; p->deps[i]; i++) {
1927                 if ((ght = p->deps[i]->ghashtab)) {
1928                         if (!gh) gh = gnu_hash(s);
1929                         sym = gnu_lookup(gh, ght, p->deps[i], s);
1930                 } else {
1931                         if (!h) h = sysv_hash(s);
1932                         sym = sysv_lookup(s, h, p->deps[i]);
1933                 }
1934                 if (sym && (sym->st_info&0xf) == STT_TLS)
1935                         return __tls_get_addr((tls_mod_off_t []){p->deps[i]->tls_id, sym->st_value});
1936                 if (DL_FDPIC && sym && sym->st_shndx && (sym->st_info&0xf) == STT_FUNC)
1937                         return p->deps[i]->funcdescs + (sym - p->deps[i]->syms);
1938                 if (sym && sym->st_value && (1<<(sym->st_info&0xf) & OK_TYPES))
1939                         return laddr(p->deps[i], sym->st_value);
1940         }
1941 failed:
1942         error("Symbol not found: %s", s);
1943         return 0;
1944 }
1945
1946 int dladdr(const void *addr, Dl_info *info)
1947 {
1948         struct dso *p;
1949         Sym *sym, *bestsym;
1950         uint32_t nsym;
1951         char *strings;
1952         void *best = 0;
1953
1954         pthread_rwlock_rdlock(&lock);
1955         p = addr2dso((size_t)addr);
1956         pthread_rwlock_unlock(&lock);
1957
1958         if (!p) return 0;
1959
1960         sym = p->syms;
1961         strings = p->strings;
1962         nsym = count_syms(p);
1963
1964         if (DL_FDPIC) {
1965                 size_t idx = ((size_t)addr-(size_t)p->funcdescs)
1966                         / sizeof(*p->funcdescs);
1967                 if (idx < nsym && (sym[idx].st_info&0xf) == STT_FUNC) {
1968                         best = p->funcdescs + idx;
1969                         bestsym = sym + idx;
1970                 }
1971         }
1972
1973         if (!best) for (; nsym; nsym--, sym++) {
1974                 if (sym->st_value
1975                  && (1<<(sym->st_info&0xf) & OK_TYPES)
1976                  && (1<<(sym->st_info>>4) & OK_BINDS)) {
1977                         void *symaddr = laddr(p, sym->st_value);
1978                         if (symaddr > addr || symaddr < best)
1979                                 continue;
1980                         best = symaddr;
1981                         bestsym = sym;
1982                         if (addr == symaddr)
1983                                 break;
1984                 }
1985         }
1986
1987         if (!best) return 0;
1988
1989         if (DL_FDPIC && (bestsym->st_info&0xf) == STT_FUNC)
1990                 best = p->funcdescs + (bestsym - p->syms);
1991
1992         info->dli_fname = p->name;
1993         info->dli_fbase = p->map;
1994         info->dli_sname = strings + bestsym->st_name;
1995         info->dli_saddr = best;
1996
1997         return 1;
1998 }
1999
2000 __attribute__((__visibility__("hidden")))
2001 void *__dlsym(void *restrict p, const char *restrict s, void *restrict ra)
2002 {
2003         void *res;
2004         pthread_rwlock_rdlock(&lock);
2005         res = do_dlsym(p, s, ra);
2006         pthread_rwlock_unlock(&lock);
2007         return res;
2008 }
2009
2010 int dl_iterate_phdr(int(*callback)(struct dl_phdr_info *info, size_t size, void *data), void *data)
2011 {
2012         struct dso *current;
2013         struct dl_phdr_info info;
2014         int ret = 0;
2015         for(current = head; current;) {
2016                 info.dlpi_addr      = (uintptr_t)current->base;
2017                 info.dlpi_name      = current->name;
2018                 info.dlpi_phdr      = current->phdr;
2019                 info.dlpi_phnum     = current->phnum;
2020                 info.dlpi_adds      = gencnt;
2021                 info.dlpi_subs      = 0;
2022                 info.dlpi_tls_modid = current->tls_id;
2023                 info.dlpi_tls_data  = current->tls.image;
2024
2025                 ret = (callback)(&info, sizeof (info), data);
2026
2027                 if (ret != 0) break;
2028
2029                 pthread_rwlock_rdlock(&lock);
2030                 current = current->next;
2031                 pthread_rwlock_unlock(&lock);
2032         }
2033         return ret;
2034 }
2035
2036 __attribute__((__visibility__("hidden")))
2037 void __dl_vseterr(const char *, va_list);
2038
2039 static void error(const char *fmt, ...)
2040 {
2041         va_list ap;
2042         va_start(ap, fmt);
2043         if (!runtime) {
2044                 vdprintf(2, fmt, ap);
2045                 dprintf(2, "\n");
2046                 ldso_fail = 1;
2047                 va_end(ap);
2048                 return;
2049         }
2050         __dl_vseterr(fmt, ap);
2051         va_end(ap);
2052 }