use a dedicated futex object for pthread_join instead of tid field
[musl] / src / env / __init_tls.c
1 #include <elf.h>
2 #include <limits.h>
3 #include <sys/mman.h>
4 #include <string.h>
5 #include <stddef.h>
6 #include "pthread_impl.h"
7 #include "libc.h"
8 #include "atomic.h"
9 #include "syscall.h"
10
/*
 * Install p as the calling thread's thread pointer and initialize the
 * self, join_futex, tid, locale and robust_list fields of its descriptor.
 *
 * p: address of the thread's struct pthread.
 * Returns 0 on success, or -1 if __set_thread_area() returned a negative
 * value (in which case none of the later fields are touched).
 */
11 int __init_tp(void *p)
12 {
13         pthread_t td = p;
14         td->self = td;
15         int r = __set_thread_area(TP_ADJ(p));
16         if (r < 0) return -1;
           /* Only an exact 0 enables threads; a positive result leaves
            * libc.can_do_threads unchanged. NOTE(review): the meaning of a
            * positive return is defined by __set_thread_area -- confirm there. */
17         if (!r) libc.can_do_threads = 1;
           /* join_futex is the word registered with the kernel below. Per
            * set_tid_address(2) the kernel zeroes that word and futex-wakes it
            * when the thread exits, so it starts out nonzero here. */
18         td->join_futex = -1;
           /* The syscall's return value is stored as this thread's tid. */
19         td->tid = __syscall(SYS_set_tid_address, &td->join_futex);
20         td->locale = &libc.global_locale;
           /* Head points at itself -- presumably the empty-list representation
            * for the robust mutex list; verify against the robust_list users. */
21         td->robust_list.head = &td->robust_list.head;
22         return 0;
23 }
24
/*
 * Statically allocated fallback storage for the initial thread's TLS area;
 * static_init_tls() uses it whenever libc.tls_size fits in it.
 *
 * The leading char member forces pt to be placed at the first offset that
 * satisfies struct pthread's alignment, so offsetof(..., pt) -- exposed as
 * MIN_TLS_ALIGN -- equals that alignment requirement.
 */
25 static struct builtin_tls {
26         char c;
27         struct pthread pt;
28         void *space[16];
29 } builtin_tls[1];
30 #define MIN_TLS_ALIGN offsetof(struct builtin_tls, pt)
31
/* Module record for the main program's PT_TLS segment; filled in by
 * static_init_tls() and linked in as libc.tls_head when such a segment
 * exists. */
32 static struct tls_module main_tls;
33
/*
 * Lay out one thread's TLS area inside mem: the DTV, the struct pthread,
 * and a copy of the initial image of every module on libc.tls_head.
 *
 * mem: start of a buffer of libc.tls_size bytes. Only p->len bytes of each
 *      module are copied and nothing here zeroes the remainder, so the
 *      buffer is presumably expected to arrive zero-filled -- confirm with
 *      callers.
 * Returns the address of the struct pthread placed inside mem, with its
 * dtv and dtv_copy fields both pointing at the DTV.
 */
34 void *__copy_tls(unsigned char *mem)
35 {
36         pthread_t td;
37         struct tls_module *p;
38         size_t i;
39         void **dtv;
40
41 #ifdef TLS_ABOVE_TP
           /* The DTV occupies the last libc.tls_cnt+1 pointer slots of the
            * buffer. */
42         dtv = (void **)(mem + libc.tls_size) - (libc.tls_cnt + 1);
43
           /* Skip forward so that the end of struct pthread, where module data
            * begins, lands on a libc.tls_align boundary. The mask arithmetic
            * assumes tls_align is a power of two. */
44         mem += -((uintptr_t)mem + sizeof(struct pthread)) & (libc.tls_align-1);
45         td = (pthread_t)mem;
46         mem += sizeof(struct pthread);
47
           /* Module data sits above the descriptor at mem + offset; DTV slots
            * are numbered from 1 in list order. */
48         for (i=1, p=libc.tls_head; p; i++, p=p->next) {
49                 dtv[i] = mem + p->offset;
50                 memcpy(dtv[i], p->image, p->len);
51         }
52 #else
           /* The DTV sits at the very start of the buffer. */
53         dtv = (void **)mem;
54
           /* Place struct pthread at the top of the buffer, rounded down to a
            * libc.tls_align boundary (power-of-two alignment assumed). */
55         mem += libc.tls_size - sizeof(struct pthread);
56         mem -= (uintptr_t)mem & (libc.tls_align-1);
57         td = (pthread_t)mem;
58
           /* Module data sits below the descriptor at td - offset; DTV slots
            * are numbered from 1 in list order. */
59         for (i=1, p=libc.tls_head; p; i++, p=p->next) {
60                 dtv[i] = mem - p->offset;
61                 memcpy(dtv[i], p->image, p->len);
62         }
63 #endif
           /* Slot 0 carries the module count rather than an address. */
64         dtv[0] = (void *)libc.tls_cnt;
65         td->dtv = td->dtv_copy = dtv;
66         return td;
67 }
68
/* Select the ELF program header type matching the native word size:
 * a 32-bit unsigned long picks Elf32_Phdr, anything else Elf64_Phdr. */
69 #if ULONG_MAX == 0xffffffff
70 typedef Elf32_Phdr Phdr;
71 #else
72 typedef Elf64_Phdr Phdr;
73 #endif
74
/* Weak, hidden reference to the dynamic section. Being weak, it may be
 * absent, which is why static_init_tls() tests it for null before using
 * its address. */
75 __attribute__((__weak__, __visibility__("hidden")))
76 extern const size_t _DYNAMIC[];
77
/*
 * Set up thread-local storage for the initial thread.
 *
 * Scans the program headers named by the auxiliary vector for a PT_TLS
 * segment, records it in main_tls, derives libc.tls_align and
 * libc.tls_size, picks a buffer (builtin_tls if it is large enough,
 * otherwise an anonymous mapping), and hands the laid-out buffer to
 * __init_tp(). Crashes via a_crash() if __init_tp() fails.
 *
 * aux: auxiliary vector indexed by AT_* constant; AT_PHDR, AT_PHNUM and
 *      AT_PHENT are read.
 */
78 static void static_init_tls(size_t *aux)
79 {
80         unsigned char *p;
81         size_t n;
82         Phdr *phdr, *tls_phdr=0;
83         size_t base = 0;
84         void *mem;
85
           /* Step through AT_PHNUM headers of AT_PHENT bytes each. Both PT_PHDR
            * and PT_DYNAMIC give the load bias (runtime address minus link-time
            * p_vaddr); whichever is seen later overwrites the earlier value. */
86         for (p=(void *)aux[AT_PHDR],n=aux[AT_PHNUM]; n; n--,p+=aux[AT_PHENT]) {
87                 phdr = (void *)p;
88                 if (phdr->p_type == PT_PHDR)
89                         base = aux[AT_PHDR] - phdr->p_vaddr;
90                 if (phdr->p_type == PT_DYNAMIC && _DYNAMIC)
91                         base = (size_t)_DYNAMIC - phdr->p_vaddr;
92                 if (phdr->p_type == PT_TLS)
93                         tls_phdr = phdr;
94         }
95
           /* Without a PT_TLS header main_tls keeps its static zero
            * initialization and is not linked into libc.tls_head. */
96         if (tls_phdr) {
97                 main_tls.image = (void *)(base + tls_phdr->p_vaddr);
98                 main_tls.len = tls_phdr->p_filesz;
99                 main_tls.size = tls_phdr->p_memsz;
100                 main_tls.align = tls_phdr->p_align;
101                 libc.tls_cnt = 1;
102                 libc.tls_head = &main_tls;
103         }
104
           /* Pad size so that (image address + size) is a multiple of align.
            * With no TLS segment, align is 0 and the mask is all ones, but the
            * masked value is then 0, so size stays 0. */
105         main_tls.size += (-main_tls.size - (uintptr_t)main_tls.image)
106                 & (main_tls.align-1);
           /* Never align less strictly than struct pthread itself requires. */
107         if (main_tls.align < MIN_TLS_ALIGN) main_tls.align = MIN_TLS_ALIGN;
108 #ifndef TLS_ABOVE_TP
           /* In this layout __copy_tls() places module data at td - offset. */
109         main_tls.offset = main_tls.size;
110 #endif
111
112         libc.tls_align = main_tls.align;
           /* Two pointer slots (the DTV entries __copy_tls() uses for at most
            * one module), the descriptor, the module data, and one full
            * alignment unit of slack. Since + and - bind tighter than &, the
            * whole sum is rounded up to a multiple of MIN_TLS_ALIGN. */
113         libc.tls_size = 2*sizeof(void *) + sizeof(struct pthread)
114                 + main_tls.size + main_tls.align
115                 + MIN_TLS_ALIGN-1 & -MIN_TLS_ALIGN;
116
           /* The static buffer is too small: map anonymous memory with a raw
            * syscall, using SYS_mmap where SYS_mmap2 is not defined. */
117         if (libc.tls_size > sizeof builtin_tls) {
118 #ifndef SYS_mmap2
119 #define SYS_mmap2 SYS_mmap
120 #endif
121                 mem = (void *)__syscall(
122                         SYS_mmap2,
123                         0, libc.tls_size, PROT_READ|PROT_WRITE,
124                         MAP_ANONYMOUS|MAP_PRIVATE, -1, 0);
125                 /* -4095...-1 cast to void * will crash on dereference anyway,
126                  * so don't bloat the init code checking for error codes and
127                  * explicitly calling a_crash(). */
128         } else {
129                 mem = builtin_tls;
130         }
131
132         /* Failure to initialize thread pointer is always fatal. */
133         if (__init_tp(__copy_tls(mem)) < 0)
134                 a_crash();
135 }
136
/* Export static_init_tls under the name __init_tls as a weak alias.
 * NOTE(review): presumably weak so that another definition of __init_tls
 * (e.g. in the dynamic linker) can take precedence -- confirm. */
137 weak_alias(static_init_tls, __init_tls);