pthread_create.c 6.3 KB
Newer Older
R
Rich Felker 已提交
1 2
#include "pthread_impl.h"

3 4 5 6
static void dummy_1(pthread_t self)
{
}
weak_alias(dummy_1, __pthread_tsd_run_dtors);
7
weak_alias(dummy_1, __sigtimer_handler);
8

9 10 11 12 13
#ifdef __pthread_unwind_next
#undef __pthread_unwind_next
#define __pthread_unwind_next __pthread_unwind_next_3
#endif

14 15 16 17 18 19 20 21 22 23
void __pthread_unwind_next(struct __ptcb *cb)
{
	pthread_t self;

	if (cb->__next) longjmp((void *)cb->__next->__jb, 1);

	self = pthread_self();

	LOCK(&self->exitlock);

24
	__pthread_tsd_run_dtors(self);
25

26 27
	/* Mark this thread dead before decrementing count */
	self->dead = 1;
28

29 30 31
	if (!a_fetch_add(&libc.threads_minus_1, -1))
		exit(0);

32
	if (self->detached && self->map_base) {
33
		syscall(__NR_rt_sigprocmask, SIG_BLOCK, (long)(uint64_t[1]){-1},0,8);
34
		__unmapself(self->map_base, self->map_size);
35
	}
36

37
	syscall(SYS_exit, 0);
38
}
R
Rich Felker 已提交
39 40 41 42

static void docancel(struct pthread *self)
{
	struct __ptcb cb = { .__next = self->cancelbuf };
43 44
	self->canceldisable = 1;
	self->cancelasync = 0;
R
Rich Felker 已提交
45 46 47 48 49
	__pthread_unwind_next(&cb);
}

static void cancel_handler(int sig, siginfo_t *si, void *ctx)
{
50
	struct pthread *self = __pthread_self();
51 52 53
	if (si->si_code == SI_TIMER) __sigtimer_handler(self);
	if (self->cancel && !self->canceldisable &&
	    (self->cancelasync || (self->cancelpoint==1 && PC_AT_SYS(ctx))))
54
		docancel(self);
R
Rich Felker 已提交
55 56
}

57 58 59 60
static void cancelpt(int x)
{
	struct pthread *self = __pthread_self();
	if (self->canceldisable) return;
61 62
	if ((self->cancelpoint+=x)==1 && x>=0 && self->cancel)
		docancel(self);
63 64
}

R
Rich Felker 已提交
65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80
/* "rsyscall" is a mechanism by which a thread can synchronously force all
 * other threads to perform an arbitrary syscall. It is necessary to work
 * around the non-conformant implementation of setuid() et al on Linux,
 * which affect only the calling thread and not the whole process. This
 * implementation performs some tricks with signal delivery to work around
 * the fact that it does not keep any list of threads in userspace. */

static struct {
	volatile int lock, hold, blocks, cnt;
	unsigned long arg[6];
	int nr;
	int err;
} rs;

static void rsyscall_handler(int sig, siginfo_t *si, void *ctx)
{
81 82 83 84
	struct pthread *self = __pthread_self();

	if (si->si_code > 0 || si->si_pid != self->pid ||
		rs.cnt == libc.threads_minus_1) return;
85

86 87 88 89 90 91
	/* Threads which have already decremented themselves from the
	 * thread count must not increment rs.cnt or otherwise act. */
	if (self->dead) {
		__wait(&rs.hold, 0, 1, 1);
		return;
	}
R
Rich Felker 已提交
92

93
	if (syscall(rs.nr, rs.arg[0], rs.arg[1], rs.arg[2],
R
Rich Felker 已提交
94 95 96 97 98 99 100 101 102 103 104 105 106 107
		rs.arg[3], rs.arg[4], rs.arg[5]) < 0 && !rs.err) rs.err=errno;

	a_inc(&rs.cnt);
	__wake(&rs.cnt, 1, 1);
	while(rs.hold)
		__wait(&rs.hold, 0, 1, 1);
	a_dec(&rs.cnt);
	if (!rs.cnt) __wake(&rs.cnt, 1, 1);
}

static int rsyscall(int nr, long a, long b, long c, long d, long e, long f)
{
	int i, ret;
	sigset_t set = { 0 };
108
	struct pthread *self = __pthread_self();
R
Rich Felker 已提交
109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141
	sigaddset(&set, SIGSYSCALL);

	LOCK(&rs.lock);
	while ((i=rs.blocks))
		__wait(&rs.blocks, 0, i, 1);

	__libc_sigprocmask(SIG_BLOCK, &set, 0);

	rs.nr = nr;
	rs.arg[0] = a; rs.arg[1] = b;
	rs.arg[2] = c; rs.arg[3] = d;
	rs.arg[4] = d; rs.arg[5] = f;
	rs.hold = 1;
	rs.err = 0;
	rs.cnt = 0;

	/* Dispatch signals until all threads respond */
	for (i=libc.threads_minus_1; i; i--)
		sigqueue(self->pid, SIGSYSCALL, (union sigval){0});
	while ((i=rs.cnt) < libc.threads_minus_1) {
		sigqueue(self->pid, SIGSYSCALL, (union sigval){0});
		__wait(&rs.cnt, 0, i, 1);
	}

	/* Handle any lingering signals with no-op */
	__libc_sigprocmask(SIG_UNBLOCK, &set, 0);

	/* Resume other threads' signal handlers and wait for them */
	rs.hold = 0;
	__wake(&rs.hold, -1, 0);
	while((i=rs.cnt)) __wait(&rs.cnt, 0, i, 1);

	if (rs.err) errno = rs.err, ret = -1;
142
	else ret = syscall(nr, a, b, c, d, e, f);
R
Rich Felker 已提交
143 144 145 146 147 148 149 150 151

	UNLOCK(&rs.lock);
	return ret;
}

static void init_threads()
{
	struct sigaction sa = { .sa_flags = SA_SIGINFO | SA_RESTART };
	libc.lock = __lock;
152
	libc.lockfile = __lockfile;
R
Rich Felker 已提交
153 154 155 156 157 158 159 160 161 162 163 164 165 166
	libc.cancelpt = cancelpt;
	libc.rsyscall = rsyscall;
	sa.sa_sigaction = cancel_handler;
	__libc_sigaction(SIGCANCEL, &sa, 0);
	sigaddset(&sa.sa_mask, SIGSYSCALL);
	sigaddset(&sa.sa_mask, SIGCANCEL);
	sa.sa_sigaction = rsyscall_handler;
	__libc_sigaction(SIGSYSCALL, &sa, 0);
	sigprocmask(SIG_UNBLOCK, &sa.sa_mask, 0);
}

static int start(void *p)
{
	struct pthread *self = p;
167 168 169 170 171 172
	if (self->unblock_cancel) {
		sigset_t set;
		sigemptyset(&set);
		sigaddset(&set, SIGCANCEL);
		__libc_sigprocmask(SIG_UNBLOCK, &set, 0);
	}
R
Rich Felker 已提交
173 174 175 176
	pthread_exit(self->start(self->start_arg));
	return 0;
}

177
int __uniclone(void *, int (*)(), void *);
R
Rich Felker 已提交
178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197

#define ROUND(x) (((x)+PAGE_SIZE-1)&-PAGE_SIZE)

/* pthread_key_create.c overrides this */
static const size_t dummy = 0;
weak_alias(dummy, __pthread_tsd_size);

int pthread_create(pthread_t *res, const pthread_attr_t *attr, void *(*entry)(void *), void *arg)
{
	static int init;
	int ret;
	size_t size, guard;
	struct pthread *self = pthread_self(), *new;
	unsigned char *map, *stack, *tsd;
	static const pthread_attr_t default_attr;

	if (!self) return errno = ENOSYS;
	if (!init && ++init) init_threads();

	if (!attr) attr = &default_attr;
198 199
	guard = ROUND(attr->_a_guardsize + DEFAULT_GUARD_SIZE);
	size = guard + ROUND(attr->_a_stacksize + DEFAULT_STACK_SIZE);
R
Rich Felker 已提交
200 201 202
	size += __pthread_tsd_size;
	map = mmap(0, size, PROT_READ|PROT_WRITE|PROT_EXEC, MAP_PRIVATE|MAP_ANON, -1, 0);
	if (!map) return EAGAIN;
203
	if (guard) mprotect(map, guard, PROT_NONE);
R
Rich Felker 已提交
204 205 206 207 208 209 210 211 212 213 214

	tsd = map + size - __pthread_tsd_size;
	new = (void *)(tsd - sizeof *new - PAGE_SIZE%sizeof *new);
	new->map_base = map;
	new->map_size = size;
	new->pid = self->pid;
	new->errno_ptr = &new->errno_val;
	new->start = entry;
	new->start_arg = arg;
	new->self = new;
	new->tsd = (void *)tsd;
215
	new->detached = attr->_a_detach;
R
Rich Felker 已提交
216
	new->attr = *attr;
217
	new->unblock_cancel = self->cancel;
218
	new->result = PTHREAD_CANCELED;
R
Rich Felker 已提交
219 220 221 222 223 224 225 226 227 228
	memcpy(new->tlsdesc, self->tlsdesc, sizeof new->tlsdesc);
	new->tlsdesc[1] = (uintptr_t)new;
	stack = (void *)((uintptr_t)new-1 & ~(uintptr_t)15);

	/* We must synchronize new thread creation with rsyscall
	 * delivery. This looks to be the least expensive way: */
	a_inc(&rs.blocks);
	while (rs.lock) __wait(&rs.lock, 0, 1, 1);

	a_inc(&libc.threads_minus_1);
229
	ret = __uniclone(stack, start, new);
R
Rich Felker 已提交
230 231 232 233 234 235 236

	a_dec(&rs.blocks);
	if (rs.lock) __wake(&rs.blocks, 1, 1);

	if (ret < 0) {
		a_dec(&libc.threads_minus_1);
		munmap(map, size);
237
		return EAGAIN;
R
Rich Felker 已提交
238 239 240 241
	}
	*res = new;
	return 0;
}
242 243 244 245 246 247 248

void pthread_exit(void *result)
{
	struct pthread *self = pthread_self();
	self->result = result;
	docancel(self);
}