/* pthread_create.c */
#include "pthread_impl.h"

3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27
void __pthread_unwind_next(struct __ptcb *cb)
{
	int i, j, not_finished;
	pthread_t self;

	if (cb->__next) longjmp((void *)cb->__next->__jb, 1);

	self = pthread_self();
	if (self->cancel) self->result = PTHREAD_CANCELLED;

	LOCK(&self->exitlock);

	not_finished = self->tsd_used;
	for (j=0; not_finished && j<PTHREAD_DESTRUCTOR_ITERATIONS; j++) {
		not_finished = 0;
		for (i=0; i<PTHREAD_KEYS_MAX; i++) {
			if (self->tsd[i] && libc.tsd_keys[i]) {
				void *tmp = self->tsd[i];
				self->tsd[i] = 0;
				libc.tsd_keys[i](tmp);
				not_finished = 1;
			}
		}
	}

28 29
	/* Mark this thread dead before decrementing count */
	self->dead = 1;
30

31 32 33
	if (!a_fetch_add(&libc.threads_minus_1, -1))
		exit(0);

34
	if (self->detached && self->map_base) {
35
		syscall(__NR_rt_sigprocmask, SIG_BLOCK, (long)(uint64_t[1]){-1},0,8);
36
		__unmapself(self->map_base, self->map_size);
37
	}
38

39
	syscall(SYS_exit, 0);
40
}
R
Rich Felker 已提交
41 42 43 44

static void docancel(struct pthread *self)
{
	struct __ptcb cb = { .__next = self->cancelbuf };
45 46 47 48 49 50
	sigset_t set;
	self->canceldisable = 1;
	self->cancelasync = 0;
	sigemptyset(&set);
	sigaddset(&set, SIGCANCEL);
	__libc_sigprocmask(SIG_UNBLOCK, &set, 0);
R
Rich Felker 已提交
51 52 53 54 55
	__pthread_unwind_next(&cb);
}

/* SIGCANCEL handler. Records the cancellation request on the current
 * thread and acts on it immediately when that is currently permitted.
 *
 * sig: unused.
 * si:  signal info; signals with si_code > 0 or a sender pid other than
 *      this process's pid are ignored.
 * ctx: signal context, inspected via PC_AT_SYS. */
static void cancel_handler(int sig, siginfo_t *si, void *ctx)
{
	struct pthread *self = __pthread_self();

	if (si->si_code > 0) return;
	if (si->si_pid != self->pid) return;

	/* Remember the request even if it cannot be acted on right now. */
	self->cancel = 1;

	if (self->canceldisable) return;

	/* Act now only in async mode, or when exactly one cancellation
	 * point is active and PC_AT_SYS(ctx) holds. */
	if (!self->cancelasync && !(self->cancelpoint==1 && PC_AT_SYS(ctx)))
		return;
	docancel(self);
}

64 65 66 67
/* Cancellation-point hook (installed as libc.cancelpt by init_threads).
 * Adds x to the thread's cancellation-point counter; when the counter
 * becomes 1 through a non-negative x and a cancellation request is
 * pending, the request is acted on. Does nothing, not even the counter
 * update, while cancellation is disabled. */
static void cancelpt(int x)
{
	struct pthread *self = __pthread_self();

	if (self->canceldisable) return;

	self->cancelpoint += x;
	if (self->cancelpoint != 1) return;
	if (x < 0) return;
	if (!self->cancel) return;

	docancel(self);
}

/* "rsyscall" is a mechanism by which a thread can synchronously force all
 * other threads to perform an arbitrary syscall. It is necessary to work
 * around the non-conformant implementation of setuid() et al. on Linux,
 * which affect only the calling thread and not the whole process. This
 * implementation performs some tricks with signal delivery to work around
 * the fact that it does not keep any list of threads in userspace. */

/* Shared state for one rsyscall broadcast. */
static struct {
	/* Held by rsyscall() for the whole broadcast; pthread_create()
	 * waits while it is nonzero. */
	volatile int lock;
	/* Nonzero while signal handlers must stay parked. */
	volatile int hold;
	/* Incremented by pthread_create() around thread creation;
	 * rsyscall() waits for it to reach zero. */
	volatile int blocks;
	/* Count of handlers that have performed the syscall and have not
	 * yet left. */
	volatile int cnt;
	/* Syscall arguments and number to execute in each thread. */
	unsigned long arg[6];
	int nr;
	/* First errno value recorded by a failing handler, or 0. */
	int err;
} rs;

/* SIGSYSCALL handler: executes the syscall described by `rs` in the
 * receiving thread, reports completion through rs.cnt, and stays parked
 * until the initiator clears rs.hold.
 *
 * sig, ctx: unused.
 * si: signal info; signals with si_code > 0 or a sender pid other than
 *     this process's pid are ignored. */
static void rsyscall_handler(int sig, siginfo_t *si, void *ctx)
{
	struct pthread *self = __pthread_self();

	if (si->si_code > 0) return;
	if (si->si_pid != self->pid) return;
	/* Every counted thread has already responded; nothing to do. */
	if (rs.cnt == libc.threads_minus_1) return;

	/* Threads which have already decremented themselves from the
	 * thread count must not increment rs.cnt or otherwise act. */
	if (self->dead) {
		__wait(&rs.hold, 0, 1, 1);
		return;
	}

	/* Only the first failure's errno is kept. */
	if (syscall(rs.nr, rs.arg[0], rs.arg[1], rs.arg[2],
		rs.arg[3], rs.arg[4], rs.arg[5]) < 0) {
		if (!rs.err) rs.err = errno;
	}

	/* Announce completion, then park until released. */
	a_inc(&rs.cnt);
	__wake(&rs.cnt, 1, 1);
	while (rs.hold)
		__wait(&rs.hold, 0, 1, 1);

	/* Check out; wake the waiter on rs.cnt once the count is zero. */
	a_dec(&rs.cnt);
	if (!rs.cnt) __wake(&rs.cnt, 1, 1);
}

static int rsyscall(int nr, long a, long b, long c, long d, long e, long f)
{
	int i, ret;
	sigset_t set = { 0 };
115
	struct pthread *self = __pthread_self();
R
Rich Felker 已提交
116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148
	sigaddset(&set, SIGSYSCALL);

	LOCK(&rs.lock);
	while ((i=rs.blocks))
		__wait(&rs.blocks, 0, i, 1);

	__libc_sigprocmask(SIG_BLOCK, &set, 0);

	rs.nr = nr;
	rs.arg[0] = a; rs.arg[1] = b;
	rs.arg[2] = c; rs.arg[3] = d;
	rs.arg[4] = d; rs.arg[5] = f;
	rs.hold = 1;
	rs.err = 0;
	rs.cnt = 0;

	/* Dispatch signals until all threads respond */
	for (i=libc.threads_minus_1; i; i--)
		sigqueue(self->pid, SIGSYSCALL, (union sigval){0});
	while ((i=rs.cnt) < libc.threads_minus_1) {
		sigqueue(self->pid, SIGSYSCALL, (union sigval){0});
		__wait(&rs.cnt, 0, i, 1);
	}

	/* Handle any lingering signals with no-op */
	__libc_sigprocmask(SIG_UNBLOCK, &set, 0);

	/* Resume other threads' signal handlers and wait for them */
	rs.hold = 0;
	__wake(&rs.hold, -1, 0);
	while((i=rs.cnt)) __wait(&rs.cnt, 0, i, 1);

	if (rs.err) errno = rs.err, ret = -1;
149
	else ret = syscall(nr, a, b, c, d, e, f);
R
Rich Felker 已提交
150 151 152 153 154 155 156 157 158

	UNLOCK(&rs.lock);
	return ret;
}

static void init_threads()
{
	struct sigaction sa = { .sa_flags = SA_SIGINFO | SA_RESTART };
	libc.lock = __lock;
159
	libc.lockfile = __lockfile;
R
Rich Felker 已提交
160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177
	libc.cancelpt = cancelpt;
	libc.rsyscall = rsyscall;
	sa.sa_sigaction = cancel_handler;
	__libc_sigaction(SIGCANCEL, &sa, 0);
	sigaddset(&sa.sa_mask, SIGSYSCALL);
	sigaddset(&sa.sa_mask, SIGCANCEL);
	sa.sa_sigaction = rsyscall_handler;
	__libc_sigaction(SIGSYSCALL, &sa, 0);
	sigprocmask(SIG_UNBLOCK, &sa.sa_mask, 0);
}

/* Entry point handed to __uniclone for a new thread. `p` is the new
 * thread's struct pthread; runs the user start routine and passes its
 * return value to pthread_exit. */
static int start(void *p)
{
	struct pthread *td = p;
	void *retval = td->start(td->start_arg);

	pthread_exit(retval);
	return 0;
}

178
/* Thread-creation primitive defined outside this file. pthread_create
 * calls it as __uniclone(stack, start, new) and treats a negative return
 * value as failure. */
int __uniclone(void *, int (*)(), void *);
R
Rich Felker 已提交
179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198

/* Round x up to a multiple of PAGE_SIZE. The mask form is only correct
 * when PAGE_SIZE is a power of two. */
#define ROUND(x) (((x)+PAGE_SIZE-1)&-PAGE_SIZE)

/* Fallback value of zero, exported under the name __pthread_tsd_size;
 * pthread_create adds that size to each thread's mapping.
 * pthread_key_create.c overrides this */
static const size_t dummy = 0;
weak_alias(dummy, __pthread_tsd_size);

/* Create a new thread running entry(arg).
 *
 * res:   receives the new thread's handle on success.
 * attr:  creation attributes, or a null pointer for the defaults.
 * entry: start routine for the new thread.
 * arg:   argument passed to entry.
 *
 * Returns 0 on success, ENOSYS (also stored in errno) when the calling
 * thread has no thread structure, or EAGAIN when the thread's memory
 * cannot be mapped or the clone fails.
 *
 * One mapping holds, from low to high address: the guard region, the
 * stack, the struct pthread, and the thread-specific-data area. */
int pthread_create(pthread_t *res, const pthread_attr_t *attr, void *(*entry)(void *), void *arg)
{
	static int init;
	int ret;
	size_t size, guard;
	struct pthread *self = pthread_self(), *new;
	unsigned char *map, *stack, *tsd;
	static const pthread_attr_t default_attr;

	if (!self) return errno = ENOSYS;
	/* First call: install hooks and signal handlers. */
	if (!init && ++init) init_threads();

	if (!attr) attr = &default_attr;
	guard = ROUND(attr->_a_guardsize + DEFAULT_GUARD_SIZE);
	size = guard + ROUND(attr->_a_stacksize + DEFAULT_STACK_SIZE);
	size += __pthread_tsd_size;
	map = mmap(0, size, PROT_READ|PROT_WRITE|PROT_EXEC, MAP_PRIVATE|MAP_ANON, -1, 0);
	/* mmap reports failure with MAP_FAILED, never a null pointer. */
	if (map == MAP_FAILED) return EAGAIN;
	if (guard) mprotect(map, guard, PROT_NONE);

	/* TSD sits at the very top of the mapping, the thread structure
	 * just below it. */
	tsd = map + size - __pthread_tsd_size;
	new = (void *)(tsd - sizeof *new - PAGE_SIZE%sizeof *new);
	new->map_base = map;
	new->map_size = size;
	new->pid = self->pid;
	new->errno_ptr = &new->errno_val;
	new->start = entry;
	new->start_arg = arg;
	new->self = new;
	new->tsd = (void *)tsd;
	new->detached = attr->_a_detach;
	new->attr = *attr;
	memcpy(new->tlsdesc, self->tlsdesc, sizeof new->tlsdesc);
	new->tlsdesc[1] = (uintptr_t)new;
	/* Stack top: below the thread structure, aligned down to 16. */
	stack = (void *)((uintptr_t)new-1 & ~(uintptr_t)15);

	/* We must synchronize new thread creation with rsyscall
	 * delivery. This looks to be the least expensive way: */
	a_inc(&rs.blocks);
	while (rs.lock) __wait(&rs.lock, 0, 1, 1);

	a_inc(&libc.threads_minus_1);
	ret = __uniclone(stack, start, new);

	a_dec(&rs.blocks);
	if (rs.lock) __wake(&rs.blocks, 1, 1);

	if (ret < 0) {
		/* Undo the thread-count bump and release the mapping. */
		a_dec(&libc.threads_minus_1);
		munmap(map, size);
		return EAGAIN;
	}
	*res = new;
	return 0;
}
241 242 243 244 245 246 247

/* Terminate the calling thread, recording `result` as its exit value.
 * The value is stored in the thread structure and the thread is then
 * unwound through docancel. */
void pthread_exit(void *result)
{
	struct pthread *td = pthread_self();

	td->result = result;
	docancel(td);
}