pthread_create.c 6.4 KB
Newer Older
R
Rich Felker 已提交
1 2
#include "pthread_impl.h"

3 4 5 6
static void dummy_1(pthread_t self)
{
}
weak_alias(dummy_1, __pthread_tsd_run_dtors);
7
weak_alias(dummy_1, __sigtimer_handler);
8

9 10 11 12 13
#ifdef __pthread_unwind_next
#undef __pthread_unwind_next
#define __pthread_unwind_next __pthread_unwind_next_3
#endif

14 15 16 17 18 19 20 21 22 23
void __pthread_unwind_next(struct __ptcb *cb)
{
	pthread_t self;

	if (cb->__next) longjmp((void *)cb->__next->__jb, 1);

	self = pthread_self();

	LOCK(&self->exitlock);

24
	__pthread_tsd_run_dtors(self);
25

26 27
	/* Mark this thread dead before decrementing count */
	self->dead = 1;
28

29 30 31
	if (!a_fetch_add(&libc.threads_minus_1, -1))
		exit(0);

32
	if (self->detached && self->map_base) {
33
		syscall(__NR_rt_sigprocmask, SIG_BLOCK, (long)(uint64_t[1]){-1},0,8);
34
		__unmapself(self->map_base, self->map_size);
35
	}
36

37
	syscall(SYS_exit, 0);
38
}
R
Rich Felker 已提交
39 40 41 42

static void docancel(struct pthread *self)
{
	struct __ptcb cb = { .__next = self->cancelbuf };
43 44
	self->canceldisable = 1;
	self->cancelasync = 0;
R
Rich Felker 已提交
45 46 47 48 49
	__pthread_unwind_next(&cb);
}

static void cancel_handler(int sig, siginfo_t *si, void *ctx)
{
50
	struct pthread *self = __pthread_self();
51 52 53
	if (si->si_code == SI_TIMER) __sigtimer_handler(self);
	if (self->cancel && !self->canceldisable &&
	    (self->cancelasync || (self->cancelpoint==1 && PC_AT_SYS(ctx))))
54
		docancel(self);
R
Rich Felker 已提交
55 56
}

57 58 59 60
static void cancelpt(int x)
{
	struct pthread *self = __pthread_self();
	if (self->canceldisable) return;
61 62
	if ((self->cancelpoint+=x)==1 && x>=0 && self->cancel)
		docancel(self);
63 64
}

R
Rich Felker 已提交
65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80
/* "rsyscall" is a mechanism by which a thread can synchronously force all
 * other threads to perform an arbitrary syscall. It is necessary to work
 * around the non-conformant implementation of setuid() et al on Linux,
 * which affect only the calling thread and not the whole process. This
 * implementation performs some tricks with signal delivery to work around
 * the fact that it does not keep any list of threads in userspace. */

static struct {
	volatile int lock, hold, blocks, cnt;
	unsigned long arg[6];
	int nr;
	int err;
} rs;

static void rsyscall_handler(int sig, siginfo_t *si, void *ctx)
{
81 82
	struct pthread *self = __pthread_self();

83
	if (!rs.hold || rs.cnt == libc.threads_minus_1) return;
84

85 86 87
	/* Threads which have already decremented themselves from the
	 * thread count must not increment rs.cnt or otherwise act. */
	if (self->dead) {
R
Rich Felker 已提交
88
		sigfillset(&((ucontext_t *)ctx)->uc_sigmask);
89 90
		return;
	}
R
Rich Felker 已提交
91

92
	if (syscall(rs.nr, rs.arg[0], rs.arg[1], rs.arg[2],
R
Rich Felker 已提交
93 94 95 96 97 98 99 100 101 102 103 104 105 106
		rs.arg[3], rs.arg[4], rs.arg[5]) < 0 && !rs.err) rs.err=errno;

	a_inc(&rs.cnt);
	__wake(&rs.cnt, 1, 1);
	while(rs.hold)
		__wait(&rs.hold, 0, 1, 1);
	a_dec(&rs.cnt);
	if (!rs.cnt) __wake(&rs.cnt, 1, 1);
}

static int rsyscall(int nr, long a, long b, long c, long d, long e, long f)
{
	int i, ret;
	sigset_t set = { 0 };
107
	struct pthread *self = __pthread_self();
R
Rich Felker 已提交
108 109 110 111 112 113 114 115 116 117 118 119 120 121
	sigaddset(&set, SIGSYSCALL);

	LOCK(&rs.lock);
	while ((i=rs.blocks))
		__wait(&rs.blocks, 0, i, 1);

	__libc_sigprocmask(SIG_BLOCK, &set, 0);

	rs.nr = nr;
	rs.arg[0] = a; rs.arg[1] = b;
	rs.arg[2] = c; rs.arg[3] = d;
	rs.arg[4] = d; rs.arg[5] = f;
	rs.err = 0;
	rs.cnt = 0;
122
	rs.hold = 1;
R
Rich Felker 已提交
123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140

	/* Dispatch signals until all threads respond */
	for (i=libc.threads_minus_1; i; i--)
		sigqueue(self->pid, SIGSYSCALL, (union sigval){0});
	while ((i=rs.cnt) < libc.threads_minus_1) {
		sigqueue(self->pid, SIGSYSCALL, (union sigval){0});
		__wait(&rs.cnt, 0, i, 1);
	}

	/* Handle any lingering signals with no-op */
	__libc_sigprocmask(SIG_UNBLOCK, &set, 0);

	/* Resume other threads' signal handlers and wait for them */
	rs.hold = 0;
	__wake(&rs.hold, -1, 0);
	while((i=rs.cnt)) __wait(&rs.cnt, 0, i, 1);

	if (rs.err) errno = rs.err, ret = -1;
141
	else ret = syscall(nr, a, b, c, d, e, f);
R
Rich Felker 已提交
142 143 144 145 146 147 148 149 150

	UNLOCK(&rs.lock);
	return ret;
}

static void init_threads()
{
	struct sigaction sa = { .sa_flags = SA_SIGINFO | SA_RESTART };
	libc.lock = __lock;
151
	libc.lockfile = __lockfile;
R
Rich Felker 已提交
152 153
	libc.cancelpt = cancelpt;
	libc.rsyscall = rsyscall;
R
Rich Felker 已提交
154 155 156 157 158 159

	sigfillset(&sa.sa_mask);
	sa.sa_sigaction = rsyscall_handler;
	__libc_sigaction(SIGSYSCALL, &sa, 0);

	sigemptyset(&sa.sa_mask);
R
Rich Felker 已提交
160 161
	sa.sa_sigaction = cancel_handler;
	__libc_sigaction(SIGCANCEL, &sa, 0);
R
Rich Felker 已提交
162

R
Rich Felker 已提交
163 164
	sigaddset(&sa.sa_mask, SIGSYSCALL);
	sigaddset(&sa.sa_mask, SIGCANCEL);
R
Rich Felker 已提交
165
	__libc_sigprocmask(SIG_UNBLOCK, &sa.sa_mask, 0);
R
Rich Felker 已提交
166 167 168 169 170
}

static int start(void *p)
{
	struct pthread *self = p;
171 172 173 174 175 176
	if (self->unblock_cancel) {
		sigset_t set;
		sigemptyset(&set);
		sigaddset(&set, SIGCANCEL);
		__libc_sigprocmask(SIG_UNBLOCK, &set, 0);
	}
R
Rich Felker 已提交
177 178 179 180
	pthread_exit(self->start(self->start_arg));
	return 0;
}

181
int __uniclone(void *, int (*)(), void *);
R
Rich Felker 已提交
182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201

#define ROUND(x) (((x)+PAGE_SIZE-1)&-PAGE_SIZE)

/* pthread_key_create.c overrides this */
static const size_t dummy = 0;
weak_alias(dummy, __pthread_tsd_size);

int pthread_create(pthread_t *res, const pthread_attr_t *attr, void *(*entry)(void *), void *arg)
{
	static int init;
	int ret;
	size_t size, guard;
	struct pthread *self = pthread_self(), *new;
	unsigned char *map, *stack, *tsd;
	static const pthread_attr_t default_attr;

	if (!self) return errno = ENOSYS;
	if (!init && ++init) init_threads();

	if (!attr) attr = &default_attr;
202 203
	guard = ROUND(attr->_a_guardsize + DEFAULT_GUARD_SIZE);
	size = guard + ROUND(attr->_a_stacksize + DEFAULT_STACK_SIZE);
R
Rich Felker 已提交
204 205 206
	size += __pthread_tsd_size;
	map = mmap(0, size, PROT_READ|PROT_WRITE|PROT_EXEC, MAP_PRIVATE|MAP_ANON, -1, 0);
	if (!map) return EAGAIN;
207
	if (guard) mprotect(map, guard, PROT_NONE);
R
Rich Felker 已提交
208 209 210 211 212 213 214 215 216 217 218

	tsd = map + size - __pthread_tsd_size;
	new = (void *)(tsd - sizeof *new - PAGE_SIZE%sizeof *new);
	new->map_base = map;
	new->map_size = size;
	new->pid = self->pid;
	new->errno_ptr = &new->errno_val;
	new->start = entry;
	new->start_arg = arg;
	new->self = new;
	new->tsd = (void *)tsd;
219
	new->detached = attr->_a_detach;
R
Rich Felker 已提交
220
	new->attr = *attr;
221
	new->unblock_cancel = self->cancel;
222
	new->result = PTHREAD_CANCELED;
R
Rich Felker 已提交
223 224 225 226 227 228 229 230 231 232
	memcpy(new->tlsdesc, self->tlsdesc, sizeof new->tlsdesc);
	new->tlsdesc[1] = (uintptr_t)new;
	stack = (void *)((uintptr_t)new-1 & ~(uintptr_t)15);

	/* We must synchronize new thread creation with rsyscall
	 * delivery. This looks to be the least expensive way: */
	a_inc(&rs.blocks);
	while (rs.lock) __wait(&rs.lock, 0, 1, 1);

	a_inc(&libc.threads_minus_1);
233
	ret = __uniclone(stack, start, new);
R
Rich Felker 已提交
234 235 236 237 238 239 240

	a_dec(&rs.blocks);
	if (rs.lock) __wake(&rs.blocks, 1, 1);

	if (ret < 0) {
		a_dec(&libc.threads_minus_1);
		munmap(map, size);
241
		return EAGAIN;
R
Rich Felker 已提交
242 243 244 245
	}
	*res = new;
	return 0;
}
246 247 248 249 250 251 252

void pthread_exit(void *result)
{
	struct pthread *self = pthread_self();
	self->result = result;
	docancel(self);
}