/* AFS vnode management
 *
 * Copyright (C) 2002, 2007 Red Hat, Inc. All Rights Reserved.
 * Written by David Howells (dhowells@redhat.com)
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */

#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/init.h>
#include <linux/slab.h>
#include <linux/fs.h>
#include "internal.h"

#if 0
/*
 * Debugging aid (compiled out): recursively dump one subtree of a server's
 * callback-promise tree, in order, and check each node's parent pointer.
 * - @node: subtree root (may be NULL, in which case nothing is printed)
 * - @parent: the node that @node is expected to report as its parent
 * - @depth: indentation used for the printed line
 * - @lr: marker character showing which side of the parent this node is on
 * - returns true if any node's recorded parent did not match the expected one
 */
static noinline bool dump_tree_aux(struct rb_node *node, struct rb_node *parent,
				   int depth, char lr)
{
	struct afs_vnode *vnode;
	bool bad = false;

	if (!node)
		return false;

	if (node->rb_left)
		bad = dump_tree_aux(node->rb_left, node, depth + 2, '/');

	vnode = rb_entry(node, struct afs_vnode, cb_promise);
	/* print the expiry time the same way afs_vnode_note_promise() does:
	 * cast to unsigned long and use %lu rather than %d */
	kdebug("%c %*.*s%c%p {%lu}",
	       rb_is_red(node) ? 'R' : 'B',
	       depth, depth, "", lr,
	       vnode, (unsigned long) vnode->cb_expires_at);
	if (rb_parent(node) != parent) {
		printk("BAD: %p != %p\n", rb_parent(node), parent);
		bad = true;
	}

	if (node->rb_right)
		bad |= dump_tree_aux(node->rb_right, node, depth + 2, '\\');

	return bad;
}

/*
 * Debugging aid (compiled out): dump a server's whole callback-promise tree
 * and BUG() if any parent pointer in it is inconsistent.
 */
static noinline void dump_tree(const char *name, struct afs_server *server)
{
	kenter("%s", name);
	if (dump_tree_aux(server->cb_promises.rb_node, NULL, 0, '-'))
		BUG();
}
#endif

/*
57
 * insert a vnode into the backing server's vnode tree
L
Linus Torvalds 已提交
58
 */
59 60
static void afs_install_vnode(struct afs_vnode *vnode,
			      struct afs_server *server)
L
Linus Torvalds 已提交
61
{
62 63 64
	struct afs_server *old_server = vnode->server;
	struct afs_vnode *xvnode;
	struct rb_node *parent, **p;
L
Linus Torvalds 已提交
65

66
	_enter("%p,%p", vnode, server);
L
Linus Torvalds 已提交
67

68 69 70 71 72
	if (old_server) {
		spin_lock(&old_server->fs_lock);
		rb_erase(&vnode->server_rb, &old_server->fs_vnodes);
		spin_unlock(&old_server->fs_lock);
	}
L
Linus Torvalds 已提交
73

74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100
	afs_get_server(server);
	vnode->server = server;
	afs_put_server(old_server);

	/* insert into the server's vnode tree in FID order */
	spin_lock(&server->fs_lock);

	parent = NULL;
	p = &server->fs_vnodes.rb_node;
	while (*p) {
		parent = *p;
		xvnode = rb_entry(parent, struct afs_vnode, server_rb);
		if (vnode->fid.vid < xvnode->fid.vid)
			p = &(*p)->rb_left;
		else if (vnode->fid.vid > xvnode->fid.vid)
			p = &(*p)->rb_right;
		else if (vnode->fid.vnode < xvnode->fid.vnode)
			p = &(*p)->rb_left;
		else if (vnode->fid.vnode > xvnode->fid.vnode)
			p = &(*p)->rb_right;
		else if (vnode->fid.unique < xvnode->fid.unique)
			p = &(*p)->rb_left;
		else if (vnode->fid.unique > xvnode->fid.unique)
			p = &(*p)->rb_right;
		else
			BUG(); /* can't happen unless afs_iget() malfunctions */
	}
L
Linus Torvalds 已提交
101

102 103
	rb_link_node(&vnode->server_rb, parent, p);
	rb_insert_color(&vnode->server_rb, &server->fs_vnodes);
L
Linus Torvalds 已提交
104

105 106 107
	spin_unlock(&server->fs_lock);
	_leave("");
}
/*
 * insert a vnode into the promising server's update/expiration tree
 * - caller must hold vnode->lock
 * - does nothing if the vnode already has a promise from the same server
 *   with an unchanged expiry time
 * - otherwise any existing promise is removed from the old server's tree,
 *   the vnode is moved to the new server if necessary, and the promise is
 *   queued on the new server in expiry order
 */
static void afs_vnode_note_promise(struct afs_vnode *vnode,
				   struct afs_server *server)
{
	struct afs_server *prev;
	struct afs_vnode *cur;
	struct rb_node **link, *above = NULL;

	_enter("%p,%p", vnode, server);

	ASSERT(server != NULL);

	prev = vnode->server;
	if (vnode->cb_promised) {
		/* nothing to do if neither the server nor the expiry moved */
		if (prev == server &&
		    vnode->cb_expires_at == vnode->cb_expires) {
			_leave(" [no change]");
			return;
		}

		/* recheck under the lock before unqueueing the old promise */
		spin_lock(&prev->cb_lock);
		if (vnode->cb_promised) {
			_debug("delete");
			rb_erase(&vnode->cb_promise, &prev->cb_promises);
			vnode->cb_promised = false;
		}
		spin_unlock(&prev->cb_lock);
	}

	if (vnode->server != server)
		afs_install_vnode(vnode, server);

	vnode->cb_expires_at = vnode->cb_expires;
	_debug("PROMISE on %p {%lu}",
	       vnode, (unsigned long) vnode->cb_expires_at);

	/* abuse an RB-tree to hold the expiration order (we may have multiple
	 * items with the same expiration time; equal times go to the right) */
	spin_lock(&server->cb_lock);

	for (link = &server->cb_promises.rb_node; *link; ) {
		above = *link;
		cur = rb_entry(above, struct afs_vnode, cb_promise);
		link = (vnode->cb_expires_at < cur->cb_expires_at) ?
			&above->rb_left : &above->rb_right;
	}

	rb_link_node(&vnode->cb_promise, above, link);
	rb_insert_color(&vnode->cb_promise, &server->cb_promises);
	vnode->cb_promised = true;

	spin_unlock(&server->cb_lock);
	_leave("");
}
/*
 * handle remote file deletion by discarding the callback promise
 */
static void afs_vnode_deleted_remotely(struct afs_vnode *vnode)
{
	struct afs_server *server;

	set_bit(AFS_VNODE_DELETED, &vnode->flags);

	server = vnode->server;
	if (vnode->cb_promised) {
		spin_lock(&server->cb_lock);
		if (vnode->cb_promised) {
			rb_erase(&vnode->cb_promise, &server->cb_promises);
			vnode->cb_promised = false;
		}
		spin_unlock(&server->cb_lock);
	}

	afs_put_server(server);
}

/*
 * finish off updating the recorded status of a file
 * - starts callback expiry timer
 * - adds to server's callback list
 */
static void afs_vnode_finalise_status_update(struct afs_vnode *vnode,
					     struct afs_server *server,
					     int ret)
{
	struct afs_server *oldserver = NULL;

	_enter("%p,%p,%d", vnode, server, ret);

	spin_lock(&vnode->lock);

208
	clear_bit(AFS_VNODE_CB_BROKEN, &vnode->flags);
L
Linus Torvalds 已提交
209

210 211 212 213 214 215
	switch (ret) {
	case 0:
		afs_vnode_note_promise(vnode, server);
		break;
	case -ENOENT:
		/* the file was deleted on the server */
L
Linus Torvalds 已提交
216
		_debug("got NOENT from server - marking file deleted");
217 218 219 220
		afs_vnode_deleted_remotely(vnode);
		break;
	default:
		break;
L
Linus Torvalds 已提交
221 222 223 224 225 226 227 228 229 230 231
	}

	vnode->update_cnt--;

	spin_unlock(&vnode->lock);

	wake_up_all(&vnode->update_waitq);

	afs_put_server(oldserver);

	_leave("");
D
David Howells 已提交
232
}
/*
 * fetch file status from the volume
 * - don't issue a fetch if:
 *   - the changed bit is not set and there's a valid callback
 *   - there are any outstanding ops that will fetch the status
 * - TODO implement local caching
 */
int afs_vnode_fetch_status(struct afs_vnode *vnode)
{
	struct afs_server *server;
	int ret;

	DECLARE_WAITQUEUE(myself, current);

	_enter("%s,{%u,%u,%u}",
	       vnode->volume->vlocation->vldb.name,
	       vnode->fid.vid, vnode->fid.vnode, vnode->fid.unique);

252 253
	if (!test_bit(AFS_VNODE_CB_BROKEN, &vnode->flags) &&
	    vnode->cb_promised) {
L
Linus Torvalds 已提交
254 255 256 257
		_leave(" [unchanged]");
		return 0;
	}

258
	if (test_bit(AFS_VNODE_DELETED, &vnode->flags)) {
L
Linus Torvalds 已提交
259 260 261 262 263 264
		_leave(" [deleted]");
		return -ENOENT;
	}

	spin_lock(&vnode->lock);

265 266
	if (!test_bit(AFS_VNODE_CB_BROKEN, &vnode->flags) &&
	    vnode->cb_promised) {
L
Linus Torvalds 已提交
267 268 269 270 271 272 273 274
		spin_unlock(&vnode->lock);
		_leave(" [unchanged]");
		return 0;
	}

	if (vnode->update_cnt > 0) {
		/* someone else started a fetch */
		set_current_state(TASK_UNINTERRUPTIBLE);
275
		ASSERT(myself.func != NULL);
L
Linus Torvalds 已提交
276 277 278 279
		add_wait_queue(&vnode->update_waitq, &myself);

		/* wait for the status to be updated */
		for (;;) {
280
			if (!test_bit(AFS_VNODE_CB_BROKEN, &vnode->flags))
L
Linus Torvalds 已提交
281
				break;
282
			if (test_bit(AFS_VNODE_DELETED, &vnode->flags))
L
Linus Torvalds 已提交
283 284
				break;

285 286
			/* check to see if it got updated and invalidated all
			 * before we saw it */
L
Linus Torvalds 已提交
287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305
			if (vnode->update_cnt == 0) {
				remove_wait_queue(&vnode->update_waitq,
						  &myself);
				set_current_state(TASK_RUNNING);
				goto get_anyway;
			}

			spin_unlock(&vnode->lock);

			schedule();
			set_current_state(TASK_UNINTERRUPTIBLE);

			spin_lock(&vnode->lock);
		}

		remove_wait_queue(&vnode->update_waitq, &myself);
		spin_unlock(&vnode->lock);
		set_current_state(TASK_RUNNING);

306 307
		return test_bit(AFS_VNODE_DELETED, &vnode->flags) ?
			-ENOENT : 0;
L
Linus Torvalds 已提交
308 309
	}

D
David Howells 已提交
310
get_anyway:
L
Linus Torvalds 已提交
311 312 313 314 315 316 317 318 319
	/* okay... we're going to have to initiate the op */
	vnode->update_cnt++;

	spin_unlock(&vnode->lock);

	/* merge AFS status fetches and clear outstanding callback on this
	 * vnode */
	do {
		/* pick a server to query */
320 321 322
		server = afs_volume_pick_fileserver(vnode);
		if (IS_ERR(server))
			return PTR_ERR(server);
L
Linus Torvalds 已提交
323

324 325
		_debug("USING SERVER: %p{%08x}",
		       server, ntohl(server->addr.s_addr));
L
Linus Torvalds 已提交
326

327 328
		ret = afs_fs_fetch_file_status(server, vnode, NULL,
					       &afs_sync_call);
L
Linus Torvalds 已提交
329

330
	} while (!afs_volume_release_fileserver(vnode, server, ret));
L
Linus Torvalds 已提交
331 332 333 334 335 336

	/* adjust the flags */
	afs_vnode_finalise_status_update(vnode, server, ret);

	_leave(" = %d", ret);
	return ret;
D
David Howells 已提交
337
}
/*
 * fetch file data from the volume
 * - TODO implement caching and server failover
 */
343 344
int afs_vnode_fetch_data(struct afs_vnode *vnode, off_t offset, size_t length,
			 struct page *page)
L
Linus Torvalds 已提交
345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363
{
	struct afs_server *server;
	int ret;

	_enter("%s,{%u,%u,%u}",
	       vnode->volume->vlocation->vldb.name,
	       vnode->fid.vid,
	       vnode->fid.vnode,
	       vnode->fid.unique);

	/* this op will fetch the status */
	spin_lock(&vnode->lock);
	vnode->update_cnt++;
	spin_unlock(&vnode->lock);

	/* merge in AFS status fetches and clear outstanding callback on this
	 * vnode */
	do {
		/* pick a server to query */
364 365 366
		server = afs_volume_pick_fileserver(vnode);
		if (IS_ERR(server))
			return PTR_ERR(server);
L
Linus Torvalds 已提交
367 368 369

		_debug("USING SERVER: %08x\n", ntohl(server->addr.s_addr));

370 371
		ret = afs_fs_fetch_data(server, vnode, offset, length, page,
					NULL, &afs_sync_call);
L
Linus Torvalds 已提交
372

373
	} while (!afs_volume_release_fileserver(vnode, server, ret));
L
Linus Torvalds 已提交
374 375 376 377 378 379

	/* adjust the flags */
	afs_vnode_finalise_status_update(vnode, server, ret);

	_leave(" = %d", ret);
	return ret;
D
David Howells 已提交
380
}