common.h 10.7 KB
Newer Older
K
Konrad Rzeszutek Wilk 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26
/*
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License version 2
 * as published by the Free Software Foundation; or, when distributed
 * separately from the Linux kernel or incorporated into other
 * software packages, subject to the following license:
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this source file (the "Software"), to deal in the Software without
 * restriction, including without limitation the rights to use, copy, modify,
 * merge, publish, distribute, sublicense, and/or sell copies of the Software,
 * and to permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */

27 28
#ifndef __XEN_BLKIF__BACKEND__COMMON_H__
#define __XEN_BLKIF__BACKEND__COMMON_H__
K
Konrad Rzeszutek Wilk 已提交
29 30 31 32 33 34 35

#include <linux/module.h>
#include <linux/interrupt.h>
#include <linux/slab.h>
#include <linux/blkdev.h>
#include <linux/vmalloc.h>
#include <linux/wait.h>
36
#include <linux/io.h>
37
#include <linux/rbtree.h>
K
Konrad Rzeszutek Wilk 已提交
38 39 40
#include <asm/setup.h>
#include <asm/pgalloc.h>
#include <asm/hypervisor.h>
J
Jeremy Fitzhardinge 已提交
41
#include <xen/grant_table.h>
K
Konrad Rzeszutek Wilk 已提交
42
#include <xen/xenbus.h>
43 44 45
#include <xen/interface/io/ring.h>
#include <xen/interface/io/blkif.h>
#include <xen/interface/io/protocols.h>
K
Konrad Rzeszutek Wilk 已提交
46

47
/* Prefix put in front of every message logged through DPRINTK(). */
#define DRV_PFX "xen-blkback:"

/*
 * Debug print helper.  Expands to a pr_debug() call whose output has the
 * form "xen-blkback:(<function>:<line>) <message>.\n".
 *
 * @fmt must be a string literal: it is concatenated at compile time with
 * the prefix and with the trailing ".\n", so callers should not terminate
 * their message with a period or a newline themselves.
 */
#define DPRINTK(fmt, args...)				\
	pr_debug(DRV_PFX "(%s:%d) " fmt ".\n",		\
		 __func__, __LINE__, ##args)
K
Konrad Rzeszutek Wilk 已提交
51

52 53 54 55 56 57 58 59 60 61 62 63

/* Not a real protocol.  Used to generate ring structs which contain
 * the elements common to all protocols only.  This way we get a
 * compiler-checkable way to use common struct elements, so we can
 * avoid using switch(protocol) in a number of places.  */
/*
 * Placeholder request type for the protocol-independent "common" ring.
 * The single member carries no information; the type only exists so that
 * DEFINE_RING_TYPES(blkif_common, ...) has a request type to work with.
 */
struct blkif_common_request {
	char dummy;
};
/*
 * Placeholder response type for the protocol-independent "common" ring.
 * The single member carries no information; the type only exists so that
 * DEFINE_RING_TYPES(blkif_common, ...) has a response type to work with.
 */
struct blkif_common_response {
	char dummy;
};

64
struct blkif_x86_32_request_rw {
65 66 67
	uint8_t        nr_segments;  /* number of segments                   */
	blkif_vdev_t   handle;       /* only for read/write requests         */
	uint64_t       id;           /* private guest value, echoed in resp  */
68 69
	blkif_sector_t sector_number;/* start sector idx on disk (r/w only)  */
	struct blkif_request_segment seg[BLKIF_MAX_SEGMENTS_PER_REQUEST];
70
} __attribute__((__packed__));
71 72

struct blkif_x86_32_request_discard {
73
	uint8_t        flag;         /* BLKIF_DISCARD_SECURE or zero         */
74 75
	blkif_vdev_t   _pad1;        /* was "handle" for read/write requests */
	uint64_t       id;           /* private guest value, echoed in resp  */
76
	blkif_sector_t sector_number;/* start sector idx on disk (r/w only)  */
77 78
	uint64_t       nr_sectors;
} __attribute__((__packed__));
79

80 81 82 83 84 85
/*
 * Minimal x86_32 view of a request whose operation is not otherwise
 * handled: only the id is named, which is all blkif_get_x86_32_req()
 * copies in its default case.  The pad members keep id at the same
 * position as in the rw and discard variants.
 */
struct blkif_x86_32_request_other {
	uint8_t        _pad1;
	blkif_vdev_t   _pad2;
	uint64_t       id;           /* private guest value, echoed in resp  */
} __attribute__((__packed__));

86 87
struct blkif_x86_32_request {
	uint8_t        operation;    /* BLKIF_OP_???                         */
88 89 90
	union {
		struct blkif_x86_32_request_rw rw;
		struct blkif_x86_32_request_discard discard;
91
		struct blkif_x86_32_request_other other;
92
	} u;
93 94 95 96
} __attribute__((__packed__));

/*
 * i386 protocol version of the response.
 *
 * Member alignment is capped at four bytes with #pragma pack so that the
 * 64-bit id does not force the structure to be padded out to a multiple
 * of eight bytes: the resulting size is 12, with status at offset 10.
 */
#pragma pack(push, 4)
struct blkif_x86_32_response {
	uint64_t        id;              /* copied from request */
	uint8_t         operation;       /* copied from request */
	int16_t         status;          /* BLKIF_RSP_???       */
};
#pragma pack(pop)
/* x86_64 protocol version */
104 105

struct blkif_x86_64_request_rw {
106 107 108 109
	uint8_t        nr_segments;  /* number of segments                   */
	blkif_vdev_t   handle;       /* only for read/write requests         */
	uint32_t       _pad1;        /* offsetof(blkif_reqest..,u.rw.id)==8  */
	uint64_t       id;
110 111
	blkif_sector_t sector_number;/* start sector idx on disk (r/w only)  */
	struct blkif_request_segment seg[BLKIF_MAX_SEGMENTS_PER_REQUEST];
112
} __attribute__((__packed__));
113 114

struct blkif_x86_64_request_discard {
115
	uint8_t        flag;         /* BLKIF_DISCARD_SECURE or zero         */
116 117 118
	blkif_vdev_t   _pad1;        /* was "handle" for read/write requests */
        uint32_t       _pad2;        /* offsetof(blkif_..,u.discard.id)==8   */
	uint64_t       id;
119
	blkif_sector_t sector_number;/* start sector idx on disk (r/w only)  */
120 121
	uint64_t       nr_sectors;
} __attribute__((__packed__));
122

123 124 125 126 127 128 129
/*
 * Minimal x86_64 view of a request whose operation is not otherwise
 * handled: only the id is named, which is all blkif_get_x86_64_req()
 * copies in its default case.  The pad members keep id at the same
 * position as in the rw and discard variants.
 */
struct blkif_x86_64_request_other {
	uint8_t        _pad1;
	blkif_vdev_t   _pad2;
	uint32_t       _pad3;        /* offsetof(blkif_..,u.other.id)==8     */
	uint64_t       id;           /* private guest value, echoed in resp  */
} __attribute__((__packed__));

130 131
struct blkif_x86_64_request {
	uint8_t        operation;    /* BLKIF_OP_???                         */
132 133 134
	union {
		struct blkif_x86_64_request_rw rw;
		struct blkif_x86_64_request_discard discard;
135
		struct blkif_x86_64_request_other other;
136
	} u;
137 138
} __attribute__((__packed__));

139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164
/*
 * x86_64 protocol version of the response.
 *
 * The id member is explicitly aligned to eight bytes, which also makes
 * eight the alignment of the whole structure and therefore rounds its
 * size up to 16 bytes regardless of the architecture's default alignment
 * for 64-bit integers.
 */
struct blkif_x86_64_response {
	uint64_t	id __attribute__((__aligned__(8)));
	uint8_t		operation;	/* copied from request */
	int16_t		status;		/* BLKIF_RSP_???       */
};

/*
 * Instantiate the ring types for each request/response layout declared
 * in this header.  union blkif_back_rings relies on these instantiations
 * for struct blkif_common_back_ring, struct blkif_x86_32_back_ring and
 * struct blkif_x86_64_back_ring.
 * NOTE(review): DEFINE_RING_TYPES() itself is presumably provided by
 * <xen/interface/io/ring.h> - confirm.
 */
DEFINE_RING_TYPES(blkif_common, struct blkif_common_request,
		  struct blkif_common_response);
DEFINE_RING_TYPES(blkif_x86_32, struct blkif_x86_32_request,
		  struct blkif_x86_32_response);
DEFINE_RING_TYPES(blkif_x86_64, struct blkif_x86_64_request,
		  struct blkif_x86_64_response);

/*
 * Backend view of one ring, overlaid for every supported layout.  Being a
 * union, all members share the same storage; "common" is the view built
 * from the placeholder blkif_common request/response types.
 * NOTE(review): which member is valid is presumably selected by
 * xen_blkif.blk_protocol - confirm against the users of this union.
 */
union blkif_back_rings {
	struct blkif_back_ring        native;
	struct blkif_common_back_ring common;
	struct blkif_x86_32_back_ring x86_32;
	struct blkif_x86_64_back_ring x86_64;
};

/*
 * Ring protocol variants, stored in xen_blkif.blk_protocol.  The names
 * mirror the members of union blkif_back_rings (native, x86_32, x86_64).
 * Numbering starts at 1, so zero is not a valid protocol value.
 */
enum blkif_protocol {
	BLKIF_PROTOCOL_NATIVE = 1,
	BLKIF_PROTOCOL_X86_32 = 2,
	BLKIF_PROTOCOL_X86_64 = 3,
};

165
struct xen_vbd {
166 167 168 169 170 171 172 173 174 175 176
	/* What the domain refers to this vbd as. */
	blkif_vdev_t		handle;
	/* Non-zero -> read-only */
	unsigned char		readonly;
	/* VDISK_xxx */
	unsigned char		type;
	/* phys device that this vbd maps to. */
	u32			pdevice;
	struct block_device	*bdev;
	/* Cached size parameter. */
	sector_t		size;
177 178
	unsigned int		flush_support:1;
	unsigned int		discard_secure:1;
179 180
	unsigned int		feature_gnt_persistent:1;
	unsigned int		overflow_max_grants:1;
K
Konrad Rzeszutek Wilk 已提交
181 182 183 184
};

struct backend_info;

185 186 187 188 189 190 191 192

/*
 * One persistent grant: a page together with the grant reference and the
 * grant handle that belong to it.  @node links the entry into a
 * red-black tree; struct xen_blkif keeps the root of such a tree in its
 * persistent_gnts member.
 */
struct persistent_gnt {
	struct page *page;
	grant_ref_t gnt;
	grant_handle_t handle;
	struct rb_node node;
};

193
struct xen_blkif {
K
Konrad Rzeszutek Wilk 已提交
194
	/* Unique identifier for this interface. */
195 196
	domid_t			domid;
	unsigned int		handle;
K
Konrad Rzeszutek Wilk 已提交
197
	/* Physical parameters of the comms window. */
198
	unsigned int		irq;
K
Konrad Rzeszutek Wilk 已提交
199
	/* Comms information. */
200 201
	enum blkif_protocol	blk_protocol;
	union blkif_back_rings	blk_rings;
202
	void			*blk_ring;
K
Konrad Rzeszutek Wilk 已提交
203
	/* The VBD attached to this interface. */
204
	struct xen_vbd		vbd;
K
Konrad Rzeszutek Wilk 已提交
205
	/* Back pointer to the backend_info. */
206
	struct backend_info	*be;
K
Konrad Rzeszutek Wilk 已提交
207
	/* Private fields. */
208 209
	spinlock_t		blk_ring_lock;
	atomic_t		refcnt;
K
Konrad Rzeszutek Wilk 已提交
210

211
	wait_queue_head_t	wq;
212 213 214
	/* for barrier (drain) requests */
	struct completion	drain_complete;
	atomic_t		drain;
215
	/* One thread per one blkif. */
216 217
	struct task_struct	*xenblkd;
	unsigned int		waiting_reqs;
K
Konrad Rzeszutek Wilk 已提交
218

219 220 221 222
	/* tree to store persistent grants */
	struct rb_root		persistent_gnts;
	unsigned int		persistent_gnt_c;

K
Konrad Rzeszutek Wilk 已提交
223
	/* statistics */
224
	unsigned long		st_print;
225 226 227 228 229 230 231
	unsigned long long			st_rd_req;
	unsigned long long			st_wr_req;
	unsigned long long			st_oo_req;
	unsigned long long			st_f_req;
	unsigned long long			st_ds_req;
	unsigned long long			st_rd_sect;
	unsigned long long			st_wr_sect;
232 233

	wait_queue_head_t	waiting_to_free;
234
};
K
Konrad Rzeszutek Wilk 已提交
235

236 237 238 239

/*
 * Size of the block device behind a vbd: the partition's nr_sects when
 * the block device has a partition attached (bd_part is non-NULL),
 * otherwise the capacity of the whole disk as reported by get_capacity().
 *
 * _v is a pointer to a struct xen_vbd and is evaluated more than once, so
 * it must not have side effects.
 */
#define vbd_sz(_v)	((_v)->bdev->bd_part ? \
			 (_v)->bdev->bd_part->nr_sects : \
			  get_capacity((_v)->bdev->bd_disk))
K
Konrad Rzeszutek Wilk 已提交
240

241 242
/* Take a reference on the struct xen_blkif pointed to by _b. */
#define xen_blkif_get(_b) (atomic_inc(&(_b)->refcnt))

/*
 * Drop a reference on the struct xen_blkif pointed to by _b.  When the
 * count reaches zero, wake up whoever is sleeping on the interface's
 * waiting_to_free queue.  _b is evaluated more than once.
 */
#define xen_blkif_put(_b)				\
	do {						\
		if (atomic_dec_and_test(&(_b)->refcnt))	\
			wake_up(&(_b)->waiting_to_free);\
	} while (0)

struct phys_req {
249
	unsigned short		dev;
250
	blkif_sector_t		nr_sects;
251 252
	struct block_device	*bdev;
	blkif_sector_t		sector_number;
K
Konrad Rzeszutek Wilk 已提交
253
};
254
int xen_blkif_interface_init(void);
K
Konrad Rzeszutek Wilk 已提交
255

256
int xen_blkif_xenbus_init(void);
K
Konrad Rzeszutek Wilk 已提交
257

258 259
irqreturn_t xen_blkif_be_int(int irq, void *dev_id);
int xen_blkif_schedule(void *arg);
K
Konrad Rzeszutek Wilk 已提交
260

261 262
int xen_blkbk_flush_diskcache(struct xenbus_transaction xbt,
			      struct backend_info *be, int state);
K
Konrad Rzeszutek Wilk 已提交
263

264 265
int xen_blkbk_barrier(struct xenbus_transaction xbt,
		      struct backend_info *be, int state);
266
struct xenbus_device *xen_blkbk_xenbus(struct backend_info *be);
267

268
static inline void blkif_get_x86_32_req(struct blkif_request *dst,
269 270 271 272
					struct blkif_x86_32_request *src)
{
	int i, n = BLKIF_MAX_SEGMENTS_PER_REQUEST;
	dst->operation = src->operation;
273 274 275 276 277
	switch (src->operation) {
	case BLKIF_OP_READ:
	case BLKIF_OP_WRITE:
	case BLKIF_OP_WRITE_BARRIER:
	case BLKIF_OP_FLUSH_DISKCACHE:
278 279 280
		dst->u.rw.nr_segments = src->u.rw.nr_segments;
		dst->u.rw.handle = src->u.rw.handle;
		dst->u.rw.id = src->u.rw.id;
281 282
		dst->u.rw.sector_number = src->u.rw.sector_number;
		barrier();
283 284
		if (n > dst->u.rw.nr_segments)
			n = dst->u.rw.nr_segments;
285 286 287 288
		for (i = 0; i < n; i++)
			dst->u.rw.seg[i] = src->u.rw.seg[i];
		break;
	case BLKIF_OP_DISCARD:
289
		dst->u.discard.flag = src->u.discard.flag;
290
		dst->u.discard.id = src->u.discard.id;
291 292 293 294
		dst->u.discard.sector_number = src->u.discard.sector_number;
		dst->u.discard.nr_sectors = src->u.discard.nr_sectors;
		break;
	default:
295 296 297 298 299
		/*
		 * Don't know how to translate this op. Only get the
		 * ID so failure can be reported to the frontend.
		 */
		dst->u.other.id = src->u.other.id;
300 301
		break;
	}
302 303
}

304
static inline void blkif_get_x86_64_req(struct blkif_request *dst,
305 306 307 308
					struct blkif_x86_64_request *src)
{
	int i, n = BLKIF_MAX_SEGMENTS_PER_REQUEST;
	dst->operation = src->operation;
309 310 311 312 313
	switch (src->operation) {
	case BLKIF_OP_READ:
	case BLKIF_OP_WRITE:
	case BLKIF_OP_WRITE_BARRIER:
	case BLKIF_OP_FLUSH_DISKCACHE:
314 315 316
		dst->u.rw.nr_segments = src->u.rw.nr_segments;
		dst->u.rw.handle = src->u.rw.handle;
		dst->u.rw.id = src->u.rw.id;
317 318
		dst->u.rw.sector_number = src->u.rw.sector_number;
		barrier();
319 320
		if (n > dst->u.rw.nr_segments)
			n = dst->u.rw.nr_segments;
321 322 323 324
		for (i = 0; i < n; i++)
			dst->u.rw.seg[i] = src->u.rw.seg[i];
		break;
	case BLKIF_OP_DISCARD:
325
		dst->u.discard.flag = src->u.discard.flag;
326
		dst->u.discard.id = src->u.discard.id;
327 328 329 330
		dst->u.discard.sector_number = src->u.discard.sector_number;
		dst->u.discard.nr_sectors = src->u.discard.nr_sectors;
		break;
	default:
331 332 333 334 335
		/*
		 * Don't know how to translate this op. Only get the
		 * ID so failure can be reported to the frontend.
		 */
		dst->u.other.id = src->u.other.id;
336 337
		break;
	}
338 339
}

340
#endif /* __XEN_BLKIF__BACKEND__COMMON_H__ */