virtio.c 51.1 KB
Newer Older
A
aliguori 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 * Virtio Support
 *
 * Copyright IBM, Corp. 2007
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 */

P
Peter Maydell 已提交
14
#include "qemu/osdep.h"
15
#include "qapi/error.h"
16 17
#include "qemu-common.h"
#include "cpu.h"
18
#include "trace.h"
19
#include "exec/address-spaces.h"
20
#include "qemu/error-report.h"
P
Paolo Bonzini 已提交
21
#include "hw/virtio/virtio.h"
22
#include "qemu/atomic.h"
P
Paolo Bonzini 已提交
23
#include "hw/virtio/virtio-bus.h"
24
#include "migration/migration.h"
25
#include "hw/virtio/virtio-access.h"
A
aliguori 已提交
26

27 28 29 30 31
/*
 * The alignment to use between consumer and producer parts of vring.
 * x86 pagesize again. This is the default, used by transports like PCI
 * which don't provide a means for the guest to tell the host the alignment.
 */
32 33
#define VIRTIO_PCI_VRING_ALIGN         4096

A
aliguori 已提交
34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64
typedef struct VRingDesc
{
    uint64_t addr;
    uint32_t len;
    uint16_t flags;
    uint16_t next;
} VRingDesc;

typedef struct VRingAvail
{
    uint16_t flags;
    uint16_t idx;
    uint16_t ring[0];
} VRingAvail;

typedef struct VRingUsedElem
{
    uint32_t id;
    uint32_t len;
} VRingUsedElem;

typedef struct VRingUsed
{
    uint16_t flags;
    uint16_t idx;
    VRingUsedElem ring[0];
} VRingUsed;

typedef struct VRing
{
    unsigned int num;
C
Cornelia Huck 已提交
65
    unsigned int num_default;
66
    unsigned int align;
A
Avi Kivity 已提交
67 68 69
    hwaddr desc;
    hwaddr avail;
    hwaddr used;
A
aliguori 已提交
70 71 72 73 74
} VRing;

struct VirtQueue
{
    VRing vring;
75 76

    /* Next head to pop */
A
aliguori 已提交
77
    uint16_t last_avail_idx;
78

79 80 81
    /* Last avail_idx read from VQ. */
    uint16_t shadow_avail_idx;

82 83
    uint16_t used_idx;

M
Michael S. Tsirkin 已提交
84 85 86 87 88 89 90 91 92
    /* Last used index value we have signalled on */
    uint16_t signalled_used;

    /* Last used index value we have signalled on */
    bool signalled_used_valid;

    /* Notification enabled? */
    bool notification;

93 94
    uint16_t queue_index;

A
aliguori 已提交
95
    int inuse;
M
Michael S. Tsirkin 已提交
96

97
    uint16_t vector;
A
aliguori 已提交
98
    void (*handle_output)(VirtIODevice *vdev, VirtQueue *vq);
99 100 101
    VirtIODevice *vdev;
    EventNotifier guest_notifier;
    EventNotifier host_notifier;
102
    QLIST_ENTRY(VirtQueue) node;
A
aliguori 已提交
103 104 105
};

/* virt queue functions */
106
void virtio_queue_update_rings(VirtIODevice *vdev, int n)
A
aliguori 已提交
107
{
108
    VRing *vring = &vdev->vq[n].vring;
P
Paul Brook 已提交
109

110 111 112 113 114 115 116 117
    if (!vring->desc) {
        /* not yet setup -> nothing to do */
        return;
    }
    vring->avail = vring->desc + vring->num * sizeof(VRingDesc);
    vring->used = vring_align(vring->avail +
                              offsetof(VRingAvail, ring[vring->num]),
                              vring->align);
A
aliguori 已提交
118 119
}

120 121
static void vring_desc_read(VirtIODevice *vdev, VRingDesc *desc,
                            hwaddr desc_pa, int i)
A
aliguori 已提交
122
{
123 124 125 126 127 128
    address_space_read(&address_space_memory, desc_pa + i * sizeof(VRingDesc),
                       MEMTXATTRS_UNSPECIFIED, (void *)desc, sizeof(VRingDesc));
    virtio_tswap64s(vdev, &desc->addr);
    virtio_tswap32s(vdev, &desc->len);
    virtio_tswap16s(vdev, &desc->flags);
    virtio_tswap16s(vdev, &desc->next);
A
aliguori 已提交
129 130 131 132
}

static inline uint16_t vring_avail_flags(VirtQueue *vq)
{
A
Avi Kivity 已提交
133
    hwaddr pa;
A
aliguori 已提交
134
    pa = vq->vring.avail + offsetof(VRingAvail, flags);
135
    return virtio_lduw_phys(vq->vdev, pa);
A
aliguori 已提交
136 137 138 139
}

static inline uint16_t vring_avail_idx(VirtQueue *vq)
{
A
Avi Kivity 已提交
140
    hwaddr pa;
A
aliguori 已提交
141
    pa = vq->vring.avail + offsetof(VRingAvail, idx);
142 143
    vq->shadow_avail_idx = virtio_lduw_phys(vq->vdev, pa);
    return vq->shadow_avail_idx;
A
aliguori 已提交
144 145 146 147
}

static inline uint16_t vring_avail_ring(VirtQueue *vq, int i)
{
A
Avi Kivity 已提交
148
    hwaddr pa;
A
aliguori 已提交
149
    pa = vq->vring.avail + offsetof(VRingAvail, ring[i]);
150
    return virtio_lduw_phys(vq->vdev, pa);
A
aliguori 已提交
151 152
}

153
static inline uint16_t vring_get_used_event(VirtQueue *vq)
M
Michael S. Tsirkin 已提交
154 155 156 157
{
    return vring_avail_ring(vq, vq->vring.num);
}

158 159
static inline void vring_used_write(VirtQueue *vq, VRingUsedElem *uelem,
                                    int i)
A
aliguori 已提交
160
{
A
Avi Kivity 已提交
161
    hwaddr pa;
162 163 164 165 166
    virtio_tswap32s(vq->vdev, &uelem->id);
    virtio_tswap32s(vq->vdev, &uelem->len);
    pa = vq->vring.used + offsetof(VRingUsed, ring[i]);
    address_space_write(&address_space_memory, pa, MEMTXATTRS_UNSPECIFIED,
                       (void *)uelem, sizeof(VRingUsedElem));
A
aliguori 已提交
167 168 169 170
}

static uint16_t vring_used_idx(VirtQueue *vq)
{
A
Avi Kivity 已提交
171
    hwaddr pa;
A
aliguori 已提交
172
    pa = vq->vring.used + offsetof(VRingUsed, idx);
173
    return virtio_lduw_phys(vq->vdev, pa);
A
aliguori 已提交
174 175
}

M
Michael S. Tsirkin 已提交
176
static inline void vring_used_idx_set(VirtQueue *vq, uint16_t val)
A
aliguori 已提交
177
{
A
Avi Kivity 已提交
178
    hwaddr pa;
A
aliguori 已提交
179
    pa = vq->vring.used + offsetof(VRingUsed, idx);
180
    virtio_stw_phys(vq->vdev, pa, val);
181
    vq->used_idx = val;
A
aliguori 已提交
182 183 184 185
}

static inline void vring_used_flags_set_bit(VirtQueue *vq, int mask)
{
186
    VirtIODevice *vdev = vq->vdev;
A
Avi Kivity 已提交
187
    hwaddr pa;
A
aliguori 已提交
188
    pa = vq->vring.used + offsetof(VRingUsed, flags);
189
    virtio_stw_phys(vdev, pa, virtio_lduw_phys(vdev, pa) | mask);
A
aliguori 已提交
190 191 192 193
}

static inline void vring_used_flags_unset_bit(VirtQueue *vq, int mask)
{
194
    VirtIODevice *vdev = vq->vdev;
A
Avi Kivity 已提交
195
    hwaddr pa;
A
aliguori 已提交
196
    pa = vq->vring.used + offsetof(VRingUsed, flags);
197
    virtio_stw_phys(vdev, pa, virtio_lduw_phys(vdev, pa) & ~mask);
A
aliguori 已提交
198 199
}

200
static inline void vring_set_avail_event(VirtQueue *vq, uint16_t val)
M
Michael S. Tsirkin 已提交
201
{
A
Avi Kivity 已提交
202
    hwaddr pa;
M
Michael S. Tsirkin 已提交
203 204 205 206
    if (!vq->notification) {
        return;
    }
    pa = vq->vring.used + offsetof(VRingUsed, ring[vq->vring.num]);
207
    virtio_stw_phys(vq->vdev, pa, val);
M
Michael S. Tsirkin 已提交
208 209
}

A
aliguori 已提交
210 211
void virtio_queue_set_notification(VirtQueue *vq, int enable)
{
M
Michael S. Tsirkin 已提交
212
    vq->notification = enable;
213
    if (virtio_vdev_has_feature(vq->vdev, VIRTIO_RING_F_EVENT_IDX)) {
214
        vring_set_avail_event(vq, vring_avail_idx(vq));
M
Michael S. Tsirkin 已提交
215
    } else if (enable) {
A
aliguori 已提交
216
        vring_used_flags_unset_bit(vq, VRING_USED_F_NO_NOTIFY);
M
Michael S. Tsirkin 已提交
217
    } else {
A
aliguori 已提交
218
        vring_used_flags_set_bit(vq, VRING_USED_F_NO_NOTIFY);
M
Michael S. Tsirkin 已提交
219
    }
220 221 222 223
    if (enable) {
        /* Expose avail event/used flags before caller checks the avail idx. */
        smp_mb();
    }
A
aliguori 已提交
224 225 226 227 228 229 230
}

int virtio_queue_ready(VirtQueue *vq)
{
    return vq->vring.avail != 0;
}

231 232
/* Fetch avail_idx from VQ memory only when we really need to know if
 * guest has added some buffers. */
A
aliguori 已提交
233 234
int virtio_queue_empty(VirtQueue *vq)
{
235 236 237 238
    if (vq->shadow_avail_idx != vq->last_avail_idx) {
        return 0;
    }

A
aliguori 已提交
239 240 241
    return vring_avail_idx(vq) == vq->last_avail_idx;
}

242 243
static void virtqueue_unmap_sg(VirtQueue *vq, const VirtQueueElement *elem,
                               unsigned int len)
A
aliguori 已提交
244 245 246 247 248 249 250 251
{
    unsigned int offset;
    int i;

    offset = 0;
    for (i = 0; i < elem->in_num; i++) {
        size_t size = MIN(len - offset, elem->in_sg[i].iov_len);

252 253 254
        cpu_physical_memory_unmap(elem->in_sg[i].iov_base,
                                  elem->in_sg[i].iov_len,
                                  1, size);
A
aliguori 已提交
255

256
        offset += size;
A
aliguori 已提交
257 258
    }

259 260 261 262
    for (i = 0; i < elem->out_num; i++)
        cpu_physical_memory_unmap(elem->out_sg[i].iov_base,
                                  elem->out_sg[i].iov_len,
                                  0, elem->out_sg[i].iov_len);
263 264
}

J
Jason Wang 已提交
265 266 267 268 269 270 271
void virtqueue_discard(VirtQueue *vq, const VirtQueueElement *elem,
                       unsigned int len)
{
    vq->last_avail_idx--;
    virtqueue_unmap_sg(vq, elem, len);
}

272 273 274
void virtqueue_fill(VirtQueue *vq, const VirtQueueElement *elem,
                    unsigned int len, unsigned int idx)
{
275 276
    VRingUsedElem uelem;

277 278 279
    trace_virtqueue_fill(vq, elem, len, idx);

    virtqueue_unmap_sg(vq, elem, len);
280

281
    idx = (idx + vq->used_idx) % vq->vring.num;
A
aliguori 已提交
282

283 284 285
    uelem.id = elem->index;
    uelem.len = len;
    vring_used_write(vq, &uelem, idx);
A
aliguori 已提交
286 287 288 289
}

void virtqueue_flush(VirtQueue *vq, unsigned int count)
{
M
Michael S. Tsirkin 已提交
290
    uint16_t old, new;
A
aliguori 已提交
291
    /* Make sure buffer is written before we update index. */
292
    smp_wmb();
293
    trace_virtqueue_flush(vq, count);
294
    old = vq->used_idx;
M
Michael S. Tsirkin 已提交
295 296
    new = old + count;
    vring_used_idx_set(vq, new);
A
aliguori 已提交
297
    vq->inuse -= count;
M
Michael S. Tsirkin 已提交
298 299
    if (unlikely((int16_t)(new - vq->signalled_used) < (uint16_t)(new - old)))
        vq->signalled_used_valid = false;
A
aliguori 已提交
300 301 302 303 304 305 306 307 308 309 310 311 312 313
}

void virtqueue_push(VirtQueue *vq, const VirtQueueElement *elem,
                    unsigned int len)
{
    virtqueue_fill(vq, elem, len, 0);
    virtqueue_flush(vq, 1);
}

static int virtqueue_num_heads(VirtQueue *vq, unsigned int idx)
{
    uint16_t num_heads = vring_avail_idx(vq) - idx;

    /* Check it isn't doing very strange things with descriptor numbers. */
A
aliguori 已提交
314
    if (num_heads > vq->vring.num) {
315
        error_report("Guest moved used index from %u to %u",
316
                     idx, vq->shadow_avail_idx);
A
aliguori 已提交
317 318
        exit(1);
    }
319 320 321 322 323
    /* On success, callers read a descriptor at vq->last_avail_idx.
     * Make sure descriptor read does not bypass avail index read. */
    if (num_heads) {
        smp_rmb();
    }
A
aliguori 已提交
324 325 326 327 328 329 330 331 332 333 334 335 336

    return num_heads;
}

static unsigned int virtqueue_get_head(VirtQueue *vq, unsigned int idx)
{
    unsigned int head;

    /* Grab the next descriptor number they're advertising, and increment
     * the index we've seen. */
    head = vring_avail_ring(vq, idx % vq->vring.num);

    /* If their number is silly, that's a fatal mistake. */
A
aliguori 已提交
337
    if (head >= vq->vring.num) {
338
        error_report("Guest says index %u is available", head);
A
aliguori 已提交
339 340
        exit(1);
    }
A
aliguori 已提交
341 342 343 344

    return head;
}

345 346
static unsigned virtqueue_read_next_desc(VirtIODevice *vdev, VRingDesc *desc,
                                         hwaddr desc_pa, unsigned int max)
A
aliguori 已提交
347 348 349 350
{
    unsigned int next;

    /* If this descriptor says it doesn't chain, we're done. */
351
    if (!(desc->flags & VRING_DESC_F_NEXT)) {
352
        return max;
353
    }
A
aliguori 已提交
354 355

    /* Check they're not leading us off end of descriptors. */
356
    next = desc->next;
A
aliguori 已提交
357
    /* Make sure compiler knows to grab that: we don't want it changing! */
358
    smp_wmb();
A
aliguori 已提交
359

360
    if (next >= max) {
361
        error_report("Desc next is %u", next);
A
aliguori 已提交
362 363
        exit(1);
    }
A
aliguori 已提交
364

365
    vring_desc_read(vdev, desc, desc_pa, next);
A
aliguori 已提交
366 367 368
    return next;
}

369
void virtqueue_get_avail_bytes(VirtQueue *vq, unsigned int *in_bytes,
370 371
                               unsigned int *out_bytes,
                               unsigned max_in_bytes, unsigned max_out_bytes)
A
aliguori 已提交
372
{
373
    unsigned int idx;
374
    unsigned int total_bufs, in_total, out_total;
A
aliguori 已提交
375 376 377

    idx = vq->last_avail_idx;

378
    total_bufs = in_total = out_total = 0;
A
aliguori 已提交
379
    while (virtqueue_num_heads(vq, idx)) {
380
        VirtIODevice *vdev = vq->vdev;
381
        unsigned int max, num_bufs, indirect = 0;
382
        VRingDesc desc;
A
Avi Kivity 已提交
383
        hwaddr desc_pa;
A
aliguori 已提交
384 385
        int i;

386 387
        max = vq->vring.num;
        num_bufs = total_bufs;
A
aliguori 已提交
388
        i = virtqueue_get_head(vq, idx++);
389
        desc_pa = vq->vring.desc;
390
        vring_desc_read(vdev, &desc, desc_pa, i);
391

392 393
        if (desc.flags & VRING_DESC_F_INDIRECT) {
            if (desc.len % sizeof(VRingDesc)) {
394
                error_report("Invalid size for indirect buffer table");
395 396 397 398 399
                exit(1);
            }

            /* If we've got too many, that implies a descriptor loop. */
            if (num_bufs >= max) {
400
                error_report("Looped descriptor");
401 402 403 404 405
                exit(1);
            }

            /* loop over the indirect descriptor table */
            indirect = 1;
406 407
            max = desc.len / sizeof(VRingDesc);
            desc_pa = desc.addr;
408
            num_bufs = i = 0;
409
            vring_desc_read(vdev, &desc, desc_pa, i);
410 411
        }

A
aliguori 已提交
412 413
        do {
            /* If we've got too many, that implies a descriptor loop. */
414
            if (++num_bufs > max) {
415
                error_report("Looped descriptor");
A
aliguori 已提交
416 417
                exit(1);
            }
A
aliguori 已提交
418

419 420
            if (desc.flags & VRING_DESC_F_WRITE) {
                in_total += desc.len;
A
aliguori 已提交
421
            } else {
422
                out_total += desc.len;
A
aliguori 已提交
423
            }
424 425 426
            if (in_total >= max_in_bytes && out_total >= max_out_bytes) {
                goto done;
            }
427
        } while ((i = virtqueue_read_next_desc(vdev, &desc, desc_pa, max)) != max);
428 429 430 431 432

        if (!indirect)
            total_bufs = num_bufs;
        else
            total_bufs++;
A
aliguori 已提交
433
    }
434
done:
435 436 437 438 439 440 441
    if (in_bytes) {
        *in_bytes = in_total;
    }
    if (out_bytes) {
        *out_bytes = out_total;
    }
}
A
aliguori 已提交
442

443 444 445 446 447
int virtqueue_avail_bytes(VirtQueue *vq, unsigned int in_bytes,
                          unsigned int out_bytes)
{
    unsigned int in_total, out_total;

448 449
    virtqueue_get_avail_bytes(vq, &in_total, &out_total, in_bytes, out_bytes);
    return in_bytes <= in_total && out_bytes <= out_total;
A
aliguori 已提交
450 451
}

452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477
static void virtqueue_map_desc(unsigned int *p_num_sg, hwaddr *addr, struct iovec *iov,
                               unsigned int max_num_sg, bool is_write,
                               hwaddr pa, size_t sz)
{
    unsigned num_sg = *p_num_sg;
    assert(num_sg <= max_num_sg);

    while (sz) {
        hwaddr len = sz;

        if (num_sg == max_num_sg) {
            error_report("virtio: too many write descriptors in indirect table");
            exit(1);
        }

        iov[num_sg].iov_base = cpu_physical_memory_map(pa, &len, is_write);
        iov[num_sg].iov_len = len;
        addr[num_sg] = pa;

        sz -= len;
        pa += len;
        num_sg++;
    }
    *p_num_sg = num_sg;
}

M
Michael S. Tsirkin 已提交
478 479 480
static void virtqueue_map_iovec(struct iovec *sg, hwaddr *addr,
                                unsigned int *num_sg, unsigned int max_size,
                                int is_write)
K
Kevin Wolf 已提交
481 482
{
    unsigned int i;
A
Avi Kivity 已提交
483
    hwaddr len;
K
Kevin Wolf 已提交
484

M
Michael S. Tsirkin 已提交
485 486 487 488 489 490 491 492 493 494 495 496 497
    /* Note: this function MUST validate input, some callers
     * are passing in num_sg values received over the network.
     */
    /* TODO: teach all callers that this can fail, and return failure instead
     * of asserting here.
     * When we do, we might be able to re-enable NDEBUG below.
     */
#ifdef NDEBUG
#error building with NDEBUG is not supported
#endif
    assert(*num_sg <= max_size);

    for (i = 0; i < *num_sg; i++) {
K
Kevin Wolf 已提交
498 499
        len = sg[i].iov_len;
        sg[i].iov_base = cpu_physical_memory_map(addr[i], &len, is_write);
M
Michael S. Tsirkin 已提交
500
        if (!sg[i].iov_base) {
M
Michael Tokarev 已提交
501
            error_report("virtio: error trying to map MMIO memory");
K
Kevin Wolf 已提交
502 503
            exit(1);
        }
504 505
        if (len != sg[i].iov_len) {
            error_report("virtio: unexpected memory split");
M
Michael S. Tsirkin 已提交
506 507
            exit(1);
        }
K
Kevin Wolf 已提交
508 509 510
    }
}

M
Michael S. Tsirkin 已提交
511 512 513
void virtqueue_map(VirtQueueElement *elem)
{
    virtqueue_map_iovec(elem->in_sg, elem->in_addr, &elem->in_num,
514
                        VIRTQUEUE_MAX_SIZE, 1);
M
Michael S. Tsirkin 已提交
515
    virtqueue_map_iovec(elem->out_sg, elem->out_addr, &elem->out_num,
516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537
                        VIRTQUEUE_MAX_SIZE, 0);
}

void *virtqueue_alloc_element(size_t sz, unsigned out_num, unsigned in_num)
{
    VirtQueueElement *elem;
    size_t in_addr_ofs = QEMU_ALIGN_UP(sz, __alignof__(elem->in_addr[0]));
    size_t out_addr_ofs = in_addr_ofs + in_num * sizeof(elem->in_addr[0]);
    size_t out_addr_end = out_addr_ofs + out_num * sizeof(elem->out_addr[0]);
    size_t in_sg_ofs = QEMU_ALIGN_UP(out_addr_end, __alignof__(elem->in_sg[0]));
    size_t out_sg_ofs = in_sg_ofs + in_num * sizeof(elem->in_sg[0]);
    size_t out_sg_end = out_sg_ofs + out_num * sizeof(elem->out_sg[0]);

    assert(sz >= sizeof(VirtQueueElement));
    elem = g_malloc(out_sg_end);
    elem->out_num = out_num;
    elem->in_num = in_num;
    elem->in_addr = (void *)elem + in_addr_ofs;
    elem->out_addr = (void *)elem + out_addr_ofs;
    elem->in_sg = (void *)elem + in_sg_ofs;
    elem->out_sg = (void *)elem + out_sg_ofs;
    return elem;
M
Michael S. Tsirkin 已提交
538 539
}

540
void *virtqueue_pop(VirtQueue *vq, size_t sz)
A
aliguori 已提交
541
{
542
    unsigned int i, head, max;
A
Avi Kivity 已提交
543
    hwaddr desc_pa = vq->vring.desc;
544
    VirtIODevice *vdev = vq->vdev;
545
    VirtQueueElement *elem;
546 547 548
    unsigned out_num, in_num;
    hwaddr addr[VIRTQUEUE_MAX_SIZE];
    struct iovec iov[VIRTQUEUE_MAX_SIZE];
549
    VRingDesc desc;
A
aliguori 已提交
550

551
    if (virtio_queue_empty(vq)) {
552 553
        return NULL;
    }
554 555 556
    /* Needed after virtio_queue_empty(), see comment in
     * virtqueue_num_heads(). */
    smp_rmb();
A
aliguori 已提交
557 558

    /* When we start there are none of either input nor output. */
559
    out_num = in_num = 0;
A
aliguori 已提交
560

561 562
    max = vq->vring.num;

A
aliguori 已提交
563
    i = head = virtqueue_get_head(vq, vq->last_avail_idx++);
564
    if (virtio_vdev_has_feature(vdev, VIRTIO_RING_F_EVENT_IDX)) {
565
        vring_set_avail_event(vq, vq->last_avail_idx);
M
Michael S. Tsirkin 已提交
566
    }
567

568 569 570
    vring_desc_read(vdev, &desc, desc_pa, i);
    if (desc.flags & VRING_DESC_F_INDIRECT) {
        if (desc.len % sizeof(VRingDesc)) {
571
            error_report("Invalid size for indirect buffer table");
572 573 574 575
            exit(1);
        }

        /* loop over the indirect descriptor table */
576 577
        max = desc.len / sizeof(VRingDesc);
        desc_pa = desc.addr;
578
        i = 0;
579
        vring_desc_read(vdev, &desc, desc_pa, i);
580 581
    }

K
Kevin Wolf 已提交
582
    /* Collect all the descriptors */
A
aliguori 已提交
583
    do {
584
        if (desc.flags & VRING_DESC_F_WRITE) {
585
            virtqueue_map_desc(&in_num, addr + out_num, iov + out_num,
586
                               VIRTQUEUE_MAX_SIZE - out_num, true, desc.addr, desc.len);
K
Kevin Wolf 已提交
587
        } else {
588 589
            if (in_num) {
                error_report("Incorrect order for descriptors");
590 591
                exit(1);
            }
592
            virtqueue_map_desc(&out_num, addr, iov,
593
                               VIRTQUEUE_MAX_SIZE, false, desc.addr, desc.len);
K
Kevin Wolf 已提交
594
        }
A
aliguori 已提交
595 596

        /* If we've got too many, that implies a descriptor loop. */
597
        if ((in_num + out_num) > max) {
598
            error_report("Looped descriptor");
A
aliguori 已提交
599 600
            exit(1);
        }
601
    } while ((i = virtqueue_read_next_desc(vdev, &desc, desc_pa, max)) != max);
A
aliguori 已提交
602

603 604
    /* Now copy what we have collected and mapped */
    elem = virtqueue_alloc_element(sz, out_num, in_num);
A
aliguori 已提交
605
    elem->index = head;
606 607 608 609 610 611 612 613
    for (i = 0; i < out_num; i++) {
        elem->out_addr[i] = addr[i];
        elem->out_sg[i] = iov[i];
    }
    for (i = 0; i < in_num; i++) {
        elem->in_addr[i] = addr[out_num + i];
        elem->in_sg[i] = iov[out_num + i];
    }
A
aliguori 已提交
614 615 616

    vq->inuse++;

617
    trace_virtqueue_pop(vq, elem, elem->in_num, elem->out_num);
618
    return elem;
A
aliguori 已提交
619 620
}

621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637
/* Reading and writing a structure directly to QEMUFile is *awful*, but
 * it is what QEMU has always done by mistake.  We can change it sooner
 * or later by bumping the version number of the affected vm states.
 * In the meanwhile, since the in-memory layout of VirtQueueElement
 * has changed, we need to marshal to and from the layout that was
 * used before the change.
 */
typedef struct VirtQueueElementOld {
    unsigned int index;
    unsigned int out_num;
    unsigned int in_num;
    hwaddr in_addr[VIRTQUEUE_MAX_SIZE];
    hwaddr out_addr[VIRTQUEUE_MAX_SIZE];
    struct iovec in_sg[VIRTQUEUE_MAX_SIZE];
    struct iovec out_sg[VIRTQUEUE_MAX_SIZE];
} VirtQueueElementOld;

638 639
void *qemu_get_virtqueue_element(QEMUFile *f, size_t sz)
{
640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668
    VirtQueueElement *elem;
    VirtQueueElementOld data;
    int i;

    qemu_get_buffer(f, (uint8_t *)&data, sizeof(VirtQueueElementOld));

    elem = virtqueue_alloc_element(sz, data.out_num, data.in_num);
    elem->index = data.index;

    for (i = 0; i < elem->in_num; i++) {
        elem->in_addr[i] = data.in_addr[i];
    }

    for (i = 0; i < elem->out_num; i++) {
        elem->out_addr[i] = data.out_addr[i];
    }

    for (i = 0; i < elem->in_num; i++) {
        /* Base is overwritten by virtqueue_map.  */
        elem->in_sg[i].iov_base = 0;
        elem->in_sg[i].iov_len = data.in_sg[i].iov_len;
    }

    for (i = 0; i < elem->out_num; i++) {
        /* Base is overwritten by virtqueue_map.  */
        elem->out_sg[i].iov_base = 0;
        elem->out_sg[i].iov_len = data.out_sg[i].iov_len;
    }

669 670 671 672 673 674
    virtqueue_map(elem);
    return elem;
}

void qemu_put_virtqueue_element(QEMUFile *f, VirtQueueElement *elem)
{
675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701
    VirtQueueElementOld data;
    int i;

    memset(&data, 0, sizeof(data));
    data.index = elem->index;
    data.in_num = elem->in_num;
    data.out_num = elem->out_num;

    for (i = 0; i < elem->in_num; i++) {
        data.in_addr[i] = elem->in_addr[i];
    }

    for (i = 0; i < elem->out_num; i++) {
        data.out_addr[i] = elem->out_addr[i];
    }

    for (i = 0; i < elem->in_num; i++) {
        /* Base is overwritten by virtqueue_map when loading.  Do not
         * save it, as it would leak the QEMU address space layout.  */
        data.in_sg[i].iov_len = elem->in_sg[i].iov_len;
    }

    for (i = 0; i < elem->out_num; i++) {
        /* Do not save iov_base as above.  */
        data.out_sg[i].iov_len = elem->out_sg[i].iov_len;
    }
    qemu_put_buffer(f, (uint8_t *)&data, sizeof(VirtQueueElementOld));
702 703
}

A
aliguori 已提交
704
/* virtio device */
705 706
static void virtio_notify_vector(VirtIODevice *vdev, uint16_t vector)
{
K
KONRAD Frederic 已提交
707 708 709 710 711
    BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
    VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);

    if (k->notify) {
        k->notify(qbus->parent, vector);
712 713
    }
}
A
aliguori 已提交
714

P
Paul Brook 已提交
715
void virtio_update_irq(VirtIODevice *vdev)
A
aliguori 已提交
716
{
717
    virtio_notify_vector(vdev, VIRTIO_NO_VECTOR);
A
aliguori 已提交
718 719
}

720 721 722 723 724 725 726 727 728 729 730 731
static int virtio_validate_features(VirtIODevice *vdev)
{
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);

    if (k->validate_features) {
        return k->validate_features(vdev);
    } else {
        return 0;
    }
}

int virtio_set_status(VirtIODevice *vdev, uint8_t val)
732
{
733
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
734 735
    trace_virtio_set_status(vdev, val);

736
    if (virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1)) {
737 738 739 740 741 742 743 744 745
        if (!(vdev->status & VIRTIO_CONFIG_S_FEATURES_OK) &&
            val & VIRTIO_CONFIG_S_FEATURES_OK) {
            int ret = virtio_validate_features(vdev);

            if (ret) {
                return ret;
            }
        }
    }
746 747
    if (k->set_status) {
        k->set_status(vdev, val);
748 749
    }
    vdev->status = val;
750
    return 0;
751 752
}

753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773
bool target_words_bigendian(void);
static enum virtio_device_endian virtio_default_endian(void)
{
    if (target_words_bigendian()) {
        return VIRTIO_DEVICE_ENDIAN_BIG;
    } else {
        return VIRTIO_DEVICE_ENDIAN_LITTLE;
    }
}

static enum virtio_device_endian virtio_current_cpu_endian(void)
{
    CPUClass *cc = CPU_GET_CLASS(current_cpu);

    if (cc->virtio_is_big_endian(current_cpu)) {
        return VIRTIO_DEVICE_ENDIAN_BIG;
    } else {
        return VIRTIO_DEVICE_ENDIAN_LITTLE;
    }
}

P
Paul Brook 已提交
774
void virtio_reset(void *opaque)
A
aliguori 已提交
775 776
{
    VirtIODevice *vdev = opaque;
777
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
A
aliguori 已提交
778 779
    int i;

780
    virtio_set_status(vdev, 0);
781 782 783 784 785 786 787
    if (current_cpu) {
        /* Guest initiated reset */
        vdev->device_endian = virtio_current_cpu_endian();
    } else {
        /* System reset */
        vdev->device_endian = virtio_default_endian();
    }
788

789 790 791
    if (k->reset) {
        k->reset(vdev);
    }
A
aliguori 已提交
792

793
    vdev->guest_features = 0;
A
aliguori 已提交
794 795 796
    vdev->queue_sel = 0;
    vdev->status = 0;
    vdev->isr = 0;
797 798
    vdev->config_vector = VIRTIO_NO_VECTOR;
    virtio_notify_vector(vdev, vdev->config_vector);
A
aliguori 已提交
799

800
    for(i = 0; i < VIRTIO_QUEUE_MAX; i++) {
A
aliguori 已提交
801 802 803 804
        vdev->vq[i].vring.desc = 0;
        vdev->vq[i].vring.avail = 0;
        vdev->vq[i].vring.used = 0;
        vdev->vq[i].last_avail_idx = 0;
805
        vdev->vq[i].shadow_avail_idx = 0;
806
        vdev->vq[i].used_idx = 0;
807
        virtio_queue_set_vector(vdev, i, VIRTIO_NO_VECTOR);
M
Michael S. Tsirkin 已提交
808 809 810
        vdev->vq[i].signalled_used = 0;
        vdev->vq[i].signalled_used_valid = false;
        vdev->vq[i].notification = true;
C
Cornelia Huck 已提交
811
        vdev->vq[i].vring.num = vdev->vq[i].vring.num_default;
A
aliguori 已提交
812 813 814
    }
}

P
Paul Brook 已提交
815
uint32_t virtio_config_readb(VirtIODevice *vdev, uint32_t addr)
A
aliguori 已提交
816
{
817
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
A
aliguori 已提交
818 819
    uint8_t val;

820
    if (addr + sizeof(val) > vdev->config_len) {
A
aliguori 已提交
821
        return (uint32_t)-1;
822 823 824
    }

    k->get_config(vdev, vdev->config);
A
aliguori 已提交
825

826
    val = ldub_p(vdev->config + addr);
A
aliguori 已提交
827 828 829
    return val;
}

P
Paul Brook 已提交
830
uint32_t virtio_config_readw(VirtIODevice *vdev, uint32_t addr)
A
aliguori 已提交
831
{
832
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
A
aliguori 已提交
833 834
    uint16_t val;

835
    if (addr + sizeof(val) > vdev->config_len) {
A
aliguori 已提交
836
        return (uint32_t)-1;
837 838 839
    }

    k->get_config(vdev, vdev->config);
A
aliguori 已提交
840

841
    val = lduw_p(vdev->config + addr);
A
aliguori 已提交
842 843 844
    return val;
}

P
Paul Brook 已提交
845
uint32_t virtio_config_readl(VirtIODevice *vdev, uint32_t addr)
A
aliguori 已提交
846
{
847
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
A
aliguori 已提交
848 849
    uint32_t val;

850
    if (addr + sizeof(val) > vdev->config_len) {
A
aliguori 已提交
851
        return (uint32_t)-1;
852 853 854
    }

    k->get_config(vdev, vdev->config);
A
aliguori 已提交
855

856
    val = ldl_p(vdev->config + addr);
A
aliguori 已提交
857 858 859
    return val;
}

P
Paul Brook 已提交
860
void virtio_config_writeb(VirtIODevice *vdev, uint32_t addr, uint32_t data)
A
aliguori 已提交
861
{
862
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
A
aliguori 已提交
863 864
    uint8_t val = data;

865
    if (addr + sizeof(val) > vdev->config_len) {
A
aliguori 已提交
866
        return;
867
    }
A
aliguori 已提交
868

869
    stb_p(vdev->config + addr, val);
A
aliguori 已提交
870

871 872 873
    if (k->set_config) {
        k->set_config(vdev, vdev->config);
    }
A
aliguori 已提交
874 875
}

P
Paul Brook 已提交
876
void virtio_config_writew(VirtIODevice *vdev, uint32_t addr, uint32_t data)
A
aliguori 已提交
877
{
878
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
A
aliguori 已提交
879 880
    uint16_t val = data;

881
    if (addr + sizeof(val) > vdev->config_len) {
A
aliguori 已提交
882
        return;
883
    }
A
aliguori 已提交
884

885
    stw_p(vdev->config + addr, val);
A
aliguori 已提交
886

887 888 889
    if (k->set_config) {
        k->set_config(vdev, vdev->config);
    }
A
aliguori 已提交
890 891
}

P
Paul Brook 已提交
892
void virtio_config_writel(VirtIODevice *vdev, uint32_t addr, uint32_t data)
A
aliguori 已提交
893
{
894
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
A
aliguori 已提交
895 896
    uint32_t val = data;

897
    if (addr + sizeof(val) > vdev->config_len) {
A
aliguori 已提交
898
        return;
899
    }
A
aliguori 已提交
900

901
    stl_p(vdev->config + addr, val);
A
aliguori 已提交
902

903 904 905
    if (k->set_config) {
        k->set_config(vdev, vdev->config);
    }
A
aliguori 已提交
906 907
}

908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003
uint32_t virtio_config_modern_readb(VirtIODevice *vdev, uint32_t addr)
{
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
    uint8_t val;

    if (addr + sizeof(val) > vdev->config_len) {
        return (uint32_t)-1;
    }

    k->get_config(vdev, vdev->config);

    val = ldub_p(vdev->config + addr);
    return val;
}

uint32_t virtio_config_modern_readw(VirtIODevice *vdev, uint32_t addr)
{
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
    uint16_t val;

    if (addr + sizeof(val) > vdev->config_len) {
        return (uint32_t)-1;
    }

    k->get_config(vdev, vdev->config);

    val = lduw_le_p(vdev->config + addr);
    return val;
}

uint32_t virtio_config_modern_readl(VirtIODevice *vdev, uint32_t addr)
{
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
    uint32_t val;

    if (addr + sizeof(val) > vdev->config_len) {
        return (uint32_t)-1;
    }

    k->get_config(vdev, vdev->config);

    val = ldl_le_p(vdev->config + addr);
    return val;
}

void virtio_config_modern_writeb(VirtIODevice *vdev,
                                 uint32_t addr, uint32_t data)
{
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
    uint8_t val = data;

    if (addr + sizeof(val) > vdev->config_len) {
        return;
    }

    stb_p(vdev->config + addr, val);

    if (k->set_config) {
        k->set_config(vdev, vdev->config);
    }
}

void virtio_config_modern_writew(VirtIODevice *vdev,
                                 uint32_t addr, uint32_t data)
{
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
    uint16_t val = data;

    if (addr + sizeof(val) > vdev->config_len) {
        return;
    }

    stw_le_p(vdev->config + addr, val);

    if (k->set_config) {
        k->set_config(vdev, vdev->config);
    }
}

void virtio_config_modern_writel(VirtIODevice *vdev,
                                 uint32_t addr, uint32_t data)
{
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
    uint32_t val = data;

    if (addr + sizeof(val) > vdev->config_len) {
        return;
    }

    stl_le_p(vdev->config + addr, val);

    if (k->set_config) {
        k->set_config(vdev, vdev->config);
    }
}

A
Avi Kivity 已提交
1004
void virtio_queue_set_addr(VirtIODevice *vdev, int n, hwaddr addr)
A
aliguori 已提交
1005
{
1006 1007
    vdev->vq[n].vring.desc = addr;
    virtio_queue_update_rings(vdev, n);
P
Paul Brook 已提交
1008 1009
}

A
Avi Kivity 已提交
1010
hwaddr virtio_queue_get_addr(VirtIODevice *vdev, int n)
P
Paul Brook 已提交
1011
{
1012 1013 1014 1015 1016 1017 1018 1019 1020
    return vdev->vq[n].vring.desc;
}

void virtio_queue_set_rings(VirtIODevice *vdev, int n, hwaddr desc,
                            hwaddr avail, hwaddr used)
{
    vdev->vq[n].vring.desc = desc;
    vdev->vq[n].vring.avail = avail;
    vdev->vq[n].vring.used = used;
P
Paul Brook 已提交
1021 1022
}

1023 1024
void virtio_queue_set_num(VirtIODevice *vdev, int n, int num)
{
1025 1026 1027 1028 1029 1030 1031
    /* Don't allow guest to flip queue between existent and
     * nonexistent states, or to set it to an invalid size.
     */
    if (!!num != !!vdev->vq[n].vring.num ||
        num > VIRTQUEUE_MAX_SIZE ||
        num < 0) {
        return;
1032
    }
1033
    vdev->vq[n].vring.num = num;
1034 1035
}

1036 1037 1038 1039 1040 1041 1042 1043 1044 1045
VirtQueue *virtio_vector_first_queue(VirtIODevice *vdev, uint16_t vector)
{
    return QLIST_FIRST(&vdev->vector_queues[vector]);
}

VirtQueue *virtio_vector_next_queue(VirtQueue *vq)
{
    return QLIST_NEXT(vq, node);
}

P
Paul Brook 已提交
1046 1047 1048 1049
int virtio_queue_get_num(VirtIODevice *vdev, int n)
{
    return vdev->vq[n].vring.num;
}
A
aliguori 已提交
1050

1051 1052 1053 1054
int virtio_get_num_queues(VirtIODevice *vdev)
{
    int i;

1055
    for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
1056 1057 1058 1059 1060 1061 1062 1063
        if (!virtio_queue_get_num(vdev, i)) {
            break;
        }
    }

    return i;
}

P
Paolo Bonzini 已提交
1064 1065 1066
int virtio_queue_get_id(VirtQueue *vq)
{
    VirtIODevice *vdev = vq->vdev;
1067
    assert(vq >= &vdev->vq[0] && vq < &vdev->vq[VIRTIO_QUEUE_MAX]);
P
Paolo Bonzini 已提交
1068 1069 1070
    return vq - &vdev->vq[0];
}

1071 1072 1073 1074 1075
void virtio_queue_set_align(VirtIODevice *vdev, int n, int align)
{
    BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
    VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);

1076
    /* virtio-1 compliant devices cannot change the alignment */
1077
    if (virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1)) {
1078 1079 1080
        error_report("tried to modify queue alignment for virtio-1 device");
        return;
    }
1081 1082 1083 1084 1085 1086 1087
    /* Check that the transport told us it was going to do this
     * (so a buggy transport will immediately assert rather than
     * silently failing to migrate this state)
     */
    assert(k->has_variable_vring_alignment);

    vdev->vq[n].vring.align = align;
1088
    virtio_queue_update_rings(vdev, n);
1089 1090
}

1091 1092
void virtio_queue_notify_vq(VirtQueue *vq)
{
1093
    if (vq->vring.desc && vq->handle_output) {
1094
        VirtIODevice *vdev = vq->vdev;
1095

1096 1097 1098 1099 1100
        trace_virtio_queue_notify(vdev, vq - vdev->vq, vq);
        vq->handle_output(vdev, vq);
    }
}

P
Paul Brook 已提交
1101 1102
void virtio_queue_notify(VirtIODevice *vdev, int n)
{
1103
    virtio_queue_notify_vq(&vdev->vq[n]);
A
aliguori 已提交
1104 1105
}

1106 1107
uint16_t virtio_queue_vector(VirtIODevice *vdev, int n)
{
1108
    return n < VIRTIO_QUEUE_MAX ? vdev->vq[n].vector :
1109 1110 1111 1112 1113
        VIRTIO_NO_VECTOR;
}

void virtio_queue_set_vector(VirtIODevice *vdev, int n, uint16_t vector)
{
1114 1115
    VirtQueue *vq = &vdev->vq[n];

1116
    if (n < VIRTIO_QUEUE_MAX) {
1117 1118 1119 1120
        if (vdev->vector_queues &&
            vdev->vq[n].vector != VIRTIO_NO_VECTOR) {
            QLIST_REMOVE(vq, node);
        }
1121
        vdev->vq[n].vector = vector;
1122 1123 1124 1125 1126
        if (vdev->vector_queues &&
            vector != VIRTIO_NO_VECTOR) {
            QLIST_INSERT_HEAD(&vdev->vector_queues[vector], vq, node);
        }
    }
1127 1128
}

A
aliguori 已提交
1129 1130 1131 1132 1133
VirtQueue *virtio_add_queue(VirtIODevice *vdev, int queue_size,
                            void (*handle_output)(VirtIODevice *, VirtQueue *))
{
    int i;

1134
    for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
A
aliguori 已提交
1135 1136 1137 1138
        if (vdev->vq[i].vring.num == 0)
            break;
    }

1139
    if (i == VIRTIO_QUEUE_MAX || queue_size > VIRTQUEUE_MAX_SIZE)
A
aliguori 已提交
1140 1141 1142
        abort();

    vdev->vq[i].vring.num = queue_size;
C
Cornelia Huck 已提交
1143
    vdev->vq[i].vring.num_default = queue_size;
1144
    vdev->vq[i].vring.align = VIRTIO_PCI_VRING_ALIGN;
A
aliguori 已提交
1145 1146 1147 1148 1149
    vdev->vq[i].handle_output = handle_output;

    return &vdev->vq[i];
}

1150 1151
void virtio_del_queue(VirtIODevice *vdev, int n)
{
1152
    if (n < 0 || n >= VIRTIO_QUEUE_MAX) {
1153 1154 1155 1156
        abort();
    }

    vdev->vq[n].vring.num = 0;
C
Cornelia Huck 已提交
1157
    vdev->vq[n].vring.num_default = 0;
1158 1159
}

1160 1161
void virtio_irq(VirtQueue *vq)
{
1162
    trace_virtio_irq(vq);
1163 1164 1165 1166
    vq->vdev->isr |= 0x01;
    virtio_notify_vector(vq->vdev, vq->vector);
}

1167
bool virtio_should_notify(VirtIODevice *vdev, VirtQueue *vq)
M
Michael S. Tsirkin 已提交
1168 1169 1170
{
    uint16_t old, new;
    bool v;
1171 1172
    /* We need to expose used array entries before checking used event. */
    smp_mb();
1173
    /* Always notify when queue is empty (when feature acknowledge) */
1174
    if (virtio_vdev_has_feature(vdev, VIRTIO_F_NOTIFY_ON_EMPTY) &&
1175
        !vq->inuse && virtio_queue_empty(vq)) {
M
Michael S. Tsirkin 已提交
1176 1177 1178
        return true;
    }

1179
    if (!virtio_vdev_has_feature(vdev, VIRTIO_RING_F_EVENT_IDX)) {
M
Michael S. Tsirkin 已提交
1180 1181 1182 1183 1184 1185
        return !(vring_avail_flags(vq) & VRING_AVAIL_F_NO_INTERRUPT);
    }

    v = vq->signalled_used_valid;
    vq->signalled_used_valid = true;
    old = vq->signalled_used;
1186
    new = vq->signalled_used = vq->used_idx;
1187
    return !v || vring_need_event(vring_get_used_event(vq), new, old);
M
Michael S. Tsirkin 已提交
1188 1189 1190 1191
}

void virtio_notify(VirtIODevice *vdev, VirtQueue *vq)
{
1192
    if (!virtio_should_notify(vdev, vq)) {
A
aliguori 已提交
1193
        return;
M
Michael S. Tsirkin 已提交
1194
    }
A
aliguori 已提交
1195

1196
    trace_virtio_notify(vdev, vq);
A
aliguori 已提交
1197
    vdev->isr |= 0x01;
1198
    virtio_notify_vector(vdev, vq->vector);
A
aliguori 已提交
1199 1200 1201 1202
}

void virtio_notify_config(VirtIODevice *vdev)
{
1203 1204 1205
    if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))
        return;

A
aliguori 已提交
1206
    vdev->isr |= 0x03;
1207
    vdev->generation++;
1208
    virtio_notify_vector(vdev, vdev->config_vector);
A
aliguori 已提交
1209 1210
}

1211 1212 1213 1214 1215
static bool virtio_device_endian_needed(void *opaque)
{
    VirtIODevice *vdev = opaque;

    assert(vdev->device_endian != VIRTIO_DEVICE_ENDIAN_UNKNOWN);
1216
    if (!virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1)) {
1217 1218 1219 1220
        return vdev->device_endian != virtio_default_endian();
    }
    /* Devices conforming to VIRTIO 1.0 or later are always LE. */
    return vdev->device_endian != VIRTIO_DEVICE_ENDIAN_LITTLE;
1221 1222
}

G
Gerd Hoffmann 已提交
1223 1224 1225 1226 1227 1228 1229
static bool virtio_64bit_features_needed(void *opaque)
{
    VirtIODevice *vdev = opaque;

    return (vdev->host_features >> 32) != 0;
}

J
Jason Wang 已提交
1230 1231 1232 1233 1234 1235 1236
static bool virtio_virtqueue_needed(void *opaque)
{
    VirtIODevice *vdev = opaque;

    return virtio_host_has_feature(vdev, VIRTIO_F_VERSION_1);
}

C
Cornelia Huck 已提交
1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249
static bool virtio_ringsize_needed(void *opaque)
{
    VirtIODevice *vdev = opaque;
    int i;

    for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
        if (vdev->vq[i].vring.num != vdev->vq[i].vring.num_default) {
            return true;
        }
    }
    return false;
}

1250 1251 1252 1253 1254 1255 1256 1257 1258 1259
static bool virtio_extra_state_needed(void *opaque)
{
    VirtIODevice *vdev = opaque;
    BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
    VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);

    return k->has_extra_state &&
        k->has_extra_state(qbus->parent);
}

1260
static const VMStateDescription vmstate_virtqueue = {
J
Jason Wang 已提交
1261
    .name = "virtqueue_state",
1262 1263 1264 1265 1266 1267 1268
    .version_id = 1,
    .minimum_version_id = 1,
    .fields = (VMStateField[]) {
        VMSTATE_UINT64(vring.avail, struct VirtQueue),
        VMSTATE_UINT64(vring.used, struct VirtQueue),
        VMSTATE_END_OF_LIST()
    }
J
Jason Wang 已提交
1269 1270 1271 1272 1273 1274 1275 1276
};

static const VMStateDescription vmstate_virtio_virtqueues = {
    .name = "virtio/virtqueues",
    .version_id = 1,
    .minimum_version_id = 1,
    .needed = &virtio_virtqueue_needed,
    .fields = (VMStateField[]) {
D
Dr. David Alan Gilbert 已提交
1277 1278
        VMSTATE_STRUCT_VARRAY_POINTER_KNOWN(vq, struct VirtIODevice,
                      VIRTIO_QUEUE_MAX, 0, vmstate_virtqueue, VirtQueue),
J
Jason Wang 已提交
1279 1280 1281 1282
        VMSTATE_END_OF_LIST()
    }
};

1283
static const VMStateDescription vmstate_ringsize = {
C
Cornelia Huck 已提交
1284
    .name = "ringsize_state",
1285 1286 1287 1288 1289 1290
    .version_id = 1,
    .minimum_version_id = 1,
    .fields = (VMStateField[]) {
        VMSTATE_UINT32(vring.num_default, struct VirtQueue),
        VMSTATE_END_OF_LIST()
    }
C
Cornelia Huck 已提交
1291 1292 1293 1294 1295 1296 1297 1298
};

static const VMStateDescription vmstate_virtio_ringsize = {
    .name = "virtio/ringsize",
    .version_id = 1,
    .minimum_version_id = 1,
    .needed = &virtio_ringsize_needed,
    .fields = (VMStateField[]) {
D
Dr. David Alan Gilbert 已提交
1299 1300
        VMSTATE_STRUCT_VARRAY_POINTER_KNOWN(vq, struct VirtIODevice,
                      VIRTIO_QUEUE_MAX, 0, vmstate_ringsize, VirtQueue),
C
Cornelia Huck 已提交
1301 1302 1303 1304
        VMSTATE_END_OF_LIST()
    }
};

1305 1306 1307 1308 1309 1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350 1351
static int get_extra_state(QEMUFile *f, void *pv, size_t size)
{
    VirtIODevice *vdev = pv;
    BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
    VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);

    if (!k->load_extra_state) {
        return -1;
    } else {
        return k->load_extra_state(qbus->parent, f);
    }
}

static void put_extra_state(QEMUFile *f, void *pv, size_t size)
{
    VirtIODevice *vdev = pv;
    BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
    VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);

    k->save_extra_state(qbus->parent, f);
}

static const VMStateInfo vmstate_info_extra_state = {
    .name = "virtqueue_extra_state",
    .get = get_extra_state,
    .put = put_extra_state,
};

static const VMStateDescription vmstate_virtio_extra_state = {
    .name = "virtio/extra_state",
    .version_id = 1,
    .minimum_version_id = 1,
    .needed = &virtio_extra_state_needed,
    .fields = (VMStateField[]) {
        {
            .name         = "extra_state",
            .version_id   = 0,
            .field_exists = NULL,
            .size         = 0,
            .info         = &vmstate_info_extra_state,
            .flags        = VMS_SINGLE,
            .offset       = 0,
        },
        VMSTATE_END_OF_LIST()
    }
};

1352 1353 1354 1355
static const VMStateDescription vmstate_virtio_device_endian = {
    .name = "virtio/device_endian",
    .version_id = 1,
    .minimum_version_id = 1,
1356
    .needed = &virtio_device_endian_needed,
1357 1358 1359 1360 1361 1362
    .fields = (VMStateField[]) {
        VMSTATE_UINT8(device_endian, VirtIODevice),
        VMSTATE_END_OF_LIST()
    }
};

G
Gerd Hoffmann 已提交
1363 1364 1365 1366
static const VMStateDescription vmstate_virtio_64bit_features = {
    .name = "virtio/64bit_features",
    .version_id = 1,
    .minimum_version_id = 1,
1367
    .needed = &virtio_64bit_features_needed,
G
Gerd Hoffmann 已提交
1368 1369 1370 1371 1372 1373
    .fields = (VMStateField[]) {
        VMSTATE_UINT64(guest_features, VirtIODevice),
        VMSTATE_END_OF_LIST()
    }
};

1374 1375 1376 1377 1378 1379 1380
static const VMStateDescription vmstate_virtio = {
    .name = "virtio",
    .version_id = 1,
    .minimum_version_id = 1,
    .minimum_version_id_old = 1,
    .fields = (VMStateField[]) {
        VMSTATE_END_OF_LIST()
1381
    },
1382 1383 1384
    .subsections = (const VMStateDescription*[]) {
        &vmstate_virtio_device_endian,
        &vmstate_virtio_64bit_features,
J
Jason Wang 已提交
1385
        &vmstate_virtio_virtqueues,
C
Cornelia Huck 已提交
1386
        &vmstate_virtio_ringsize,
1387
        &vmstate_virtio_extra_state,
1388
        NULL
1389 1390 1391
    }
};

A
aliguori 已提交
1392 1393
void virtio_save(VirtIODevice *vdev, QEMUFile *f)
{
K
KONRAD Frederic 已提交
1394 1395
    BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
    VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
1396
    VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(vdev);
G
Gerd Hoffmann 已提交
1397
    uint32_t guest_features_lo = (vdev->guest_features & 0xffffffff);
A
aliguori 已提交
1398 1399
    int i;

K
KONRAD Frederic 已提交
1400 1401 1402
    if (k->save_config) {
        k->save_config(qbus->parent, f);
    }
A
aliguori 已提交
1403 1404 1405 1406

    qemu_put_8s(f, &vdev->status);
    qemu_put_8s(f, &vdev->isr);
    qemu_put_be16s(f, &vdev->queue_sel);
G
Gerd Hoffmann 已提交
1407
    qemu_put_be32s(f, &guest_features_lo);
A
aliguori 已提交
1408 1409 1410
    qemu_put_be32(f, vdev->config_len);
    qemu_put_buffer(f, vdev->config, vdev->config_len);

1411
    for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
A
aliguori 已提交
1412 1413 1414 1415 1416 1417
        if (vdev->vq[i].vring.num == 0)
            break;
    }

    qemu_put_be32(f, i);

1418
    for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
A
aliguori 已提交
1419 1420 1421 1422
        if (vdev->vq[i].vring.num == 0)
            break;

        qemu_put_be32(f, vdev->vq[i].vring.num);
1423 1424 1425
        if (k->has_variable_vring_alignment) {
            qemu_put_be32(f, vdev->vq[i].vring.align);
        }
1426 1427
        /* XXX virtio-1 devices */
        qemu_put_be64(f, vdev->vq[i].vring.desc);
A
aliguori 已提交
1428
        qemu_put_be16s(f, &vdev->vq[i].last_avail_idx);
K
KONRAD Frederic 已提交
1429 1430 1431
        if (k->save_queue) {
            k->save_queue(qbus->parent, i, f);
        }
A
aliguori 已提交
1432
    }
1433 1434 1435 1436

    if (vdc->save != NULL) {
        vdc->save(vdev, f);
    }
1437 1438

    /* Subsections */
1439
    vmstate_save_state(f, &vmstate_virtio, vdev, NULL);
A
aliguori 已提交
1440 1441
}

1442
static int virtio_set_features_nocheck(VirtIODevice *vdev, uint64_t val)
1443
{
1444
    VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
C
Cornelia Huck 已提交
1445
    bool bad = (val & ~(vdev->host_features)) != 0;
1446

C
Cornelia Huck 已提交
1447
    val &= vdev->host_features;
1448 1449
    if (k->set_features) {
        k->set_features(vdev, val);
1450 1451 1452 1453 1454
    }
    vdev->guest_features = val;
    return bad ? -1 : 0;
}

1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465 1466
int virtio_set_features(VirtIODevice *vdev, uint64_t val)
{
   /*
     * The driver must not attempt to set features after feature negotiation
     * has finished.
     */
    if (vdev->status & VIRTIO_CONFIG_S_FEATURES_OK) {
        return -EINVAL;
    }
    return virtio_set_features_nocheck(vdev, val);
}

1467
int virtio_load(VirtIODevice *vdev, QEMUFile *f, int version_id)
A
aliguori 已提交
1468
{
1469
    int i, ret;
1470
    int32_t config_len;
1471
    uint32_t num;
1472
    uint32_t features;
K
KONRAD Frederic 已提交
1473 1474
    BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
    VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
1475
    VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(vdev);
A
aliguori 已提交
1476

1477 1478 1479 1480 1481 1482
    /*
     * We poison the endianness to ensure it does not get used before
     * subsections have been loaded.
     */
    vdev->device_endian = VIRTIO_DEVICE_ENDIAN_UNKNOWN;

K
KONRAD Frederic 已提交
1483 1484
    if (k->load_config) {
        ret = k->load_config(qbus->parent, f);
1485 1486 1487
        if (ret)
            return ret;
    }
A
aliguori 已提交
1488 1489 1490 1491

    qemu_get_8s(f, &vdev->status);
    qemu_get_8s(f, &vdev->isr);
    qemu_get_be16s(f, &vdev->queue_sel);
1492
    if (vdev->queue_sel >= VIRTIO_QUEUE_MAX) {
1493 1494
        return -1;
    }
1495
    qemu_get_be32s(f, &features);
1496

1497
    config_len = qemu_get_be32(f);
1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508

    /*
     * There are cases where the incoming config can be bigger or smaller
     * than what we have; so load what we have space for, and skip
     * any excess that's in the stream.
     */
    qemu_get_buffer(f, vdev->config, MIN(config_len, vdev->config_len));

    while (config_len > vdev->config_len) {
        qemu_get_byte(f);
        config_len--;
1509
    }
A
aliguori 已提交
1510 1511 1512

    num = qemu_get_be32(f);

1513
    if (num > VIRTIO_QUEUE_MAX) {
1514
        error_report("Invalid number of virtqueues: 0x%x", num);
1515 1516 1517
        return -1;
    }

A
aliguori 已提交
1518 1519
    for (i = 0; i < num; i++) {
        vdev->vq[i].vring.num = qemu_get_be32(f);
1520 1521 1522
        if (k->has_variable_vring_alignment) {
            vdev->vq[i].vring.align = qemu_get_be32(f);
        }
1523
        vdev->vq[i].vring.desc = qemu_get_be64(f);
A
aliguori 已提交
1524
        qemu_get_be16s(f, &vdev->vq[i].last_avail_idx);
M
Michael S. Tsirkin 已提交
1525 1526
        vdev->vq[i].signalled_used_valid = false;
        vdev->vq[i].notification = true;
A
aliguori 已提交
1527

1528 1529 1530
        if (vdev->vq[i].vring.desc) {
            /* XXX virtio-1 devices */
            virtio_queue_update_rings(vdev, i);
M
Michael S. Tsirkin 已提交
1531 1532
        } else if (vdev->vq[i].last_avail_idx) {
            error_report("VQ %d address 0x0 "
1533
                         "inconsistent with Host index 0x%x",
M
Michael S. Tsirkin 已提交
1534 1535
                         i, vdev->vq[i].last_avail_idx);
                return -1;
1536
	}
K
KONRAD Frederic 已提交
1537 1538
        if (k->load_queue) {
            ret = k->load_queue(qbus->parent, i, f);
1539 1540
            if (ret)
                return ret;
1541
        }
A
aliguori 已提交
1542 1543
    }

1544
    virtio_notify_vector(vdev, VIRTIO_NO_VECTOR);
1545 1546

    if (vdc->load != NULL) {
1547 1548 1549 1550
        ret = vdc->load(vdev, f, version_id);
        if (ret) {
            return ret;
        }
1551 1552
    }

1553 1554 1555 1556 1557 1558 1559 1560 1561 1562
    /* Subsections */
    ret = vmstate_load_state(f, &vmstate_virtio, vdev, 1);
    if (ret) {
        return ret;
    }

    if (vdev->device_endian == VIRTIO_DEVICE_ENDIAN_UNKNOWN) {
        vdev->device_endian = virtio_default_endian();
    }

G
Gerd Hoffmann 已提交
1563 1564 1565 1566 1567 1568 1569
    if (virtio_64bit_features_needed(vdev)) {
        /*
         * Subsection load filled vdev->guest_features.  Run them
         * through virtio_set_features to sanity-check them against
         * host_features.
         */
        uint64_t features64 = vdev->guest_features;
1570
        if (virtio_set_features_nocheck(vdev, features64) < 0) {
G
Gerd Hoffmann 已提交
1571 1572 1573 1574 1575 1576
            error_report("Features 0x%" PRIx64 " unsupported. "
                         "Allowed features: 0x%" PRIx64,
                         features64, vdev->host_features);
            return -1;
        }
    } else {
1577
        if (virtio_set_features_nocheck(vdev, features) < 0) {
G
Gerd Hoffmann 已提交
1578 1579 1580 1581 1582 1583 1584
            error_report("Features 0x%x unsupported. "
                         "Allowed features: 0x%" PRIx64,
                         features, vdev->host_features);
            return -1;
        }
    }

1585
    for (i = 0; i < num; i++) {
1586
        if (vdev->vq[i].vring.desc) {
1587 1588 1589 1590 1591 1592 1593 1594 1595 1596 1597
            uint16_t nheads;
            nheads = vring_avail_idx(&vdev->vq[i]) - vdev->vq[i].last_avail_idx;
            /* Check it isn't doing strange things with descriptor numbers. */
            if (nheads > vdev->vq[i].vring.num) {
                error_report("VQ %d size 0x%x Guest index 0x%x "
                             "inconsistent with Host index 0x%x: delta 0x%x",
                             i, vdev->vq[i].vring.num,
                             vring_avail_idx(&vdev->vq[i]),
                             vdev->vq[i].last_avail_idx, nheads);
                return -1;
            }
1598
            vdev->vq[i].used_idx = vring_used_idx(&vdev->vq[i]);
1599
            vdev->vq[i].shadow_avail_idx = vring_avail_idx(&vdev->vq[i]);
1600 1601 1602 1603
        }
    }

    return 0;
A
aliguori 已提交
1604 1605
}

1606
void virtio_cleanup(VirtIODevice *vdev)
1607
{
1608
    qemu_del_vm_change_state_handler(vdev->vmstate);
1609
    g_free(vdev->config);
1610
    g_free(vdev->vq);
1611
    g_free(vdev->vector_queues);
1612 1613
}

1614
static void virtio_vmstate_change(void *opaque, int running, RunState state)
1615 1616
{
    VirtIODevice *vdev = opaque;
K
KONRAD Frederic 已提交
1617 1618
    BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
    VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
1619
    bool backend_run = running && (vdev->status & VIRTIO_CONFIG_S_DRIVER_OK);
1620
    vdev->vm_running = running;
1621 1622 1623 1624 1625

    if (backend_run) {
        virtio_set_status(vdev, vdev->status);
    }

K
KONRAD Frederic 已提交
1626 1627
    if (k->vmstate_change) {
        k->vmstate_change(qbus->parent, backend_run);
1628 1629 1630 1631 1632 1633 1634
    }

    if (!backend_run) {
        virtio_set_status(vdev, vdev->status);
    }
}

1635 1636 1637 1638 1639 1640 1641 1642 1643 1644 1645
void virtio_instance_init_common(Object *proxy_obj, void *data,
                                 size_t vdev_size, const char *vdev_name)
{
    DeviceState *vdev = data;

    object_initialize(vdev, vdev_size, vdev_name);
    object_property_add_child(proxy_obj, "virtio-backend", OBJECT(vdev), NULL);
    object_unref(OBJECT(vdev));
    qdev_alias_all_properties(vdev, proxy_obj);
}

1646 1647
void virtio_init(VirtIODevice *vdev, const char *name,
                 uint16_t device_id, size_t config_size)
A
aliguori 已提交
1648
{
1649 1650
    BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
    VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
1651
    int i;
1652 1653 1654 1655 1656 1657 1658
    int nvectors = k->query_nvectors ? k->query_nvectors(qbus->parent) : 0;

    if (nvectors) {
        vdev->vector_queues =
            g_malloc0(sizeof(*vdev->vector_queues) * nvectors);
    }

P
Paul Brook 已提交
1659
    vdev->device_id = device_id;
A
aliguori 已提交
1660 1661 1662
    vdev->status = 0;
    vdev->isr = 0;
    vdev->queue_sel = 0;
1663
    vdev->config_vector = VIRTIO_NO_VECTOR;
1664
    vdev->vq = g_malloc0(sizeof(VirtQueue) * VIRTIO_QUEUE_MAX);
1665
    vdev->vm_running = runstate_is_running();
1666
    for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
1667
        vdev->vq[i].vector = VIRTIO_NO_VECTOR;
1668
        vdev->vq[i].vdev = vdev;
1669
        vdev->vq[i].queue_index = i;
1670
    }
A
aliguori 已提交
1671 1672 1673

    vdev->name = name;
    vdev->config_len = config_size;
1674
    if (vdev->config_len) {
1675
        vdev->config = g_malloc0(config_size);
1676
    } else {
A
aliguori 已提交
1677
        vdev->config = NULL;
1678 1679 1680
    }
    vdev->vmstate = qemu_add_vm_change_state_handler(virtio_vmstate_change,
                                                     vdev);
1681
    vdev->device_endian = virtio_default_endian();
1682
    vdev->use_guest_notifier_mask = true;
1683
}
A
aliguori 已提交
1684

A
Avi Kivity 已提交
1685
hwaddr virtio_queue_get_desc_addr(VirtIODevice *vdev, int n)
1686 1687 1688 1689
{
    return vdev->vq[n].vring.desc;
}

A
Avi Kivity 已提交
1690
hwaddr virtio_queue_get_avail_addr(VirtIODevice *vdev, int n)
1691 1692 1693 1694
{
    return vdev->vq[n].vring.avail;
}

A
Avi Kivity 已提交
1695
hwaddr virtio_queue_get_used_addr(VirtIODevice *vdev, int n)
1696 1697 1698 1699
{
    return vdev->vq[n].vring.used;
}

A
Avi Kivity 已提交
1700
hwaddr virtio_queue_get_ring_addr(VirtIODevice *vdev, int n)
1701 1702 1703 1704
{
    return vdev->vq[n].vring.desc;
}

A
Avi Kivity 已提交
1705
hwaddr virtio_queue_get_desc_size(VirtIODevice *vdev, int n)
1706 1707 1708 1709
{
    return sizeof(VRingDesc) * vdev->vq[n].vring.num;
}

A
Avi Kivity 已提交
1710
hwaddr virtio_queue_get_avail_size(VirtIODevice *vdev, int n)
1711 1712
{
    return offsetof(VRingAvail, ring) +
1713
        sizeof(uint16_t) * vdev->vq[n].vring.num;
1714 1715
}

A
Avi Kivity 已提交
1716
hwaddr virtio_queue_get_used_size(VirtIODevice *vdev, int n)
1717 1718 1719 1720 1721
{
    return offsetof(VRingUsed, ring) +
        sizeof(VRingUsedElem) * vdev->vq[n].vring.num;
}

A
Avi Kivity 已提交
1722
hwaddr virtio_queue_get_ring_size(VirtIODevice *vdev, int n)
1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733 1734 1735
{
    return vdev->vq[n].vring.used - vdev->vq[n].vring.desc +
	    virtio_queue_get_used_size(vdev, n);
}

uint16_t virtio_queue_get_last_avail_idx(VirtIODevice *vdev, int n)
{
    return vdev->vq[n].last_avail_idx;
}

void virtio_queue_set_last_avail_idx(VirtIODevice *vdev, int n, uint16_t idx)
{
    vdev->vq[n].last_avail_idx = idx;
1736
    vdev->vq[n].shadow_avail_idx = idx;
1737 1738
}

1739 1740 1741 1742 1743
void virtio_queue_invalidate_signalled_used(VirtIODevice *vdev, int n)
{
    vdev->vq[n].signalled_used_valid = false;
}

1744 1745 1746 1747 1748
VirtQueue *virtio_get_queue(VirtIODevice *vdev, int n)
{
    return vdev->vq + n;
}

1749 1750 1751 1752 1753
uint16_t virtio_get_queue_index(VirtQueue *vq)
{
    return vq->queue_index;
}

1754 1755 1756 1757 1758 1759 1760 1761 1762 1763 1764 1765 1766 1767 1768 1769 1770 1771 1772 1773 1774 1775 1776 1777
static void virtio_queue_guest_notifier_read(EventNotifier *n)
{
    VirtQueue *vq = container_of(n, VirtQueue, guest_notifier);
    if (event_notifier_test_and_clear(n)) {
        virtio_irq(vq);
    }
}

void virtio_queue_set_guest_notifier_fd_handler(VirtQueue *vq, bool assign,
                                                bool with_irqfd)
{
    if (assign && !with_irqfd) {
        event_notifier_set_handler(&vq->guest_notifier,
                                   virtio_queue_guest_notifier_read);
    } else {
        event_notifier_set_handler(&vq->guest_notifier, NULL);
    }
    if (!assign) {
        /* Test and clear notifier before closing it,
         * in case poll callback didn't have time to run. */
        virtio_queue_guest_notifier_read(&vq->guest_notifier);
    }
}

1778 1779 1780 1781
EventNotifier *virtio_queue_get_guest_notifier(VirtQueue *vq)
{
    return &vq->guest_notifier;
}
1782 1783 1784 1785 1786 1787 1788 1789 1790

static void virtio_queue_host_notifier_read(EventNotifier *n)
{
    VirtQueue *vq = container_of(n, VirtQueue, host_notifier);
    if (event_notifier_test_and_clear(n)) {
        virtio_queue_notify_vq(vq);
    }
}

1791 1792 1793 1794 1795 1796 1797 1798 1799 1800 1801 1802 1803 1804 1805 1806
void virtio_queue_aio_set_host_notifier_handler(VirtQueue *vq, AioContext *ctx,
                                                bool assign, bool set_handler)
{
    if (assign && set_handler) {
        aio_set_event_notifier(ctx, &vq->host_notifier, true,
                               virtio_queue_host_notifier_read);
    } else {
        aio_set_event_notifier(ctx, &vq->host_notifier, true, NULL);
    }
    if (!assign) {
        /* Test and clear notifier before after disabling event,
         * in case poll callback didn't have time to run. */
        virtio_queue_host_notifier_read(&vq->host_notifier);
    }
}

P
Paolo Bonzini 已提交
1807 1808
void virtio_queue_set_host_notifier_fd_handler(VirtQueue *vq, bool assign,
                                               bool set_handler)
1809
{
P
Paolo Bonzini 已提交
1810
    if (assign && set_handler) {
1811 1812 1813 1814
        event_notifier_set_handler(&vq->host_notifier,
                                   virtio_queue_host_notifier_read);
    } else {
        event_notifier_set_handler(&vq->host_notifier, NULL);
P
Paolo Bonzini 已提交
1815 1816
    }
    if (!assign) {
1817 1818 1819 1820 1821 1822
        /* Test and clear notifier before after disabling event,
         * in case poll callback didn't have time to run. */
        virtio_queue_host_notifier_read(&vq->host_notifier);
    }
}

1823 1824 1825 1826
EventNotifier *virtio_queue_get_host_notifier(VirtQueue *vq)
{
    return &vq->host_notifier;
}
1827

1828 1829
void virtio_device_set_child_bus_name(VirtIODevice *vdev, char *bus_name)
{
1830
    g_free(vdev->bus_name);
1831
    vdev->bus_name = g_strdup(bus_name);
1832 1833
}

1834 1835 1836 1837 1838 1839 1840 1841 1842 1843 1844 1845
static void virtio_device_realize(DeviceState *dev, Error **errp)
{
    VirtIODevice *vdev = VIRTIO_DEVICE(dev);
    VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev);
    Error *err = NULL;

    if (vdc->realize != NULL) {
        vdc->realize(dev, &err);
        if (err != NULL) {
            error_propagate(errp, err);
            return;
        }
1846
    }
J
Jason Wang 已提交
1847 1848 1849 1850 1851 1852

    virtio_bus_device_plugged(vdev, &err);
    if (err != NULL) {
        error_propagate(errp, err);
        return;
    }
1853 1854
}

1855
static void virtio_device_unrealize(DeviceState *dev, Error **errp)
1856
{
1857
    VirtIODevice *vdev = VIRTIO_DEVICE(dev);
1858 1859
    VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev);
    Error *err = NULL;
1860

1861 1862
    virtio_bus_device_unplugged(vdev);

1863 1864 1865 1866 1867 1868
    if (vdc->unrealize != NULL) {
        vdc->unrealize(dev, &err);
        if (err != NULL) {
            error_propagate(errp, err);
            return;
        }
1869
    }
1870

1871 1872
    g_free(vdev->bus_name);
    vdev->bus_name = NULL;
1873 1874
}

C
Cornelia Huck 已提交
1875 1876 1877 1878 1879
static Property virtio_properties[] = {
    DEFINE_VIRTIO_COMMON_FEATURES(VirtIODevice, host_features),
    DEFINE_PROP_END_OF_LIST(),
};

1880 1881 1882 1883
static void virtio_device_class_init(ObjectClass *klass, void *data)
{
    /* Set the default value here. */
    DeviceClass *dc = DEVICE_CLASS(klass);
1884 1885 1886

    dc->realize = virtio_device_realize;
    dc->unrealize = virtio_device_unrealize;
1887
    dc->bus_type = TYPE_VIRTIO_BUS;
C
Cornelia Huck 已提交
1888
    dc->props = virtio_properties;
1889 1890 1891 1892 1893 1894 1895 1896 1897 1898 1899 1900 1901 1902 1903 1904 1905
}

static const TypeInfo virtio_device_info = {
    .name = TYPE_VIRTIO_DEVICE,
    .parent = TYPE_DEVICE,
    .instance_size = sizeof(VirtIODevice),
    .class_init = virtio_device_class_init,
    .abstract = true,
    .class_size = sizeof(VirtioDeviceClass),
};

static void virtio_register_types(void)
{
    type_register_static(&virtio_device_info);
}

type_init(virtio_register_types)