dma-helpers.c 11.0 KB
Newer Older
1 2 3 4 5 6 7 8 9
/*
 * DMA helper functions
 *
 * Copyright (c) 2009 Red Hat
 *
 * This work is licensed under the terms of the GNU General Public License
 * (GNU GPL), version 2 or later.
 */

10
#include "sysemu/dma.h"
K
Kevin Wolf 已提交
11
#include "trace.h"
12 13
#include "qemu/range.h"
#include "qemu/thread.h"
14

15 16
/* #define DEBUG_IOMMU */

17 18
/*
 * Fill @len bytes of address space @as, starting at @addr, with the
 * byte value @c.
 *
 * A FILLBUF_SIZE-byte scratch buffer is filled once and then handed to
 * address_space_rw() repeatedly, at most FILLBUF_SIZE bytes per call.
 */
static void do_dma_memory_set(AddressSpace *as,
                              dma_addr_t addr, uint8_t c, dma_addr_t len)
{
#define FILLBUF_SIZE 512
    uint8_t pattern[FILLBUF_SIZE];
    int chunk;

    memset(pattern, c, FILLBUF_SIZE);
    for (; len > 0; len -= chunk, addr += chunk) {
        /* The final chunk may be shorter than the scratch buffer. */
        if (len < FILLBUF_SIZE) {
            chunk = len;
        } else {
            chunk = FILLBUF_SIZE;
        }
        address_space_rw(as, addr, pattern, chunk, true);
    }
}

/*
 * Set @len bytes at DMA address @addr to the byte value @c.
 *
 * A dma_barrier() is issued first.  When dma_has_iommu() reports an
 * IOMMU the request goes through iommu_dma_memory_set() and its result
 * is returned; otherwise the fill is applied to dma->as directly and 0
 * is returned.
 */
int dma_memory_set(DMAContext *dma, dma_addr_t addr, uint8_t c, dma_addr_t len)
{
    dma_barrier(dma, DMA_DIRECTION_FROM_DEVICE);

    if (!dma_has_iommu(dma)) {
        do_dma_memory_set(dma->as, addr, c, len);
        return 0;
    }

    return iommu_dma_memory_set(dma, addr, c, len);
}

45
/*
 * Initialise the scatter/gather list @qsg as empty.
 *
 * @alloc_hint: number of entries to allocate room for up front
 * @dma:        DMA context stored in the list
 */
void qemu_sglist_init(QEMUSGList *qsg, int alloc_hint, DMAContext *dma)
{
    qsg->dma = dma;
    qsg->size = 0;
    qsg->nsg = 0;
    qsg->nalloc = alloc_hint;
    qsg->sg = g_malloc(alloc_hint * sizeof(ScatterGatherEntry));
}

54
/*
 * Append the region [@base, @base + @len) to @qsg and add @len to the
 * list's total size.
 *
 * When the entry array is full its capacity is grown to 2 * nalloc + 1
 * before the new entry is stored.
 */
void qemu_sglist_add(QEMUSGList *qsg, dma_addr_t base, dma_addr_t len)
{
    ScatterGatherEntry *slot;

    if (qsg->nalloc == qsg->nsg) {
        qsg->nalloc = 2 * qsg->nalloc + 1;
        qsg->sg = g_realloc(qsg->sg, qsg->nalloc * sizeof(ScatterGatherEntry));
    }

    slot = &qsg->sg[qsg->nsg];
    slot->base = base;
    slot->len = len;

    qsg->size += len;
    qsg->nsg++;
}

/*
 * Free the entry array owned by @qsg and zero the whole structure.
 * The QEMUSGList object itself is not freed.
 */
void qemu_sglist_destroy(QEMUSGList *qsg)
{
    ScatterGatherEntry *entries = qsg->sg;

    g_free(entries);
    memset(qsg, 0, sizeof(*qsg));
}

72
typedef struct {
73
    BlockDriverAIOCB common;
74 75 76 77
    BlockDriverState *bs;
    BlockDriverAIOCB *acb;
    QEMUSGList *sg;
    uint64_t sector_num;
78
    DMADirection dir;
79
    bool in_cancel;
80
    int sg_cur_index;
81
    dma_addr_t sg_cur_byte;
82 83
    QEMUIOVector iov;
    QEMUBH *bh;
84
    DMAIOFunc *io_func;
85
} DMAAIOCB;
86 87 88 89 90

static void dma_bdrv_cb(void *opaque, int ret);

static void reschedule_dma(void *opaque)
{
91
    DMAAIOCB *dbs = (DMAAIOCB *)opaque;
92 93 94

    qemu_bh_delete(dbs->bh);
    dbs->bh = NULL;
95
    dma_bdrv_cb(dbs, 0);
96 97 98 99
}

static void continue_after_map_failure(void *opaque)
{
100
    DMAAIOCB *dbs = (DMAAIOCB *)opaque;
101 102 103 104 105

    dbs->bh = qemu_bh_new(reschedule_dma, dbs);
    qemu_bh_schedule(dbs->bh);
}

106
/*
 * Unmap every buffer currently held in dbs->iov, then reset the vector.
 * Each element's full length is passed as both the mapped length and
 * the accessed length.
 */
static void dma_bdrv_unmap(DMAAIOCB *dbs)
{
    int idx = 0;

    while (idx < dbs->iov.niov) {
        dma_memory_unmap(dbs->sg->dma, dbs->iov.iov[idx].iov_base,
                         dbs->iov.iov[idx].iov_len, dbs->dir,
                         dbs->iov.iov[idx].iov_len);
        idx++;
    }

    qemu_iovec_reset(&dbs->iov);
}

/*
 * Finish the request @dbs with status @ret.
 *
 * Unmaps any remaining buffers, invokes the completion callback if one
 * is set, destroys the I/O vector and deletes a pending bottom half.
 * The AIOCB is released unless a cancel is in progress.
 */
static void dma_complete(DMAAIOCB *dbs, int ret)
{
    trace_dma_complete(dbs, ret, dbs->common.cb);

    dma_bdrv_unmap(dbs);

    if (dbs->common.cb != NULL) {
        dbs->common.cb(dbs->common.opaque, ret);
    }

    qemu_iovec_destroy(&dbs->iov);

    if (dbs->bh != NULL) {
        qemu_bh_delete(dbs->bh);
        dbs->bh = NULL;
    }

    /*
     * A request may complete while dma_aio_cancel is still running.  The
     * AIOCB must then stay allocated because dma_aio_cancel keeps
     * referencing it.
     */
    if (dbs->in_cancel) {
        return;
    }

    qemu_aio_release(dbs);
}

B
blueswir1 已提交
139
static void dma_bdrv_cb(void *opaque, int ret)
140 141
{
    DMAAIOCB *dbs = (DMAAIOCB *)opaque;
142
    dma_addr_t cur_addr, cur_len;
143 144
    void *mem;

K
Kevin Wolf 已提交
145 146
    trace_dma_bdrv_cb(dbs, ret);

147 148 149
    dbs->acb = NULL;
    dbs->sector_num += dbs->iov.size / 512;
    dma_bdrv_unmap(dbs);
150 151

    if (dbs->sg_cur_index == dbs->sg->nsg || ret < 0) {
152
        dma_complete(dbs, ret);
153 154 155 156 157 158
        return;
    }

    while (dbs->sg_cur_index < dbs->sg->nsg) {
        cur_addr = dbs->sg->sg[dbs->sg_cur_index].base + dbs->sg_cur_byte;
        cur_len = dbs->sg->sg[dbs->sg_cur_index].len - dbs->sg_cur_byte;
159
        mem = dma_memory_map(dbs->sg->dma, cur_addr, &cur_len, dbs->dir);
160 161 162 163 164 165 166 167 168 169 170
        if (!mem)
            break;
        qemu_iovec_add(&dbs->iov, mem, cur_len);
        dbs->sg_cur_byte += cur_len;
        if (dbs->sg_cur_byte == dbs->sg->sg[dbs->sg_cur_index].len) {
            dbs->sg_cur_byte = 0;
            ++dbs->sg_cur_index;
        }
    }

    if (dbs->iov.size == 0) {
K
Kevin Wolf 已提交
171
        trace_dma_map_wait(dbs);
172 173 174 175
        cpu_register_map_client(dbs, continue_after_map_failure);
        return;
    }

176 177
    dbs->acb = dbs->io_func(dbs->bs, dbs->sector_num, &dbs->iov,
                            dbs->iov.size / 512, dma_bdrv_cb, dbs);
178
    assert(dbs->acb);
179 180
}

181 182 183 184
/*
 * Cancel hook installed in dma_aiocb_info.
 *
 * If a block request is recorded in dbs->acb it is cancelled with
 * in_cancel set, so that a completion arriving meanwhile does not
 * release the AIOCB.  The completion callback is then cleared and the
 * request is completed with status 0.
 */
static void dma_aio_cancel(BlockDriverAIOCB *acb)
{
    DMAAIOCB *dbs = container_of(acb, DMAAIOCB, common);
    BlockDriverAIOCB *inflight;

    trace_dma_aio_cancel(dbs);

    inflight = dbs->acb;
    if (inflight != NULL) {
        dbs->acb = NULL;
        dbs->in_cancel = true;
        bdrv_aio_cancel(inflight);
        dbs->in_cancel = false;
    }

    dbs->common.cb = NULL;
    dma_complete(dbs, 0);
}

S
Stefan Hajnoczi 已提交
198
static const AIOCBInfo dma_aiocb_info = {
199 200 201 202
    .aiocb_size         = sizeof(DMAAIOCB),
    .cancel             = dma_aio_cancel,
};

203
BlockDriverAIOCB *dma_bdrv_io(
204
    BlockDriverState *bs, QEMUSGList *sg, uint64_t sector_num,
205
    DMAIOFunc *io_func, BlockDriverCompletionFunc *cb,
206
    void *opaque, DMADirection dir)
207
{
S
Stefan Hajnoczi 已提交
208
    DMAAIOCB *dbs = qemu_aio_get(&dma_aiocb_info, bs, cb, opaque);
209

210
    trace_dma_bdrv_io(dbs, bs, sector_num, (dir == DMA_DIRECTION_TO_DEVICE));
K
Kevin Wolf 已提交
211

212
    dbs->acb = NULL;
213 214 215 216 217
    dbs->bs = bs;
    dbs->sg = sg;
    dbs->sector_num = sector_num;
    dbs->sg_cur_index = 0;
    dbs->sg_cur_byte = 0;
218
    dbs->dir = dir;
219
    dbs->io_func = io_func;
220 221 222
    dbs->bh = NULL;
    qemu_iovec_init(&dbs->iov, sg->nsg);
    dma_bdrv_cb(dbs, 0);
223
    return &dbs->common;
224 225 226 227 228 229 230
}


/*
 * Start a scatter/gather transfer on @bs at @sector using
 * bdrv_aio_readv() as the I/O function and
 * DMA_DIRECTION_FROM_DEVICE as the mapping direction.
 *
 * @cb is called with @opaque on completion.  Returns the AIOCB created
 * by dma_bdrv_io().
 */
BlockDriverAIOCB *dma_bdrv_read(BlockDriverState *bs,
                                QEMUSGList *sg, uint64_t sector,
                                void (*cb)(void *opaque, int ret), void *opaque)
{
    DMAIOFunc *submit = bdrv_aio_readv;

    return dma_bdrv_io(bs, sg, sector, submit, cb, opaque,
                       DMA_DIRECTION_FROM_DEVICE);
}

/*
 * Start a scatter/gather transfer on @bs at @sector using
 * bdrv_aio_writev() as the I/O function and
 * DMA_DIRECTION_TO_DEVICE as the mapping direction.
 *
 * @cb is called with @opaque on completion.  Returns the AIOCB created
 * by dma_bdrv_io().
 */
BlockDriverAIOCB *dma_bdrv_write(BlockDriverState *bs,
                                 QEMUSGList *sg, uint64_t sector,
                                 void (*cb)(void *opaque, int ret), void *opaque)
{
    DMAIOFunc *submit = bdrv_aio_writev;

    return dma_bdrv_io(bs, sg, sector, submit, cb, opaque,
                       DMA_DIRECTION_TO_DEVICE);
}
242 243


244 245
/*
 * Copy up to @len bytes between the linear buffer @ptr and the memory
 * described by the scatter/gather list @sg, in direction @dir.
 *
 * The amount transferred is capped at sg->size.  Entries are visited in
 * order, each starting at its base address.
 *
 * Returns sg->size minus the number of bytes transferred.
 */
static uint64_t dma_buf_rw(uint8_t *ptr, int32_t len, QEMUSGList *sg,
                           DMADirection dir)
{
    uint64_t resid = sg->size;
    int idx;

    len = MIN(len, resid);
    for (idx = 0; len > 0; idx++) {
        ScatterGatherEntry entry = sg->sg[idx];
        int32_t xfer = MIN(len, entry.len);

        dma_memory_rw(sg->dma, entry.base, ptr, xfer, dir);

        ptr += xfer;
        len -= xfer;
        resid -= xfer;
    }

    return resid;
}

/*
 * Run dma_buf_rw() on @ptr, @len and @sg with
 * DMA_DIRECTION_FROM_DEVICE and return its result.
 */
uint64_t dma_buf_read(uint8_t *ptr, int32_t len, QEMUSGList *sg)
{
    uint64_t resid = dma_buf_rw(ptr, len, sg, DMA_DIRECTION_FROM_DEVICE);

    return resid;
}

/*
 * Run dma_buf_rw() on @ptr, @len and @sg with
 * DMA_DIRECTION_TO_DEVICE and return its result.
 */
uint64_t dma_buf_write(uint8_t *ptr, int32_t len, QEMUSGList *sg)
{
    uint64_t resid = dma_buf_rw(ptr, len, sg, DMA_DIRECTION_TO_DEVICE);

    return resid;
}
274 275 276 277 278 279

/*
 * Start block accounting for a scatter/gather transfer: forwards to
 * bdrv_acct_start() with the total size of @sg as the byte count.
 *
 * @bs:     block device the accounting is for
 * @cookie: accounting cookie passed through to bdrv_acct_start()
 * @sg:     scatter/gather list whose size field is reported
 * @type:   accounting type passed through to bdrv_acct_start()
 */
void dma_acct_start(BlockDriverState *bs, BlockAcctCookie *cookie,
                    QEMUSGList *sg, enum BlockAcctType type)
{
    bdrv_acct_start(bs, cookie, sg->size, type);
}
280 281 282 283

/*
 * Check whether the DMA range [@addr, @addr + @len) can be accessed in
 * direction @dir through the IOMMU of @dma.
 *
 * The range is walked one translation at a time.  Each chunk must both
 * translate successfully and be reported as accessible by
 * address_space_access_valid().
 *
 * Returns true if every chunk passes, false at the first failure.
 */
bool iommu_dma_memory_valid(DMAContext *dma, dma_addr_t addr, dma_addr_t len,
                            DMADirection dir)
{
    hwaddr paddr, plen;

#ifdef DEBUG_IOMMU
    fprintf(stderr, "dma_memory_check context=%p addr=0x" DMA_ADDR_FMT
            " len=0x" DMA_ADDR_FMT " dir=%d\n", dma, addr, len, dir);
#endif

    while (len) {
        if (dma->translate(dma, addr, &paddr, &plen, dir) != 0) {
            return false;
        }

        /* The translation might be valid for larger regions. */
        if (plen > len) {
            plen = len;
        }

        /*
         * Only the plen bytes starting at paddr belong to this
         * translation; the rest of the request is translated and
         * checked by later iterations.
         */
        if (!address_space_access_valid(dma->as, paddr, plen,
                                        dir == DMA_DIRECTION_FROM_DEVICE)) {
            return false;
        }

        len -= plen;
        addr += plen;
    }

    return true;
}

/*
 * Transfer @len bytes between the buffer @buf and DMA address @addr
 * through the IOMMU of @dma, in direction @dir.
 *
 * The range is processed one translation at a time; each translated
 * chunk is passed to address_space_rw() on dma->as.
 *
 * Returns 0 on success.  If a translation fails, the part of @buf not
 * yet processed is zeroed and -1 is returned.
 */
int iommu_dma_memory_rw(DMAContext *dma, dma_addr_t addr,
                        void *buf, dma_addr_t len, DMADirection dir)
{
    hwaddr paddr, plen;
    int err;

#ifdef DEBUG_IOMMU
    fprintf(stderr, "dma_memory_rw context=%p addr=0x" DMA_ADDR_FMT " len=0x"
            DMA_ADDR_FMT " dir=%d\n", dma, addr, len, dir);
#endif

    for (; len != 0; len -= plen, addr += plen, buf += plen) {
        err = dma->translate(dma, addr, &paddr, &plen, dir);
        if (err) {
            /*
             * When a read from the guest fails, the destination buffer
             * is cleared so that a device which does not check for
             * errors cannot expose qemu internal memory.
             *
             * NOTE(review): the buffer is cleared for either direction,
             * not only for reads - confirm this is intended.
             */
            memset(buf, 0, len);
            return -1;
        }

        /* The translation might be valid for larger regions. */
        if (plen > len) {
            plen = len;
        }

        address_space_rw(dma->as, paddr, buf, plen,
                         dir == DMA_DIRECTION_FROM_DEVICE);
    }

    return 0;
}

/*
 * Fill @len bytes at DMA address @addr with the byte @c through the
 * IOMMU of @dma.
 *
 * Each chunk is translated with DMA_DIRECTION_FROM_DEVICE and then
 * filled in dma->as by do_dma_memory_set().
 *
 * Returns 0 on success, or the translate callback's error code at the
 * first failed translation; chunks filled before that stay filled.
 */
int iommu_dma_memory_set(DMAContext *dma, dma_addr_t addr, uint8_t c,
                         dma_addr_t len)
{
    hwaddr paddr, plen;
    int err;

#ifdef DEBUG_IOMMU
    fprintf(stderr, "dma_memory_set context=%p addr=0x" DMA_ADDR_FMT
            " len=0x" DMA_ADDR_FMT "\n", dma, addr, len);
#endif

    for (; len != 0; len -= plen, addr += plen) {
        err = dma->translate(dma, addr, &paddr, &plen,
                             DMA_DIRECTION_FROM_DEVICE);
        if (err) {
            return err;
        }

        /* The translation might be valid for larger regions. */
        if (plen > len) {
            plen = len;
        }

        do_dma_memory_set(dma->as, paddr, c, plen);
    }

    return 0;
}

383
void dma_context_init(DMAContext *dma, AddressSpace *as, DMATranslateFunc translate,
384 385 386 387 388 389
                      DMAMapFunc map, DMAUnmapFunc unmap)
{
#ifdef DEBUG_IOMMU
    fprintf(stderr, "dma_context_init(%p, %p, %p, %p)\n",
            dma, translate, map, unmap);
#endif
390
    dma->as = as;
391 392 393 394 395 396 397 398 399
    dma->translate = translate;
    dma->map = map;
    dma->unmap = unmap;
}

/*
 * Map the DMA range starting at @addr for access in direction @dir.
 *
 * @len: in: requested length; out: length actually mapped
 *
 * If the context has a map callback, the whole request is delegated to
 * it.  Otherwise @addr is translated and the result is mapped with
 * address_space_map() on dma->as.
 *
 * Returns the value from the callback or address_space_map(), or NULL
 * if the translation fails.
 */
void *iommu_dma_memory_map(DMAContext *dma, dma_addr_t addr, dma_addr_t *len,
                           DMADirection dir)
{
    hwaddr paddr, plen;
    void *host;

    if (dma->map != NULL) {
        return dma->map(dma, addr, len, dir);
    }

    plen = *len;
    if (dma->translate(dma, addr, &paddr, &plen, dir)) {
        return NULL;
    }

    /*
     * A shorter plen means the virtual region is contiguous but the
     * translated physical region is not.  Just clamp *len, much like
     * address_space_map() does.
     */
    if (plen < *len) {
        *len = plen;
    }

    host = address_space_map(dma->as, paddr, &plen,
                             dir == DMA_DIRECTION_FROM_DEVICE);
    *len = plen;

    return host;
}

/*
 * Release a mapping of @len bytes at host pointer @buffer.
 *
 * @access_len is forwarded unchanged.  The context's unmap callback is
 * used when one is set; otherwise address_space_unmap() is called on
 * dma->as.
 */
void iommu_dma_memory_unmap(DMAContext *dma, void *buffer, dma_addr_t len,
                            DMADirection dir, dma_addr_t access_len)
{
    if (!dma->unmap) {
        address_space_unmap(dma->as, buffer, len,
                            dir == DMA_DIRECTION_FROM_DEVICE, access_len);
        return;
    }

    dma->unmap(dma, buffer, len, dir, access_len);
}