scsi-disk.c 84.1 KB
Newer Older
P
pbrook 已提交
1 2 3 4 5 6 7
/*
 * SCSI Device emulation
 *
 * Copyright (c) 2006 CodeSourcery.
 * Based on code by Fabrice Bellard
 *
 * Written by Paul Brook
8 9 10 11 12 13
 * Modifications:
 *  2009-Dec-12 Artyom Tarasenko : implemented standard inquiry for the case
 *                                 when the allocation length of CDB is smaller
 *                                 than 36.
 *  2009-Oct-13 Artyom Tarasenko : implemented the block descriptor in the
 *                                 MODE SENSE response.
P
pbrook 已提交
14
 *
M
Matthew Fernandez 已提交
15
 * This code is licensed under the LGPL.
P
pbrook 已提交
16 17
 *
 * Note that this file only handles the SCSI architecture model and device
18 19
 * commands.  Emulation of interface/link layer protocols is handled by
 * the host adapter emulator.
P
pbrook 已提交
20 21 22 23 24
 */

/* Define DEBUG_SCSI to have DPRINTF() trace the emulation on stdout. */
/* #define DEBUG_SCSI */

#ifndef DEBUG_SCSI
/* Tracing disabled: the arguments are discarded without being evaluated. */
#define DPRINTF(fmt, ...) do {} while (0)
#else
#define DPRINTF(fmt, ...)                                   \
    do {                                                    \
        printf("scsi-disk: " fmt , ## __VA_ARGS__);         \
    } while (0)
#endif

P
pbrook 已提交
31
#include "qemu-common.h"
32
#include "qemu/error-report.h"
P
Paolo Bonzini 已提交
33 34
#include "hw/scsi/scsi.h"
#include "block/scsi.h"
35
#include "sysemu/sysemu.h"
36
#include "sysemu/block-backend.h"
37
#include "sysemu/blockdev.h"
P
Paolo Bonzini 已提交
38
#include "hw/block/block.h"
39
#include "sysemu/dma.h"
40

41 42 43 44
#ifdef __linux
#include <scsi/sg.h>
#endif

45
/* Fixed limits used by the emulation. */
#define SCSI_WRITE_SAME_MAX         (512 * 1024)
/* Size handed to scsi_init_iovec() for the per-request bounce buffer. */
#define SCSI_DMA_BUF_SIZE           (128 * 1024)
/* Upper bound applied to the length of standard INQUIRY data. */
#define SCSI_MAX_INQUIRY_LEN        256
#define SCSI_MAX_MODE_LEN           256

/* Defaults for the tunable limits. */
#define DEFAULT_DISCARD_GRANULARITY 4096
#define DEFAULT_MAX_UNMAP_SIZE      (1 << 30)   /* 1 GB */
#define DEFAULT_MAX_IO_SIZE         INT_MAX     /* 2 GB - 1 block */
P
pbrook 已提交
53

54 55
typedef struct SCSIDiskState SCSIDiskState;

56 57
typedef struct SCSIDiskReq {
    SCSIRequest req;
P
pbrook 已提交
58
    /* Both sector and sector_count are in terms of qemu 512 byte blocks.  */
59 60
    uint64_t sector;
    uint32_t sector_count;
61
    uint32_t buflen;
62
    bool started;
63 64
    struct iovec iov;
    QEMUIOVector qiov;
65
    BlockAcctCookie acct;
66
} SCSIDiskReq;
P
pbrook 已提交
67

68 69 70
/*
 * Bit numbers (not masks) within SCSIDiskState.features; test them with
 * (1 << SCSI_DISK_F_xxx).
 */
#define SCSI_DISK_F_REMOVABLE             0
#define SCSI_DISK_F_DPOFUA                1
#define SCSI_DISK_F_NO_REMOVABLE_DEVOPS   2
71

72
struct SCSIDiskState
P
pbrook 已提交
73
{
74
    SCSIDevice qdev;
75
    uint32_t features;
76
    bool media_changed;
77
    bool media_event;
78
    bool eject_request;
79
    uint64_t wwn;
80 81
    uint64_t port_wwn;
    uint16_t port_index;
82
    uint64_t max_unmap_size;
83
    uint64_t max_io_size;
84
    QEMUBH *bh;
G
Gerd Hoffmann 已提交
85
    char *version;
86
    char *serial;
87 88
    char *vendor;
    char *product;
89
    bool tray_open;
90
    bool tray_locked;
P
pbrook 已提交
91 92
};

93
static int scsi_handle_rw_error(SCSIDiskReq *r, int error);
K
Kevin Wolf 已提交
94

P
Paolo Bonzini 已提交
95
/* Release the data buffer owned by a request. */
static void scsi_free_request(SCSIRequest *req)
{
    SCSIDiskReq *disk_req = DO_UPCAST(SCSIDiskReq, req, req);
    void *buffer = disk_req->iov.iov_base;

    qemu_vfree(buffer);
}

102 103
/*
 * Finish request @r with CHECK CONDITION status, recording @sense as the
 * sense data of the request first.
 */
static void scsi_check_condition(SCSIDiskReq *r, SCSISense sense)
{
    SCSIRequest *req = &r->req;

    DPRINTF("Command complete tag=0x%x sense=%d/%d/%d\n",
            r->req.tag, sense.key, sense.asc, sense.ascq);

    scsi_req_build_sense(req, sense);
    scsi_req_complete(req, CHECK_CONDITION);
}

P
Paolo Bonzini 已提交
111
/*
 * Prepare the request's single-element I/O vector for the next chunk.
 *
 * The bounce buffer is allocated on first use with @size bytes; on later
 * calls @size is ignored and the existing buffer is reused.  The vector
 * length is the smaller of the bytes still to transfer and the buffer size.
 *
 * Returns the number of 512-byte sectors covered by the vector.
 */
static uint32_t scsi_init_iovec(SCSIDiskReq *r, size_t size)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);
    uint64_t remaining;

    if (!r->iov.iov_base) {
        r->buflen = size;
        r->iov.iov_base = blk_blockalign(s->qdev.conf.blk, r->buflen);
    }

    /*
     * Compute the remaining byte count in 64 bits: sector_count is a
     * uint32_t, so "sector_count * 512" done in 32 bits wraps around for
     * transfers of 4 GiB or more and could yield a bogus (even zero)
     * vector length.
     */
    remaining = (uint64_t)r->sector_count * 512;
    r->iov.iov_len = MIN(remaining, r->buflen);

    qemu_iovec_init_external(&r->qiov, &r->iov, 1);
    return r->qiov.size / 512;
}

P
Paolo Bonzini 已提交
124 125 126 127 128 129 130
/*
 * Write the disk-specific part of an in-flight request to @f.
 *
 * Layout: sector (be64), sector_count (be32), buflen (be32), then, if a
 * buffer exists, its contents.  For transfers towards the device the raw
 * iov_len bytes are written; otherwise, unless the request is marked for
 * retry, a be32 length precedes the bytes.
 */
static void scsi_disk_save_request(QEMUFile *f, SCSIRequest *req)
{
    SCSIDiskReq *r = DO_UPCAST(SCSIDiskReq, req, req);

    qemu_put_be64s(f, &r->sector);
    qemu_put_be32s(f, &r->sector_count);
    qemu_put_be32s(f, &r->buflen);

    if (!r->buflen) {
        /* No buffer was ever allocated, nothing more to save. */
        return;
    }

    if (r->req.cmd.mode == SCSI_XFER_TO_DEV) {
        qemu_put_buffer(f, r->iov.iov_base, r->iov.iov_len);
        return;
    }

    if (!req->retry) {
        uint32_t valid_len = r->iov.iov_len;

        qemu_put_be32s(f, &valid_len);
        qemu_put_buffer(f, r->iov.iov_base, r->iov.iov_len);
    }
}

/*
 * Counterpart of scsi_disk_save_request(): restore the disk-specific part
 * of a request from @f, reallocating the data buffer if one was saved.
 */
static void scsi_disk_load_request(QEMUFile *f, SCSIRequest *req)
{
    SCSIDiskReq *r = DO_UPCAST(SCSIDiskReq, req, req);

    qemu_get_be64s(f, &r->sector);
    qemu_get_be32s(f, &r->sector_count);
    qemu_get_be32s(f, &r->buflen);

    if (r->buflen != 0) {
        /* Recreate the buffer with the size the source side had. */
        scsi_init_iovec(r, r->buflen);

        if (r->req.cmd.mode == SCSI_XFER_TO_DEV) {
            qemu_get_buffer(f, r->iov.iov_base, r->iov.iov_len);
        } else if (!r->req.retry) {
            uint32_t saved_len;

            /* An explicit length precedes the data in this case. */
            qemu_get_be32s(f, &saved_len);
            r->iov.iov_len = saved_len;
            assert(r->iov.iov_len <= r->buflen);
            qemu_get_buffer(f, r->iov.iov_base, r->iov.iov_len);
        }
    }

    /* Always (re)build the qiov, iov_len may have changed above. */
    qemu_iovec_init_external(&r->qiov, &r->iov, 1);
}

165
static void scsi_aio_complete(void *opaque, int ret)
166 167 168 169
{
    SCSIDiskReq *r = (SCSIDiskReq *)opaque;
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);

170 171
    assert(r->req.aiocb != NULL);
    r->req.aiocb = NULL;
172
    block_acct_done(blk_get_stats(s->qdev.conf.blk), &r->acct);
173
    if (r->req.io_canceled) {
174
        scsi_req_cancel_complete(&r->req);
175 176
        goto done;
    }
177

178
    if (ret < 0) {
179 180 181 182 183 184 185 186
        if (scsi_handle_rw_error(r, -ret)) {
            goto done;
        }
    }

    scsi_req_complete(&r->req, GOOD);

done:
187
    scsi_req_unref(&r->req);
188 189
}

190 191 192 193 194 195 196 197 198 199 200
/*
 * Tell whether command @cmd must be treated as "force unit access".
 *
 * VERIFY and WRITE AND VERIFY always are; the 10/12/16-byte READ and WRITE
 * commands are when bit 3 of CDB byte 1 is set; everything else
 * (including READ(6)/WRITE(6)) is not.
 */
static bool scsi_is_cmd_fua(SCSICommand *cmd)
{
    switch (cmd->buf[0]) {
    case VERIFY_10:
    case VERIFY_12:
    case VERIFY_16:
    case WRITE_VERIFY_10:
    case WRITE_VERIFY_12:
    case WRITE_VERIFY_16:
        return true;

    case READ_10:
    case READ_12:
    case READ_16:
    case WRITE_10:
    case WRITE_12:
    case WRITE_16:
        return (cmd->buf[1] & 0x08) ? true : false;

    default:
        /* Includes READ_6 and WRITE_6. */
        return false;
    }
}

/*
 * Final step of a write: for FUA commands start a flush whose completion
 * (scsi_aio_complete) finishes the request, otherwise complete the
 * request right away.  Must be called with no AIO in flight.
 */
static void scsi_write_do_fua(SCSIDiskReq *r)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);

    assert(r->req.aiocb == NULL);

    if (r->req.io_canceled) {
        scsi_req_cancel_complete(&r->req);
    } else if (scsi_is_cmd_fua(&r->req.cmd)) {
        block_acct_start(blk_get_stats(s->qdev.conf.blk), &r->acct, 0,
                         BLOCK_ACCT_FLUSH);
        r->req.aiocb = blk_aio_flush(s->qdev.conf.blk, scsi_aio_complete, r);
        /* The reference is kept for the flush callback. */
        return;
    } else {
        scsi_req_complete(&r->req, GOOD);
    }

    scsi_req_unref(&r->req);
}

240
/*
 * Completion logic for scatter/gather transfers, callable without a
 * pending AIO operation.  @ret is zero or a negative errno.  The whole
 * remaining sector range is accounted as transferred; writes continue
 * with the FUA step, reads complete the request.
 */
static void scsi_dma_complete_noio(SCSIDiskReq *r, int ret)
{
    assert(r->req.aiocb == NULL);

    if (r->req.io_canceled) {
        scsi_req_cancel_complete(&r->req);
        goto out;
    }
    if (ret < 0 && scsi_handle_rw_error(r, -ret)) {
        goto out;
    }

    r->sector += r->sector_count;
    r->sector_count = 0;

    if (r->req.cmd.mode == SCSI_XFER_TO_DEV) {
        /* scsi_write_do_fua() takes over the reference. */
        scsi_write_do_fua(r);
        return;
    }
    scsi_req_complete(&r->req, GOOD);

out:
    scsi_req_unref(&r->req);
}

268 269 270
static void scsi_dma_complete(void *opaque, int ret)
{
    SCSIDiskReq *r = (SCSIDiskReq *)opaque;
271
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);
272 273

    assert(r->req.aiocb != NULL);
274 275 276 277
    r->req.aiocb = NULL;

    block_acct_done(blk_get_stats(s->qdev.conf.blk), &r->acct);
    scsi_dma_complete_noio(r, ret);
278 279
}

280
static void scsi_read_complete(void * opaque, int ret)
281 282 283
{
    SCSIDiskReq *r = (SCSIDiskReq *)opaque;
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);
284
    int n;
285

286 287
    assert(r->req.aiocb != NULL);
    r->req.aiocb = NULL;
288
    block_acct_done(blk_get_stats(s->qdev.conf.blk), &r->acct);
289
    if (r->req.io_canceled) {
290
        scsi_req_cancel_complete(&r->req);
291 292
        goto done;
    }
293 294

    if (ret < 0) {
295
        if (scsi_handle_rw_error(r, -ret)) {
296
            goto done;
297 298 299
        }
    }

300 301 302 303 304 305
    DPRINTF("Data ready tag=0x%x len=%zd\n", r->req.tag, r->qiov.size);

    n = r->qiov.size / 512;
    r->sector += n;
    r->sector_count -= n;
    scsi_req_data(&r->req, r->qiov.size);
306 307

done:
308
    scsi_req_unref(&r->req);
309
}
K
Kevin Wolf 已提交
310

P
Paolo Bonzini 已提交
311
/* Actually issue a read to the block device.  */
312
static void scsi_do_read(SCSIDiskReq *r, int ret)
P
Paolo Bonzini 已提交
313 314 315 316
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);
    uint32_t n;

317 318
    assert (r->req.aiocb == NULL);

319
    if (r->req.io_canceled) {
320
        scsi_req_cancel_complete(&r->req);
321 322
        goto done;
    }
P
Paolo Bonzini 已提交
323 324 325 326 327 328 329

    if (ret < 0) {
        if (scsi_handle_rw_error(r, -ret)) {
            goto done;
        }
    }

P
Paolo Bonzini 已提交
330 331 332
    /* The request is used as the AIO opaque value, so add a ref.  */
    scsi_req_ref(&r->req);

P
Paolo Bonzini 已提交
333
    if (r->req.sg) {
334
        dma_acct_start(s->qdev.conf.blk, &r->acct, r->req.sg, BLOCK_ACCT_READ);
P
Paolo Bonzini 已提交
335
        r->req.resid -= r->req.sg->size;
336 337
        r->req.aiocb = dma_blk_read(s->qdev.conf.blk, r->req.sg, r->sector,
                                    scsi_dma_complete, r);
P
Paolo Bonzini 已提交
338 339
    } else {
        n = scsi_init_iovec(r, SCSI_DMA_BUF_SIZE);
340
        block_acct_start(blk_get_stats(s->qdev.conf.blk), &r->acct,
341
                         n * BDRV_SECTOR_SIZE, BLOCK_ACCT_READ);
342 343
        r->req.aiocb = blk_aio_readv(s->qdev.conf.blk, r->sector, &r->qiov, n,
                                     scsi_read_complete, r);
P
Paolo Bonzini 已提交
344 345 346
    }

done:
347
    scsi_req_unref(&r->req);
P
Paolo Bonzini 已提交
348 349
}

350 351 352 353 354 355 356 357 358 359 360 361
/*
 * AIO callback used when a flush precedes a read: finish the flush
 * accounting, then continue with the actual read.
 */
static void scsi_do_read_cb(void *opaque, int ret)
{
    SCSIDiskReq *r = (SCSIDiskReq *)opaque;
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);

    assert (r->req.aiocb != NULL);
    r->req.aiocb = NULL;
    block_acct_done(blk_get_stats(s->qdev.conf.blk), &r->acct);

    scsi_do_read(r, ret);
}

362 363
/* Read more data from scsi device into buffer.  */
static void scsi_read_data(SCSIRequest *req)
P
pbrook 已提交
364
{
365
    SCSIDiskReq *r = DO_UPCAST(SCSIDiskReq, req, req);
K
Kevin Wolf 已提交
366
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);
P
Paolo Bonzini 已提交
367
    bool first;
P
pbrook 已提交
368

P
pbrook 已提交
369 370
    DPRINTF("Read sector_count=%d\n", r->sector_count);
    if (r->sector_count == 0) {
371 372
        /* This also clears the sense buffer for REQUEST SENSE.  */
        scsi_req_complete(&r->req, GOOD);
P
pbrook 已提交
373
        return;
P
pbrook 已提交
374 375
    }

376 377 378
    /* No data transfer may already be in progress */
    assert(r->req.aiocb == NULL);

379 380
    /* The request is used as the AIO opaque value, so add a ref.  */
    scsi_req_ref(&r->req);
381 382 383 384 385 386
    if (r->req.cmd.mode == SCSI_XFER_TO_DEV) {
        DPRINTF("Data transfer direction invalid\n");
        scsi_read_complete(r, -EINVAL);
        return;
    }

387 388
    if (s->tray_open) {
        scsi_read_complete(r, -ENOMEDIUM);
389
        return;
390
    }
391

P
Paolo Bonzini 已提交
392
    first = !r->started;
393
    r->started = true;
P
Paolo Bonzini 已提交
394
    if (first && scsi_is_cmd_fua(&r->req.cmd)) {
395
        block_acct_start(blk_get_stats(s->qdev.conf.blk), &r->acct, 0,
396
                         BLOCK_ACCT_FLUSH);
397
        r->req.aiocb = blk_aio_flush(s->qdev.conf.blk, scsi_do_read_cb, r);
398
    } else {
P
Paolo Bonzini 已提交
399
        scsi_do_read(r, 0);
400
    }
P
pbrook 已提交
401 402
}

403 404 405 406 407 408 409
/*
 * scsi_handle_rw_error has two return values.  0 means that the error
 * must be ignored, 1 means that the error has been processed and the
 * caller should not do anything else for this request.  Note that
 * scsi_handle_rw_error always manages its reference counts, independent
 * of the return value.
 */
410
static int scsi_handle_rw_error(SCSIDiskReq *r, int error)
K
Kevin Wolf 已提交
411
{
412
    bool is_read = (r->req.cmd.mode == SCSI_XFER_FROM_DEV);
413
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);
414 415
    BlockErrorAction action = blk_get_error_action(s->qdev.conf.blk,
                                                   is_read, error);
416

W
Wenchao Xia 已提交
417
    if (action == BLOCK_ERROR_ACTION_REPORT) {
418
        switch (error) {
419 420 421
        case ENOMEDIUM:
            scsi_check_condition(r, SENSE_CODE(NO_MEDIUM));
            break;
422
        case ENOMEM:
423
            scsi_check_condition(r, SENSE_CODE(TARGET_FAILURE));
424 425
            break;
        case EINVAL:
426
            scsi_check_condition(r, SENSE_CODE(INVALID_FIELD));
427
            break;
428 429 430
        case ENOSPC:
            scsi_check_condition(r, SENSE_CODE(SPACE_ALLOC_FAILED));
            break;
431
        default:
432
            scsi_check_condition(r, SENSE_CODE(IO_ERROR));
433
            break;
434
        }
435
    }
436
    blk_error_action(s->qdev.conf.blk, action, is_read, error);
W
Wenchao Xia 已提交
437
    if (action == BLOCK_ERROR_ACTION_STOP) {
438 439
        scsi_req_retry(&r->req);
    }
W
Wenchao Xia 已提交
440
    return action != BLOCK_ERROR_ACTION_IGNORE;
441 442
}

443
/*
 * Write-side completion logic, callable without a pending AIO operation.
 * @ret is zero or a negative errno.  Advances the sector cursor by the
 * chunk just written; when nothing is left the FUA step finishes the
 * request, otherwise the next chunk of data is requested from the HBA.
 */
static void scsi_write_complete_noio(SCSIDiskReq *r, int ret)
{
    uint32_t written;

    assert (r->req.aiocb == NULL);

    if (r->req.io_canceled) {
        scsi_req_cancel_complete(&r->req);
        goto out;
    }
    if (ret < 0 && scsi_handle_rw_error(r, -ret)) {
        goto out;
    }

    written = r->qiov.size / 512;
    r->sector += written;
    r->sector_count -= written;

    if (r->sector_count == 0) {
        /* scsi_write_do_fua() takes over the reference. */
        scsi_write_do_fua(r);
        return;
    }

    scsi_init_iovec(r, SCSI_DMA_BUF_SIZE);
    DPRINTF("Write complete tag=0x%x more=%zd\n", r->req.tag, r->qiov.size);
    scsi_req_data(&r->req, r->qiov.size);

out:
    scsi_req_unref(&r->req);
}

476 477 478 479 480 481 482 483 484 485 486 487
/*
 * AIO callback for buffered writes: clear the in-flight marker, close the
 * accounting period and run the common write completion logic.
 */
static void scsi_write_complete(void * opaque, int ret)
{
    SCSIDiskReq *r = (SCSIDiskReq *)opaque;
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);

    assert (r->req.aiocb != NULL);
    r->req.aiocb = NULL;
    block_acct_done(blk_get_stats(s->qdev.conf.blk), &r->acct);

    scsi_write_complete_noio(r, ret);
}

488
/*
 * Write the data the HBA has placed in the request buffer (or described
 * by the scatter/gather list) to the block backend.
 *
 * On the very first call of a buffered transfer no data is available
 * yet, so the function only asks for it.  VERIFY commands consume the
 * data without writing anything.
 */
static void scsi_write_data(SCSIRequest *req)
{
    SCSIDiskReq *r = DO_UPCAST(SCSIDiskReq, req, req);
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);

    /* No data transfer may already be in progress */
    assert(r->req.aiocb == NULL);

    /* The request is used as the AIO opaque value, so add a ref.  */
    scsi_req_ref(&r->req);

    if (r->req.cmd.mode != SCSI_XFER_TO_DEV) {
        DPRINTF("Data transfer direction invalid\n");
        scsi_write_complete_noio(r, -EINVAL);
        return;
    }

    if (!r->req.sg && !r->qiov.size) {
        /* Called for the first time.  Ask the driver to send us more data.  */
        r->started = true;
        scsi_write_complete_noio(r, 0);
        return;
    }

    if (s->tray_open) {
        scsi_write_complete_noio(r, -ENOMEDIUM);
        return;
    }

    switch (r->req.cmd.buf[0]) {
    case VERIFY_10:
    case VERIFY_12:
    case VERIFY_16:
        /* Nothing is written; just account the data as consumed. */
        if (r->req.sg) {
            scsi_dma_complete_noio(r, 0);
        } else {
            scsi_write_complete_noio(r, 0);
        }
        return;
    default:
        break;
    }

    if (!r->req.sg) {
        uint32_t nb_sectors = r->qiov.size / 512;

        block_acct_start(blk_get_stats(s->qdev.conf.blk), &r->acct,
                         nb_sectors * BDRV_SECTOR_SIZE, BLOCK_ACCT_WRITE);
        r->req.aiocb = blk_aio_writev(s->qdev.conf.blk, r->sector, &r->qiov,
                                      nb_sectors, scsi_write_complete, r);
    } else {
        dma_acct_start(s->qdev.conf.blk, &r->acct, r->req.sg, BLOCK_ACCT_WRITE);
        r->req.resid -= r->req.sg->size;
        r->req.aiocb = dma_blk_write(s->qdev.conf.blk, r->req.sg, r->sector,
                                     scsi_dma_complete, r);
    }
}
P
pbrook 已提交
539

P
pbrook 已提交
540
/* Return a pointer to the data buffer.  */
541
static uint8_t *scsi_get_buf(SCSIRequest *req)
P
pbrook 已提交
542
{
543
    SCSIDiskReq *r = DO_UPCAST(SCSIDiskReq, req, req);
P
pbrook 已提交
544

545
    return (uint8_t *)r->iov.iov_base;
P
pbrook 已提交
546 547
}

548 549
/*
 * Build the response to an INQUIRY command in @outbuf.
 *
 * With the EVPD bit (bit 0 of CDB byte 1) clear, standard INQUIRY data
 * is produced; with it set, the vital product data page selected by CDB
 * byte 2 is produced.
 *
 * Returns the number of valid bytes in @outbuf, or -1 if the request
 * cannot be served (unsupported page, non-zero page code without EVPD,
 * missing serial number, block limits on a CD-ROM).
 *
 * NOTE(review): several bytes are never written here, which presumably
 * relies on the caller handing in a zeroed, sufficiently large buffer --
 * confirm against the caller.
 */
static int scsi_disk_emulate_inquiry(SCSIRequest *req, uint8_t *outbuf)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, req->dev);
    uint8_t page_code;
    int payload_start;
    int len;

    if (!(req->cmd.buf[1] & 0x1)) {
        /* Standard INQUIRY data; only PAGE CODE == 0 is valid here. */
        if (req->cmd.buf[2] != 0) {
            return -1;
        }

        len = req->cmd.xfer;
        if (len > SCSI_MAX_INQUIRY_LEN) {
            len = SCSI_MAX_INQUIRY_LEN;
        }

        outbuf[0] = s->qdev.type & 0x1f;
        outbuf[1] = (s->features & (1 << SCSI_DISK_F_REMOVABLE)) ? 0x80 : 0;

        /*
         * We claim conformance to SPC-3, which is required for guests
         * to ask for modern features like READ CAPACITY(16) or the
         * block characteristics VPD page by default.  Not all of SPC-3
         * is actually implemented, but we're good enough.
         */
        outbuf[2] = 5;
        outbuf[3] = 2 | 0x10; /* Format 2, HiSup */

        /*
         * Additional Length = (Len - 1) - 4.  If the allocation length
         * of the CDB is too small, the additional length is not adjusted.
         */
        outbuf[4] = (len > 36) ? len - 5 : 36 - 5;

        /* Sync data transfer and TCQ.  */
        outbuf[7] = 0x10 | (req->bus->info->tcq ? 0x02 : 0);

        /* Space-padded vendor and product, then up to 4 version bytes. */
        strpadcpy((char *) &outbuf[8], 8, s->vendor, ' ');
        strpadcpy((char *) &outbuf[16], 16, s->product, ' ');
        memset(&outbuf[32], 0, 4);
        memcpy(&outbuf[32], s->version, MIN(4, strlen(s->version)));

        return len;
    }

    /* Vital product data: common 4-byte page header first. */
    page_code = req->cmd.buf[2];

    outbuf[0] = s->qdev.type & 0x1f;
    outbuf[1] = page_code; /* this page */
    outbuf[2] = 0x00;
    outbuf[3] = 0x00;      /* page length, filled in at the end */
    payload_start = 4;
    len = payload_start;

    switch (page_code) {
    case 0x00: /* Supported page codes, mandatory */
        DPRINTF("Inquiry EVPD[Supported pages] "
                "buffer size %zd\n", req->cmd.xfer);
        outbuf[len++] = 0x00; /* list of supported pages (this page) */
        if (s->serial) {
            outbuf[len++] = 0x80; /* unit serial number */
        }
        outbuf[len++] = 0x83; /* device identification */
        if (s->qdev.type == TYPE_DISK) {
            outbuf[len++] = 0xb0; /* block limits */
            outbuf[len++] = 0xb2; /* thin provisioning */
        }
        break;

    case 0x80: /* Device serial number, optional */
    {
        int serial_len;

        if (!s->serial) {
            DPRINTF("Inquiry (EVPD[Serial number] not supported\n");
            return -1;
        }

        /* At most 20 characters of the serial number are reported. */
        serial_len = strlen(s->serial);
        if (serial_len > 20) {
            serial_len = 20;
        }

        DPRINTF("Inquiry EVPD[Serial number] "
                "buffer size %zd\n", req->cmd.xfer);
        memcpy(outbuf + len, s->serial, serial_len);
        len += serial_len;
        break;
    }

    case 0x83: /* Device identification page, mandatory */
    {
        /* Identify by serial number, else by the backend's name. */
        const char *id = s->serial ?: blk_name(s->qdev.conf.blk);
        int id_max = s->serial ? 20 : 255 - 8;
        int id_len = strlen(id);

        if (id_len > id_max) {
            id_len = id_max;
        }
        DPRINTF("Inquiry EVPD[Device identification] "
                "buffer size %zd\n", req->cmd.xfer);

        outbuf[len++] = 0x2;    /* ASCII */
        outbuf[len++] = 0;      /* not officially assigned */
        outbuf[len++] = 0;      /* reserved */
        outbuf[len++] = id_len; /* length of data following */
        memcpy(outbuf + len, id, id_len);
        len += id_len;

        if (s->wwn) {
            outbuf[len++] = 0x1; /* Binary */
            outbuf[len++] = 0x3; /* NAA */
            outbuf[len++] = 0;   /* reserved */
            outbuf[len++] = 8;
            stq_be_p(&outbuf[len], s->wwn);
            len += 8;
        }

        if (s->port_wwn) {
            outbuf[len++] = 0x61; /* SAS / Binary */
            outbuf[len++] = 0x93; /* PIV / Target port / NAA */
            outbuf[len++] = 0;    /* reserved */
            outbuf[len++] = 8;
            stq_be_p(&outbuf[len], s->port_wwn);
            len += 8;
        }

        if (s->port_index) {
            outbuf[len++] = 0x61; /* SAS / Binary */
            outbuf[len++] = 0x94; /* PIV / Target port / relative target port */
            outbuf[len++] = 0;    /* reserved */
            outbuf[len++] = 4;
            /* The index goes into the last two of the four bytes. */
            stw_be_p(&outbuf[len + 2], s->port_index);
            len += 4;
        }
        break;
    }

    case 0xb0: /* block limits */
    {
        /* All limits are reported in units of the device block size. */
        unsigned int unmap_sectors =
                s->qdev.conf.discard_granularity / s->qdev.blocksize;
        unsigned int min_io_size =
                s->qdev.conf.min_io_size / s->qdev.blocksize;
        unsigned int opt_io_size =
                s->qdev.conf.opt_io_size / s->qdev.blocksize;
        unsigned int max_unmap_sectors =
                s->max_unmap_size / s->qdev.blocksize;
        unsigned int max_io_sectors =
                s->max_io_size / s->qdev.blocksize;

        if (s->qdev.type == TYPE_ROM) {
            DPRINTF("Inquiry (EVPD[%02X] not supported for CDROM\n",
                    page_code);
            return -1;
        }

        /* required VPD size with unmap support */
        len = 0x40;
        memset(outbuf + 4, 0, len - 4);

        outbuf[4] = 0x1; /* wsnz */

        /* optimal transfer length granularity */
        stw_be_p(&outbuf[6], min_io_size & 0xffff);

        /* maximum transfer length */
        stl_be_p(&outbuf[8], max_io_sectors);

        /* optimal transfer length */
        stl_be_p(&outbuf[12], opt_io_size);

        /* max unmap LBA count, default is 1GB */
        stl_be_p(&outbuf[20], max_unmap_sectors);

        /* max unmap descriptors, 255 fit in 4 kb with an 8-byte header.  */
        stl_be_p(&outbuf[24], 255);

        /* optimal unmap granularity */
        stl_be_p(&outbuf[28], unmap_sectors);

        /* max write same size: upper half zero, lower half as max I/O */
        stl_be_p(&outbuf[36], 0);
        stl_be_p(&outbuf[40], max_io_sectors);
        break;
    }

    case 0xb2: /* thin provisioning */
        len = 8;
        outbuf[4] = 0;
        outbuf[5] = 0xe0; /* unmap & write_same 10/16 all supported */
        outbuf[6] = s->qdev.conf.discard_granularity ? 2 : 1;
        outbuf[7] = 0;
        break;

    default:
        return -1;
    }

    /* done with EVPD: record the payload length in the page header */
    assert(len - payload_start <= 255);
    outbuf[payload_start - 1] = len - payload_start;
    return len;
}

777 778 779 780 781 782
/*
 * True if the device is a CD-ROM drive with the tray closed holding a
 * medium that has more than CD_MAX_SECTORS sectors.
 */
static inline bool media_is_dvd(SCSIDiskState *s)
{
    uint64_t total_sectors;

    if (s->qdev.type != TYPE_ROM ||
        !blk_is_inserted(s->qdev.conf.blk) ||
        s->tray_open) {
        return false;
    }

    blk_get_geometry(s->qdev.conf.blk, &total_sectors);
    return total_sectors > CD_MAX_SECTORS;
}

793 794 795 796 797 798
/*
 * True if the device is a CD-ROM drive with the tray closed holding a
 * medium that has at most CD_MAX_SECTORS sectors.
 */
static inline bool media_is_cd(SCSIDiskState *s)
{
    uint64_t total_sectors;

    if (s->qdev.type != TYPE_ROM ||
        !blk_is_inserted(s->qdev.conf.blk) ||
        s->tray_open) {
        return false;
    }

    blk_get_geometry(s->qdev.conf.blk, &total_sectors);
    return total_sectors <= CD_MAX_SECTORS;
}

809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841
/*
 * Build the fixed 34-byte READ DISC INFORMATION response for a CD-ROM
 * device.  Only data type 0 is supported; other types complete the
 * request with INVALID FIELD.  Returns the response length or -1.
 */
static int scsi_read_disc_information(SCSIDiskState *s, SCSIDiskReq *r,
                                      uint8_t *outbuf)
{
    enum { DISC_INFO_LEN = 34 };

    if (s->qdev.type != TYPE_ROM) {
        return -1;
    }

    /* Types 1/2 are only defined for Blu-Ray.  */
    if ((r->req.cmd.buf[1] & 7) != 0) {
        scsi_check_condition(r, SENSE_CODE(INVALID_FIELD));
        return -1;
    }

    memset(outbuf, 0, DISC_INFO_LEN);
    outbuf[1] = DISC_INFO_LEN - 2;
    outbuf[2] = 0xe;  /* last session complete, disc finalized */
    outbuf[3] = 1;    /* first track on disc */
    outbuf[4] = 1;    /* # of sessions */
    outbuf[5] = 1;    /* first track of last session */
    outbuf[6] = 1;    /* last track of last session */
    outbuf[7] = 0x20; /* unrestricted use */
    outbuf[8] = 0x00; /* CD-ROM or DVD-ROM */
    /*
     * Left at zero:
     *   9-10-11: most significant byte corresponding bytes 4-5-6
     *   12-23:   not meaningful for CD-ROM or DVD-ROM
     *   24-31:   disc bar code
     *   32:      disc application code
     *   33:      number of OPC tables
     */

    return DISC_INFO_LEN;
}

842 843 844
/*
 * Build the response to READ DVD STRUCTURE for a CD-ROM device.
 *
 * Formats 0x00, 0x01 and 0x04 are answered, and 0xff lists the formats
 * that have a non-zero size in the table below.  Returns the response
 * length or -1; in some failure cases sense data has already been set on
 * the request.
 */
static int scsi_read_dvd_structure(SCSIDiskState *s, SCSIDiskReq *r,
                                   uint8_t *outbuf)
{
    /* Response size (payload + 4-byte header) per format code. */
    static const int rds_caps_size[5] = {
        [0] = 2048 + 4,
        [1] = 4 + 4,
        [3] = 188 + 4,
        [4] = 2048 + 4,
    };

    const uint8_t media = r->req.cmd.buf[1];
    const uint8_t layer = r->req.cmd.buf[6];
    const uint8_t format = r->req.cmd.buf[7];
    int len = -1;

    if (s->qdev.type != TYPE_ROM) {
        return -1;
    }
    if (media != 0) {
        scsi_check_condition(r, SENSE_CODE(INVALID_FIELD));
        return -1;
    }

    /* Everything but the capability list needs a DVD in the drive. */
    if (format != 0xff) {
        if (s->tray_open || !blk_is_inserted(s->qdev.conf.blk)) {
            scsi_check_condition(r, SENSE_CODE(NO_MEDIUM));
            return -1;
        }
        if (media_is_cd(s)) {
            scsi_check_condition(r, SENSE_CODE(INCOMPATIBLE_FORMAT));
            return -1;
        }
        if (format >= ARRAY_SIZE(rds_caps_size)) {
            return -1;
        }
        len = rds_caps_size[format];
        memset(outbuf, 0, len);
    }

    switch (format) {
    case 0x00: {
        /* Physical format information */
        uint64_t nb_sectors;

        if (layer != 0) {
            return -1;
        }
        blk_get_geometry(s->qdev.conf.blk, &nb_sectors);

        outbuf[4] = 1;   /* DVD-ROM, part version 1 */
        outbuf[5] = 0xf; /* 120mm disc, minimum rate unspecified */
        outbuf[6] = 1;   /* one layer, read-only (per MMC-2 spec) */
        outbuf[7] = 0;   /* default densities */

        stl_be_p(&outbuf[12], (nb_sectors >> 2) - 1); /* end sector */
        stl_be_p(&outbuf[16], (nb_sectors >> 2) - 1); /* l0 end sector */
        break;
    }

    case 0x01: /* DVD copyright information, all zeros */
    case 0x04: /* DVD disc manufacturing information, all zeros */
        break;

    case 0xff: { /* List capabilities */
        int fmt;

        len = 4;
        for (fmt = 0; fmt < ARRAY_SIZE(rds_caps_size); fmt++) {
            if (rds_caps_size[fmt]) {
                outbuf[len] = fmt;
                outbuf[len + 1] = 0x40; /* Not writable, readable */
                stw_be_p(&outbuf[len + 2], rds_caps_size[fmt]);
                len += 4;
            }
        }
        break;
    }

    case 0x03: /* BCA information - invalid field for no BCA info */
    default:
        return -1;
    }

    /* Size of buffer, not including 2 byte size field */
    stw_be_p(outbuf, len - 2);
    return len;
}

936
/*
 * Fill in the 4-byte media event descriptor at @outbuf.
 *
 * Byte 0 receives the event code, byte 1 the media status and bytes 2-3
 * are cleared.  A pending media_event or eject_request flag in @s is
 * consumed (reset to false) when it is reported.
 *
 * Returns the number of bytes written, which is always 4.
 */
static int scsi_event_status_media(SCSIDiskState *s, uint8_t *outbuf)
{
    uint8_t status = 0;
    uint8_t event = MEC_NO_CHANGE;

    /* The backend is only asked about the medium while the tray is closed. */
    if (s->tray_open) {
        status = MS_TRAY_OPEN;
    } else if (blk_is_inserted(s->qdev.conf.blk)) {
        status = MS_MEDIA_PRESENT;
    }

    /*
     * Event notification descriptor.  Pending events stay queued while
     * the tray is open; a new-media event takes priority over an eject
     * request.
     */
    if (status != MS_TRAY_OPEN) {
        if (s->media_event) {
            s->media_event = false;
            event = MEC_NEW_MEDIA;
        } else if (s->eject_request) {
            s->eject_request = false;
            event = MEC_EJECT_REQUESTED;
        }
    }

    outbuf[0] = event;
    outbuf[1] = status;
    /* These fields are reserved, just clear them. */
    outbuf[2] = 0;
    outbuf[3] = 0;

    return 4;
}

/*
 * Build the GET EVENT STATUS NOTIFICATION reply in @outbuf.
 *
 * Returns the reply length in bytes, or -1 when the device is not of
 * TYPE_ROM or when bit 0 of CDB byte 1 is clear (asynchronous mode).
 */
static int scsi_get_event_status_notification(SCSIDiskState *s, SCSIDiskReq *r,
                                              uint8_t *outbuf)
{
    const uint8_t *cdb = r->req.cmd.buf;
    const uint8_t requested_classes = cdb[4];
    const uint8_t media_class = 1 << GESN_MEDIA;
    int len = 4; /* size of the reply header */

    if (s->qdev.type != TYPE_ROM || (cdb[1] & 1) == 0) {
        return -1;
    }

    outbuf[0] = 0;
    outbuf[1] = 0;
    outbuf[3] = media_class; /* supported events */

    if (requested_classes & media_class) {
        outbuf[2] = GESN_MEDIA;
        len += scsi_event_status_media(s, &outbuf[len]);
    } else {
        outbuf[2] = 0x80;
    }

    /* Bytes 0-1: big-endian length of the data following the header. */
    stw_be_p(outbuf, len - 4);
    return len;
}

995
/*
 * Build the fixed 40-byte GET CONFIGURATION reply in @outbuf.
 *
 * The reply holds an 8-byte header followed by three feature descriptors
 * (profile list, core, removable media).  Returns 40, or -1 when the
 * device is not of TYPE_ROM.
 */
static int scsi_get_configuration(SCSIDiskState *s, uint8_t *outbuf)
{
    enum { REPLY_LEN = 40 };
    int profile;

    if (s->qdev.type != TYPE_ROM) {
        return -1;
    }

    profile = media_is_dvd(s) ? MMC_PROFILE_DVD_ROM
            : media_is_cd(s)  ? MMC_PROFILE_CD_ROM
                              : MMC_PROFILE_NONE;

    memset(outbuf, 0, REPLY_LEN);

    /* Header: bytes after the data length field, then current profile. */
    stl_be_p(&outbuf[0], REPLY_LEN - 4);
    stw_be_p(&outbuf[6], profile);

    /* outbuf[8] - outbuf[19]: Feature 0 - Profile list */
    outbuf[10] = 0x03; /* persistent, current */
    outbuf[11] = 8; /* two profiles */
    stw_be_p(&outbuf[12], MMC_PROFILE_DVD_ROM);
    outbuf[14] = (profile == MMC_PROFILE_DVD_ROM);
    stw_be_p(&outbuf[16], MMC_PROFILE_CD_ROM);
    outbuf[18] = (profile == MMC_PROFILE_CD_ROM);

    /* outbuf[20] - outbuf[31]: Feature 1 - Core feature */
    stw_be_p(&outbuf[20], 1);
    outbuf[22] = 0x08 | 0x03; /* version 2, persistent, current */
    outbuf[23] = 8;
    stl_be_p(&outbuf[24], 1); /* SCSI */
    outbuf[28] = 1; /* DBE = 1, mandatory */

    /* outbuf[32] - outbuf[39]: Feature 3 - Removable media feature */
    stw_be_p(&outbuf[32], 3);
    outbuf[34] = 0x08 | 0x03; /* version 2, persistent, current */
    outbuf[35] = 4;
    outbuf[36] = 0x39; /* tray, load=1, eject=1, unlocked at powerup, lock=1 */

    /* TODO: Random readable, CD read, DVD read, drive serial number,
       power management */
    return REPLY_LEN;
}

/*
 * Build the 8-byte MECHANISM STATUS reply in @outbuf: all zero except
 * byte 5, which is set to 1.
 *
 * Returns 8, or -1 when the device is not of TYPE_ROM.
 */
static int scsi_emulate_mechanism_status(SCSIDiskState *s, uint8_t *outbuf)
{
    enum { REPLY_LEN = 8 };

    if (s->qdev.type == TYPE_ROM) {
        memset(outbuf, 0, REPLY_LEN);
        outbuf[5] = 1; /* CD-ROM */
        return REPLY_LEN;
    }
    return -1;
}

1047
/*
 * Emit a single mode page at *p_outbuf and advance *p_outbuf past it.
 *
 * @s:            disk state; the device type selects which pages exist
 * @page:         mode page code
 * @p_outbuf:     in/out cursor into the output buffer; it is left
 *                untouched when the page is rejected
 * @page_control: 1 requests the "changeable values" mask, other values
 *                produce the page contents
 *
 * Returns the number of bytes emitted (2-byte page header + page body),
 * or -1 if @page is out of range, not valid for this device type, or not
 * implemented.
 *
 * The caller must provide a zero-filled buffer: only non-zero fields are
 * stored here.
 */
static int mode_sense_page(SCSIDiskState *s, int page, uint8_t **p_outbuf,
                           int page_control)
{
    static const int mode_sense_valid[0x3f] = {
        [MODE_PAGE_HD_GEOMETRY]            = (1 << TYPE_DISK),
        [MODE_PAGE_FLEXIBLE_DISK_GEOMETRY] = (1 << TYPE_DISK),
        [MODE_PAGE_CACHING]                = (1 << TYPE_DISK) | (1 << TYPE_ROM),
        [MODE_PAGE_R_W_ERROR]              = (1 << TYPE_DISK) | (1 << TYPE_ROM),
        [MODE_PAGE_AUDIO_CTL]              = (1 << TYPE_ROM),
        [MODE_PAGE_CAPABILITIES]           = (1 << TYPE_ROM),
    };

    uint8_t *p = *p_outbuf + 2;
    int length;

    /*
     * The table has no slot for page 0x3f ("all pages"), yet the MODE
     * SELECT path derives the page code from guest data masked with 0x3f.
     * Refuse anything outside the table instead of reading past its end.
     */
    if (page < 0 || page >= (int)ARRAY_SIZE(mode_sense_valid)) {
        return -1;
    }

    if ((mode_sense_valid[page] & (1 << s->qdev.type)) == 0) {
        return -1;
    }

    /*
     * If Changeable Values are requested, a mask denoting those mode parameters
     * that are changeable shall be returned. As we currently don't support
     * parameter changes via MODE_SELECT all bits are returned set to zero.
     * The buffer was already memset to zero by the caller of this function.
     *
     * The offsets here are off by two compared to the descriptions in the
     * SCSI specs, because those include a 2-byte header.  This is unfortunate,
     * but it is done so that offsets are consistent within our implementation
     * of MODE SENSE and MODE SELECT.  MODE SELECT has to deal with both
     * 2-byte and 4-byte headers.
     */
    switch (page) {
    case MODE_PAGE_HD_GEOMETRY:
        length = 0x16;
        if (page_control == 1) { /* Changeable Values */
            break;
        }
        /* if a geometry hint is available, use it */
        p[0] = (s->qdev.conf.cyls >> 16) & 0xff;
        p[1] = (s->qdev.conf.cyls >> 8) & 0xff;
        p[2] = s->qdev.conf.cyls & 0xff;
        p[3] = s->qdev.conf.heads & 0xff;
        /* Write precomp start cylinder, disabled */
        p[4] = (s->qdev.conf.cyls >> 16) & 0xff;
        p[5] = (s->qdev.conf.cyls >> 8) & 0xff;
        p[6] = s->qdev.conf.cyls & 0xff;
        /* Reduced current start cylinder, disabled */
        p[7] = (s->qdev.conf.cyls >> 16) & 0xff;
        p[8] = (s->qdev.conf.cyls >> 8) & 0xff;
        p[9] = s->qdev.conf.cyls & 0xff;
        /* Device step rate [ns], 200ns */
        p[10] = 0;
        p[11] = 200;
        /* Landing zone cylinder */
        p[12] = 0xff;
        p[13] = 0xff;
        p[14] = 0xff;
        /* Medium rotation rate [rpm], 5400 rpm */
        p[18] = (5400 >> 8) & 0xff;
        p[19] = 5400 & 0xff;
        break;

    case MODE_PAGE_FLEXIBLE_DISK_GEOMETRY:
        length = 0x1e;
        if (page_control == 1) { /* Changeable Values */
            break;
        }
        /* Transfer rate [kbit/s], 5Mbit/s */
        p[0] = 5000 >> 8;
        p[1] = 5000 & 0xff;
        /* if a geometry hint is available, use it */
        p[2] = s->qdev.conf.heads & 0xff;
        p[3] = s->qdev.conf.secs & 0xff;
        p[4] = s->qdev.blocksize >> 8;
        p[6] = (s->qdev.conf.cyls >> 8) & 0xff;
        p[7] = s->qdev.conf.cyls & 0xff;
        /* Write precomp start cylinder, disabled */
        p[8] = (s->qdev.conf.cyls >> 8) & 0xff;
        p[9] = s->qdev.conf.cyls & 0xff;
        /* Reduced current start cylinder, disabled */
        p[10] = (s->qdev.conf.cyls >> 8) & 0xff;
        p[11] = s->qdev.conf.cyls & 0xff;
        /* Device step rate [100us], 100us */
        p[12] = 0;
        p[13] = 1;
        /* Device step pulse width [us], 1us */
        p[14] = 1;
        /* Device head settle delay [100us], 100us */
        p[15] = 0;
        p[16] = 1;
        /* Motor on delay [0.1s], 0.1s */
        p[17] = 1;
        /* Motor off delay [0.1s], 0.1s */
        p[18] = 1;
        /* Medium rotation rate [rpm], 5400 rpm */
        p[26] = (5400 >> 8) & 0xff;
        p[27] = 5400 & 0xff;
        break;

    case MODE_PAGE_CACHING:
        length = 0x12;
        /*
         * WCE is the one bit reported as changeable; for current values
         * it mirrors the backend's write-cache setting.
         */
        if (page_control == 1 || /* Changeable Values */
            blk_enable_write_cache(s->qdev.conf.blk)) {
            p[0] = 4; /* WCE */
        }
        break;

    case MODE_PAGE_R_W_ERROR:
        length = 10;
        if (page_control == 1) { /* Changeable Values */
            break;
        }
        p[0] = 0x80; /* Automatic Write Reallocation Enabled */
        if (s->qdev.type == TYPE_ROM) {
            p[1] = 0x20; /* Read Retry Count */
        }
        break;

    case MODE_PAGE_AUDIO_CTL:
        /* Page body is left all zero. */
        length = 14;
        break;

    case MODE_PAGE_CAPABILITIES:
        length = 0x14;
        if (page_control == 1) { /* Changeable Values */
            break;
        }

        p[0] = 0x3b; /* CD-R & CD-RW read */
        p[1] = 0; /* Writing not supported */
        p[2] = 0x7f; /* Audio, composite, digital out,
                        mode 2 form 1&2, multi session */
        p[3] = 0xff; /* CD DA, DA accurate, RW supported,
                        RW corrected, C2 errors, ISRC,
                        UPC, Bar code */
        p[4] = 0x2d | (s->tray_locked ? 2 : 0);
        /* Locking supported, jumper present, eject, tray */
        p[5] = 0; /* no volume & mute control, no
                     changer */
        p[6] = (50 * 176) >> 8; /* 50x read speed */
        p[7] = (50 * 176) & 0xff;
        p[8] = 2 >> 8; /* Two volume levels */
        p[9] = 2 & 0xff;
        p[10] = 2048 >> 8; /* 2M buffer */
        p[11] = 2048 & 0xff;
        p[12] = (16 * 176) >> 8; /* 16x read speed current */
        p[13] = (16 * 176) & 0xff;
        p[16] = (16 * 176) >> 8; /* 16x write speed */
        p[17] = (16 * 176) & 0xff;
        p[18] = (16 * 176) >> 8; /* 16x write speed current */
        p[19] = (16 * 176) & 0xff;
        break;

    default:
        return -1;
    }

    /* The page length is stored in a single header byte. */
    assert(length < 256);
    (*p_outbuf)[0] = page;
    (*p_outbuf)[1] = length;
    *p_outbuf += length + 2;
    return length + 2;
}

1211
/*
 * Build the reply to MODE SENSE(6) / MODE SENSE(10) in @outbuf.
 *
 * The reply consists of the mode parameter header (4 bytes for the
 * 6-byte command, 8 bytes otherwise), an optional 8-byte block
 * descriptor and the requested mode page(s).
 *
 * Returns the reply length, or -1 on failure.  A request for saved values
 * (page control 3) raises SAVING_PARAMS_NOT_SUPPORTED here; a rejected
 * single page returns -1 without setting sense data in this function.
 */
static int scsi_disk_emulate_mode_sense(SCSIDiskReq *r, uint8_t *outbuf)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);
    const uint8_t *cdb = r->req.cmd.buf;
    const bool sense6 = (cdb[0] == MODE_SENSE);
    const int page_control = (cdb[2] & 0xc0) >> 6;
    int page = cdb[2] & 0x3f;
    bool dbd = (cdb[1] & 0x8) != 0;
    uint8_t dev_specific_param = 0x00;
    uint64_t nb_sectors;
    uint8_t *p = outbuf;
    int buflen;

    DPRINTF("Mode Sense(%d) (page %d, xfer %zd, page_control %d)\n",
        sense6 ? 6 : 10, page, r->req.cmd.xfer, page_control);
    memset(outbuf, 0, r->req.cmd.xfer);

    if (s->qdev.type != TYPE_DISK) {
        /* MMC prescribes that CD/DVD drives have no block descriptors,
         * and defines no device-specific parameter.  */
        dbd = true;
    } else {
        if (s->features & (1 << SCSI_DISK_F_DPOFUA)) {
            dev_specific_param = 0x10;
        }
        if (blk_is_read_only(s->qdev.conf.blk)) {
            dev_specific_param |= 0x80; /* Readonly.  */
        }
    }

    /* Mode parameter header; the length field is filled in at the end. */
    if (sense6) {
        p[1] = 0; /* Default media type.  */
        p[2] = dev_specific_param;
        p[3] = 0; /* Block descriptor length.  */
        p += 4;
    } else { /* MODE_SENSE_10 */
        p[2] = 0; /* Default media type.  */
        p[3] = dev_specific_param;
        p[6] = 0; /* Block descriptor length.  */
        p[7] = 0;
        p += 8;
    }

    blk_get_geometry(s->qdev.conf.blk, &nb_sectors);
    if (!dbd && nb_sectors) {
        /* Block descriptor length  */
        outbuf[sense6 ? 3 : 7] = 8;

        /* Convert 512-byte sectors to device blocks. */
        nb_sectors /= (s->qdev.blocksize / 512);
        if (nb_sectors > 0xffffff) {
            /* Does not fit the 3-byte field: report 0 instead. */
            nb_sectors = 0;
        }
        p[0] = 0; /* media density code */
        p[1] = (nb_sectors >> 16) & 0xff;
        p[2] = (nb_sectors >> 8) & 0xff;
        p[3] = nb_sectors & 0xff;
        p[4] = 0; /* reserved */
        p[5] = 0; /* bytes 5-7 are the sector size in bytes */
        p[6] = s->qdev.blocksize >> 8;
        p[7] = 0;
        p += 8;
    }

    if (page_control == 3) {
        /* Saved Values */
        scsi_check_condition(r, SENSE_CODE(SAVING_PARAMS_NOT_SUPPORTED));
        return -1;
    }

    if (page != 0x3f) {
        if (mode_sense_page(s, page, &p, page_control) == -1) {
            return -1;
        }
    } else {
        /* All pages: pages rejected by mode_sense_page are skipped. */
        for (page = 0; page <= 0x3e; page++) {
            mode_sense_page(s, page, &p, page_control);
        }
    }

    buflen = p - outbuf;
    /*
     * The mode data length field specifies the length in bytes of the
     * following data that is available to be transferred. The mode data
     * length does not include itself.
     */
    if (sense6) {
        outbuf[0] = buflen - 1;
    } else { /* MODE_SENSE_10 */
        outbuf[0] = ((buflen - 2) >> 8) & 0xff;
        outbuf[1] = (buflen - 2) & 0xff;
    }
    return buflen;
}

1306 1307 1308 1309 1310 1311 1312 1313 1314
/*
 * Build the READ TOC reply in @outbuf.
 *
 * Format 0 and format 2 are delegated to cdrom_read_toc() and
 * cdrom_read_toc_raw(); format 1 returns a fixed 12-byte single-session
 * reply.  Returns the reply length as produced by those paths, or -1 for
 * any other format.
 */
static int scsi_disk_emulate_read_toc(SCSIRequest *req, uint8_t *outbuf)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, req->dev);
    const uint8_t *cdb = req->cmd.buf;
    const int msf = cdb[1] & 2;
    const int format = cdb[2] & 0xf;
    const int start_track = cdb[6];
    uint64_t nb_sectors;

    blk_get_geometry(s->qdev.conf.blk, &nb_sectors);
    DPRINTF("Read TOC (track %d format %d msf %d)\n", start_track, format, msf >> 1);
    /* Convert 512-byte sectors to device blocks. */
    nb_sectors /= s->qdev.blocksize / 512;

    switch (format) {
    case 0:
        return cdrom_read_toc(nb_sectors, outbuf, msf, start_track);

    case 1:
        /* multi session : only a single session defined */
        memset(outbuf, 0, 12);
        outbuf[1] = 0x0a;
        outbuf[2] = 0x01;
        outbuf[3] = 0x01;
        return 12;

    case 2:
        return cdrom_read_toc_raw(nb_sectors, outbuf, msf, start_track);

    default:
        return -1;
    }
}

1339
/*
 * Emulate START STOP UNIT.
 *
 * Only the load/eject function is acted upon, and only for removable
 * devices when the power condition field is zero.  Returns 0 on success,
 * or -1 after raising a check condition because the tray is locked.
 */
static int scsi_disk_emulate_start_stop(SCSIDiskReq *r)
{
    SCSIRequest *req = &r->req;
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, req->dev);
    const uint8_t ctl = req->cmd.buf[4];
    const bool want_open = !(ctl & 1);      /* START bit clear */
    const bool loej = (ctl & 2) != 0;       /* load on start, eject on !start */

    if (ctl & 0xf0) {
        /* eject/load only happens for power condition == 0 */
        return 0;
    }

    if (!loej || !(s->features & (1 << SCSI_DISK_F_REMOVABLE))) {
        return 0;
    }

    /* Opening a closed, locked tray is refused. */
    if (want_open && !s->tray_open && s->tray_locked) {
        if (blk_is_inserted(s->qdev.conf.blk)) {
            scsi_check_condition(r, SENSE_CODE(ILLEGAL_REQ_REMOVAL_PREVENTED));
        } else {
            scsi_check_condition(r, SENSE_CODE(NOT_READY_REMOVAL_PREVENTED));
        }
        return -1;
    }

    /* Only touch the backend when the tray state actually changes. */
    if (s->tray_open != want_open) {
        blk_eject(s->qdev.conf.blk, want_open);
        s->tray_open = want_open;
    }
    return 0;
}

1369 1370 1371 1372 1373 1374
/*
 * Data-in handler for emulated commands.
 *
 * While r->iov.iov_len is non-zero, that many bytes are handed over with
 * scsi_req_data() and the length is reset; once it is zero the request
 * is completed with GOOD status.
 */
static void scsi_disk_emulate_read_data(SCSIRequest *req)
{
    SCSIDiskReq *r = DO_UPCAST(SCSIDiskReq, req, req);
    int pending = r->iov.iov_len;

    if (!pending) {
        /* This also clears the sense buffer for REQUEST SENSE.  */
        scsi_req_complete(&r->req, GOOD);
        return;
    }

    DPRINTF("Read buf_len=%d\n", pending);
    r->iov.iov_len = 0;
    r->started = true;
    scsi_req_data(&r->req, pending);
}

1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425 1426
/*
 * Validate one mode page received through MODE SELECT.
 *
 * @s:     disk state
 * @page:  page code taken from the parameter data
 * @inbuf: page body, i.e. the data following the page header
 * @inlen: length of the page body in bytes
 *
 * The page is accepted only if its length matches what MODE SENSE would
 * return and every bit that is not reported as changeable equals the
 * current value.  Returns 0 if the page is acceptable, -1 otherwise.
 */
static int scsi_disk_check_mode_select(SCSIDiskState *s, int page,
                                       uint8_t *inbuf, int inlen)
{
    uint8_t mode_current[SCSI_MAX_MODE_LEN];
    uint8_t mode_changeable[SCSI_MAX_MODE_LEN];
    uint8_t *p;
    int len, expected_len, changeable_len, i;

    /*
     * Page code 0x3f means "all pages" in MODE SENSE; it is not a page
     * that can be selected, and mode_sense_page() has no table entry for
     * it.  The code comes from guest data, so reject it here.
     */
    if (page == 0x3f) {
        return -1;
    }

    /* The input buffer does not include the page header, so it is
     * off by 2 bytes.
     */
    expected_len = inlen + 2;
    if (expected_len > SCSI_MAX_MODE_LEN) {
        return -1;
    }

    p = mode_current;
    memset(mode_current, 0, inlen + 2);
    len = mode_sense_page(s, page, &p, 0);
    if (len < 0 || len != expected_len) {
        return -1;
    }

    p = mode_changeable;
    memset(mode_changeable, 0, inlen + 2);
    changeable_len = mode_sense_page(s, page, &p, 1);
    assert(changeable_len == len);

    /* Check that unchangeable bits are the same as what MODE SENSE
     * would return.
     */
    for (i = 2; i < len; i++) {
        if (((mode_current[i] ^ inbuf[i - 2]) & ~mode_changeable[i]) != 0) {
            return -1;
        }
    }
    return 0;
}

/*
 * Apply one mode page received through MODE SELECT.  @p points at the
 * page body (after the page header).
 *
 * Only the caching page has an effect: bit 2 of its first byte (WCE)
 * switches the backend write cache on or off.  Other pages are ignored.
 */
static void scsi_disk_apply_mode_select(SCSIDiskState *s, int page, uint8_t *p)
{
    if (page == MODE_PAGE_CACHING) {
        bool wce = (p[0] & 4) != 0;

        blk_set_enable_write_cache(s->qdev.conf.blk, wce);
    }
}

/*
 * Walk the mode pages in the @len bytes at @p.
 *
 * With @change false every page is only validated; with @change true
 * every page is applied.  Returns 0 on success.  On a malformed or
 * unacceptable page a check condition is raised on @r and -1 is
 * returned.
 */
static int mode_select_pages(SCSIDiskReq *r, uint8_t *p, int len, bool change)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);

    while (len > 0) {
        /* Parse both possible formats for the mode page headers.  */
        const bool long_header = (p[0] & 0x40) != 0;
        const int hdr_len = long_header ? 4 : 2;
        const int page = p[0] & 0x3f;
        int subpage, page_len;

        if (len < hdr_len) {
            goto invalid_param_len;
        }
        if (long_header) {
            subpage = p[1];
            page_len = lduw_be_p(&p[2]);
        } else {
            subpage = 0;
            page_len = p[1];
        }
        p += hdr_len;
        len -= hdr_len;

        /* Subpages are not supported. */
        if (subpage) {
            goto invalid_param;
        }
        if (page_len > len) {
            goto invalid_param_len;
        }

        if (change) {
            scsi_disk_apply_mode_select(s, page, p);
        } else if (scsi_disk_check_mode_select(s, page, p, page_len) < 0) {
            goto invalid_param;
        }

        p += page_len;
        len -= page_len;
    }
    return 0;

invalid_param:
    scsi_check_condition(r, SENSE_CODE(INVALID_PARAM));
    return -1;

invalid_param_len:
    scsi_check_condition(r, SENSE_CODE(INVALID_PARAM_LEN));
    return -1;
}

/*
 * Emulate MODE SELECT(6) / MODE SELECT(10) on the parameter data in
 * @inbuf.
 *
 * The header and optional block descriptor are skipped, then the mode
 * pages are processed in two passes (validate, then apply).  The request
 * is completed here, except when a flush is started because the write
 * cache is off afterwards; scsi_aio_complete is then passed as the
 * flush callback.
 */
static void scsi_disk_emulate_mode_select(SCSIDiskReq *r, uint8_t *inbuf)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);
    const int cmd = r->req.cmd.buf[0];
    const int hdr_len = (cmd == MODE_SELECT ? 4 : 8);
    uint8_t *pages = inbuf;
    int remaining = r->req.cmd.xfer;
    int bd_len;
    int pass;

    /* We only support PF=1, SP=0.  */
    if ((r->req.cmd.buf[1] & 0x11) != 0x10) {
        scsi_check_condition(r, SENSE_CODE(INVALID_FIELD));
        return;
    }

    if (remaining < hdr_len) {
        scsi_check_condition(r, SENSE_CODE(INVALID_PARAM_LEN));
        return;
    }

    /* Block descriptor length: byte 3 (6-byte cmd) or bytes 6-7. */
    bd_len = (cmd == MODE_SELECT ? inbuf[3] : lduw_be_p(&inbuf[6]));
    remaining -= hdr_len;
    pages += hdr_len;

    if (remaining < bd_len) {
        scsi_check_condition(r, SENSE_CODE(INVALID_PARAM_LEN));
        return;
    }
    if (bd_len != 0 && bd_len != 8) {
        scsi_check_condition(r, SENSE_CODE(INVALID_PARAM));
        return;
    }

    /* The block descriptor contents are skipped, not interpreted. */
    remaining -= bd_len;
    pages += bd_len;

    /* Ensure no change is made if there is an error!  */
    for (pass = 0; pass < 2; pass++) {
        if (mode_select_pages(r, pages, remaining, pass == 1) < 0) {
            assert(pass == 0);
            return;
        }
    }

    if (blk_enable_write_cache(s->qdev.conf.blk)) {
        scsi_req_complete(&r->req, GOOD);
        return;
    }

    /* The request is used as the AIO opaque value, so add a ref.  */
    scsi_req_ref(&r->req);
    block_acct_start(blk_get_stats(s->qdev.conf.blk), &r->acct, 0,
                     BLOCK_ACCT_FLUSH);
    r->req.aiocb = blk_aio_flush(s->qdev.conf.blk, scsi_aio_complete, r);
}

1556 1557 1558 1559 1560 1561 1562
/*
 * Return true if the @nb_sectors blocks starting at @sector_num lie
 * within the device, i.e. do not extend past s->qdev.max_lba.
 */
static inline bool check_lba_range(SCSIDiskState *s,
                                   uint64_t sector_num, uint32_t nb_sectors)
{
    /*
     * Careful, the computations should not underflow for nb_sectors == 0,
     * and a 0-block read to the first LBA beyond the end of device is
     * valid.
     */
    const uint64_t end = sector_num + nb_sectors;

    /* A wrapped sum means the last sector is not representable. */
    if (end < sector_num) {
        return false;
    }
    /* The first sector past the access must not exceed max_lba + 1. */
    return end <= s->qdev.max_lba + 1;
}

1572 1573 1574 1575 1576 1577
/* Progress of one UNMAP command across its chain of discard requests. */
typedef struct UnmapCBData {
    SCSIDiskReq *r;     /* request being served */
    uint8_t *inbuf;     /* next 16-byte block descriptor to process */
    int count;          /* block descriptors still to be processed */
} UnmapCBData;

1578 1579 1580
/* Defined below; passed to blk_aio_discard() as the completion callback. */
static void scsi_unmap_complete(void *opaque, int ret);

/*
 * Advance an UNMAP command by one step; must be called with no AIO in
 * flight on the request.
 *
 * @ret is the result of the previous step (0 for the initial call).  If
 * block descriptors remain, the next one is range-checked and submitted
 * as a discard with scsi_unmap_complete as callback.  Otherwise, or on
 * cancellation/error, the request reference is dropped and @data is
 * freed.
 */
static void scsi_unmap_complete_noio(UnmapCBData *data, int ret)
{
    SCSIDiskReq *r = data->r;
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);
    uint64_t lba;
    uint32_t nblocks;

    assert(r->req.aiocb == NULL);

    if (r->req.io_canceled) {
        scsi_req_cancel_complete(&r->req);
        goto done;
    }

    if (ret < 0 && scsi_handle_rw_error(r, -ret)) {
        goto done;
    }

    if (data->count <= 0) {
        /* Every descriptor has been processed. */
        scsi_req_complete(&r->req, GOOD);
        goto done;
    }

    /* Descriptor layout: 8-byte LBA followed by a 4-byte block count. */
    lba = ldq_be_p(&data->inbuf[0]);
    nblocks = ldl_be_p(&data->inbuf[8]) & 0xffffffffULL;
    if (!check_lba_range(s, lba, nblocks)) {
        scsi_check_condition(r, SENSE_CODE(LBA_OUT_OF_RANGE));
        goto done;
    }

    /* The block layer is addressed in 512-byte sectors. */
    r->req.aiocb = blk_aio_discard(s->qdev.conf.blk,
                                   lba * (s->qdev.blocksize / 512),
                                   nblocks * (s->qdev.blocksize / 512),
                                   scsi_unmap_complete, data);
    data->count--;
    data->inbuf += 16;
    return;

done:
    scsi_req_unref(&r->req);
    g_free(data);
}

1624 1625 1626 1627 1628 1629 1630 1631 1632 1633 1634
/*
 * AIO completion callback for one UNMAP discard: clears the request's
 * aiocb and hands over to scsi_unmap_complete_noio() for the next step.
 */
static void scsi_unmap_complete(void *opaque, int ret)
{
    UnmapCBData *cb = opaque;
    SCSIDiskReq *r = cb->r;

    /* This callback only runs for a request with AIO outstanding. */
    assert(r->req.aiocb != NULL);
    r->req.aiocb = NULL;

    scsi_unmap_complete_noio(cb, ret);
}

1635 1636
/*
 * Emulate UNMAP on the parameter list in @inbuf.
 *
 * After validating the CDB and the parameter list header, the block
 * descriptors (16 bytes each, starting at offset 8) are processed one at
 * a time through scsi_unmap_complete_noio().
 */
static void scsi_disk_emulate_unmap(SCSIDiskReq *r, uint8_t *inbuf)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);
    int xfer = r->req.cmd.xfer;
    UnmapCBData *cb;

    /* Reject ANCHOR=1.  */
    if (r->req.cmd.buf[1] & 0x1) {
        scsi_check_condition(r, SENSE_CODE(INVALID_FIELD));
        return;
    }

    /*
     * The transfer must hold the 8-byte header, the data length claimed
     * in bytes 0-1 and the descriptor data length claimed in bytes 2-3;
     * the latter must be a multiple of 16.
     */
    if (xfer < 8 ||
        xfer < lduw_be_p(&inbuf[0]) + 2 ||
        xfer < lduw_be_p(&inbuf[2]) + 8 ||
        (lduw_be_p(&inbuf[2]) & 15)) {
        scsi_check_condition(r, SENSE_CODE(INVALID_PARAM_LEN));
        return;
    }

    if (blk_is_read_only(s->qdev.conf.blk)) {
        scsi_check_condition(r, SENSE_CODE(WRITE_PROTECTED));
        return;
    }

    cb = g_new0(UnmapCBData, 1);
    cb->r = r;
    cb->inbuf = &inbuf[8];
    cb->count = lduw_be_p(&inbuf[2]) >> 4;

    /*
     * The matching unref is in scsi_unmap_complete_noio, just before the
     * callback data is freed.
     */
    scsi_req_ref(&r->req);
    scsi_unmap_complete_noio(cb, 0);
}

1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698
typedef struct WriteSameCBData {
    SCSIDiskReq *r;
    int64_t sector;
    int nb_sectors;
    QEMUIOVector qiov;
    struct iovec iov;
} WriteSameCBData;

static void scsi_write_same_complete(void *opaque, int ret)
{
    WriteSameCBData *data = opaque;
    SCSIDiskReq *r = data->r;
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, r->req.dev);

    assert(r->req.aiocb != NULL);
    r->req.aiocb = NULL;
1699
    block_acct_done(blk_get_stats(s->qdev.conf.blk), &r->acct);
1700
    if (r->req.io_canceled) {
1701
        scsi_req_cancel_complete(&r->req);
1702 1703 1704 1705 1706 1707 1708 1709 1710 1711 1712 1713 1714
        goto done;
    }

    if (ret < 0) {
        if (scsi_handle_rw_error(r, -ret)) {
            goto done;
        }
    }

    data->nb_sectors -= data->iov.iov_len / 512;
    data->sector += data->iov.iov_len / 512;
    data->iov.iov_len = MIN(data->nb_sectors * 512, data->iov.iov_len);
    if (data->iov.iov_len) {
1715
        block_acct_start(blk_get_stats(s->qdev.conf.blk), &r->acct,
1716
                         data->iov.iov_len, BLOCK_ACCT_WRITE);
1717 1718 1719 1720
        /* blk_aio_write doesn't like the qiov size being different from
         * nb_sectors, make sure they match.
         */
        qemu_iovec_init_external(&data->qiov, &data->iov, 1);
1721 1722 1723
        r->req.aiocb = blk_aio_writev(s->qdev.conf.blk, data->sector,
                                      &data->qiov, data->iov.iov_len / 512,
                                      scsi_write_same_complete, data);
1724 1725 1726 1727 1728 1729
        return;
    }

    scsi_req_complete(&r->req, GOOD);

done:
1730
    scsi_req_unref(&r->req);
1731 1732 1733 1734 1735 1736 1737 1738
    qemu_vfree(data->iov.iov_base);
    g_free(data);
}

static void scsi_disk_emulate_write_same(SCSIDiskReq *r, uint8_t *inbuf)
{
    SCSIRequest *req = &r->req;
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, req->dev);
1739
    uint32_t nb_sectors = scsi_data_cdb_xfer(r->req.cmd.buf);
1740 1741 1742 1743 1744 1745 1746 1747 1748 1749
    WriteSameCBData *data;
    uint8_t *buf;
    int i;

    /* Fail if PBDATA=1 or LBDATA=1 or ANCHOR=1.  */
    if (nb_sectors == 0 || (req->cmd.buf[1] & 0x16)) {
        scsi_check_condition(r, SENSE_CODE(INVALID_FIELD));
        return;
    }

1750
    if (blk_is_read_only(s->qdev.conf.blk)) {
1751 1752 1753 1754 1755 1756 1757 1758 1759 1760 1761 1762 1763
        scsi_check_condition(r, SENSE_CODE(WRITE_PROTECTED));
        return;
    }
    if (!check_lba_range(s, r->req.cmd.lba, nb_sectors)) {
        scsi_check_condition(r, SENSE_CODE(LBA_OUT_OF_RANGE));
        return;
    }

    if (buffer_is_zero(inbuf, s->qdev.blocksize)) {
        int flags = (req->cmd.buf[1] & 0x8) ? BDRV_REQ_MAY_UNMAP : 0;

        /* The request is used as the AIO opaque value, so add a ref.  */
        scsi_req_ref(&r->req);
1764
        block_acct_start(blk_get_stats(s->qdev.conf.blk), &r->acct,
1765 1766
                         nb_sectors * s->qdev.blocksize,
                        BLOCK_ACCT_WRITE);
1767 1768 1769 1770
        r->req.aiocb = blk_aio_write_zeroes(s->qdev.conf.blk,
                                r->req.cmd.lba * (s->qdev.blocksize / 512),
                                nb_sectors * (s->qdev.blocksize / 512),
                                flags, scsi_aio_complete, r);
1771 1772 1773 1774 1775 1776 1777 1778
        return;
    }

    data = g_new0(WriteSameCBData, 1);
    data->r = r;
    data->sector = r->req.cmd.lba * (s->qdev.blocksize / 512);
    data->nb_sectors = nb_sectors * (s->qdev.blocksize / 512);
    data->iov.iov_len = MIN(data->nb_sectors * 512, SCSI_WRITE_SAME_MAX);
1779 1780
    data->iov.iov_base = buf = blk_blockalign(s->qdev.conf.blk,
                                              data->iov.iov_len);
1781 1782 1783 1784 1785 1786 1787
    qemu_iovec_init_external(&data->qiov, &data->iov, 1);

    for (i = 0; i < data->iov.iov_len; i += s->qdev.blocksize) {
        memcpy(&buf[i], inbuf, s->qdev.blocksize);
    }

    scsi_req_ref(&r->req);
1788
    block_acct_start(blk_get_stats(s->qdev.conf.blk), &r->acct,
1789
                     data->iov.iov_len, BLOCK_ACCT_WRITE);
1790 1791 1792
    r->req.aiocb = blk_aio_writev(s->qdev.conf.blk, data->sector,
                                  &data->qiov, data->iov.iov_len / 512,
                                  scsi_write_same_complete, data);
1793 1794
}

1795 1796
/*
 * Data-out handler for emulated commands.
 *
 * While r->iov.iov_len is non-zero, that many bytes are requested with
 * scsi_req_data() and the length is reset.  Once it is zero, the data in
 * r->iov.iov_base is dispatched to the handler for the command's opcode.
 * An opcode without a handler here aborts.
 */
static void scsi_disk_emulate_write_data(SCSIRequest *req)
{
    SCSIDiskReq *r = DO_UPCAST(SCSIDiskReq, req, req);
    uint8_t *inbuf;

    if (r->iov.iov_len) {
        int buflen = r->iov.iov_len;

        DPRINTF("Write buf_len=%d\n", buflen);
        r->iov.iov_len = 0;
        scsi_req_data(&r->req, buflen);
        return;
    }

    inbuf = r->iov.iov_base;

    switch (req->cmd.buf[0]) {
    case MODE_SELECT:
    case MODE_SELECT_10:
        /* This also clears the sense buffer for REQUEST SENSE.  */
        scsi_disk_emulate_mode_select(r, inbuf);
        break;

    case UNMAP:
        scsi_disk_emulate_unmap(r, inbuf);
        break;

    case WRITE_SAME_10:
    case WRITE_SAME_16:
        scsi_disk_emulate_write_same(r, inbuf);
        break;

    case VERIFY_10:
    case VERIFY_12:
    case VERIFY_16:
        /* The data itself is ignored; only a status of -1 is handled. */
        if (r->req.status == -1) {
            scsi_check_condition(r, SENSE_CODE(INVALID_FIELD));
        }
        break;

    default:
        abort();
    }
}

1836
/*
 * send_command callback of scsi_disk_emulate_reqops: validate the CDB,
 * build any response in the request's buffer (r->iov.iov_base) and report
 * how much data remains to be transferred.
 *
 * Returns a positive byte count when the request's mode is not
 * SCSI_XFER_TO_DEV, a negative byte count when it is, and 0 when nothing
 * is left to transfer from here: the request was completed, failed with a
 * check condition, or (SYNCHRONIZE CACHE) was handed to an asynchronous
 * flush.
 */
static int32_t scsi_disk_emulate_command(SCSIRequest *req, uint8_t *buf)
{
    SCSIDiskReq *r = DO_UPCAST(SCSIDiskReq, req, req);
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, req->dev);
    uint64_t nb_sectors;
    uint8_t *outbuf;
    int buflen;

    /*
     * The commands listed here are processed even with an open tray or no
     * medium; every other command fails with NO_MEDIUM in that situation.
     */
    switch (req->cmd.buf[0]) {
    case INQUIRY:
    case MODE_SENSE:
    case MODE_SENSE_10:
    case RESERVE:
    case RESERVE_10:
    case RELEASE:
    case RELEASE_10:
    case START_STOP:
    case ALLOW_MEDIUM_REMOVAL:
    case GET_CONFIGURATION:
    case GET_EVENT_STATUS_NOTIFICATION:
    case MECHANISM_STATUS:
    case REQUEST_SENSE:
        break;

    default:
        if (s->tray_open || !blk_is_inserted(s->qdev.conf.blk)) {
            scsi_check_condition(r, SENSE_CODE(NO_MEDIUM));
            return 0;
        }
        break;
    }

    /*
     * FIXME: we shouldn't return anything bigger than 4k, but the code
     * requires the buffer to be as big as req->cmd.xfer in several
     * places.  So, do not allow CDBs with a very large ALLOCATION
     * LENGTH.  The real fix would be to modify scsi_read_data and
     * dma_buf_read, so that they return data beyond the buflen
     * as all zeros.
     */
    if (req->cmd.xfer > 65536) {
        goto illegal_request;
    }
    r->buflen = MAX(4096, req->cmd.xfer);

    if (!r->iov.iov_base) {
        r->iov.iov_base = blk_blockalign(s->qdev.conf.blk, r->buflen);
    }

    buflen = req->cmd.xfer;
    outbuf = r->iov.iov_base;
    memset(outbuf, 0, r->buflen);
    switch (req->cmd.buf[0]) {
    case TEST_UNIT_READY:
        /* The medium check above already rejected the not-ready case. */
        assert(!s->tray_open && blk_is_inserted(s->qdev.conf.blk));
        break;
    case INQUIRY:
        buflen = scsi_disk_emulate_inquiry(req, outbuf);
        if (buflen < 0) {
            goto illegal_request;
        }
        break;
    case MODE_SENSE:
    case MODE_SENSE_10:
        buflen = scsi_disk_emulate_mode_sense(r, outbuf);
        if (buflen < 0) {
            goto illegal_request;
        }
        break;
    case READ_TOC:
        buflen = scsi_disk_emulate_read_toc(req, outbuf);
        if (buflen < 0) {
            goto illegal_request;
        }
        break;
    case RESERVE:
        if (req->cmd.buf[1] & 1) {
            goto illegal_request;
        }
        break;
    case RESERVE_10:
        if (req->cmd.buf[1] & 3) {
            goto illegal_request;
        }
        break;
    case RELEASE:
        if (req->cmd.buf[1] & 1) {
            goto illegal_request;
        }
        break;
    case RELEASE_10:
        if (req->cmd.buf[1] & 3) {
            goto illegal_request;
        }
        break;
    case START_STOP:
        if (scsi_disk_emulate_start_stop(r) < 0) {
            return 0;
        }
        break;
    case ALLOW_MEDIUM_REMOVAL:
        s->tray_locked = req->cmd.buf[4] & 1;
        blk_lock_medium(s->qdev.conf.blk, req->cmd.buf[4] & 1);
        break;
    case READ_CAPACITY_10:
        /* The normal LEN field for this command is zero.  */
        memset(outbuf, 0, 8);
        blk_get_geometry(s->qdev.conf.blk, &nb_sectors);
        if (!nb_sectors) {
            scsi_check_condition(r, SENSE_CODE(LUN_NOT_READY));
            return 0;
        }
        if ((req->cmd.buf[8] & 1) == 0 && req->cmd.lba) {
            goto illegal_request;
        }
        /* Convert from 512-byte sectors to device blocks. */
        nb_sectors /= s->qdev.blocksize / 512;
        /* Returned value is the address of the last sector.  */
        nb_sectors--;
        /* Remember the new size for read/write sanity checking. */
        s->qdev.max_lba = nb_sectors;
        /* Clip to 2TB, instead of returning capacity modulo 2TB. */
        if (nb_sectors > UINT32_MAX) {
            nb_sectors = UINT32_MAX;
        }
        outbuf[0] = (nb_sectors >> 24) & 0xff;
        outbuf[1] = (nb_sectors >> 16) & 0xff;
        outbuf[2] = (nb_sectors >> 8) & 0xff;
        outbuf[3] = nb_sectors & 0xff;
        outbuf[4] = 0;
        outbuf[5] = 0;
        outbuf[6] = s->qdev.blocksize >> 8;
        outbuf[7] = 0;
        break;
    case REQUEST_SENSE:
        /* Just return "NO SENSE".  */
        buflen = scsi_build_sense(NULL, 0, outbuf, r->buflen,
                                  (req->cmd.buf[1] & 1) == 0);
        if (buflen < 0) {
            goto illegal_request;
        }
        break;
    case MECHANISM_STATUS:
        buflen = scsi_emulate_mechanism_status(s, outbuf);
        if (buflen < 0) {
            goto illegal_request;
        }
        break;
    case GET_CONFIGURATION:
        buflen = scsi_get_configuration(s, outbuf);
        if (buflen < 0) {
            goto illegal_request;
        }
        break;
    case GET_EVENT_STATUS_NOTIFICATION:
        buflen = scsi_get_event_status_notification(s, r, outbuf);
        if (buflen < 0) {
            goto illegal_request;
        }
        break;
    case READ_DISC_INFORMATION:
        buflen = scsi_read_disc_information(s, r, outbuf);
        if (buflen < 0) {
            goto illegal_request;
        }
        break;
    case READ_DVD_STRUCTURE:
        buflen = scsi_read_dvd_structure(s, r, outbuf);
        if (buflen < 0) {
            goto illegal_request;
        }
        break;
    case SERVICE_ACTION_IN_16:
        /* Service Action In subcommands. */
        if ((req->cmd.buf[1] & 31) == SAI_READ_CAPACITY_16) {
            DPRINTF("SAI READ CAPACITY(16)\n");
            memset(outbuf, 0, req->cmd.xfer);
            blk_get_geometry(s->qdev.conf.blk, &nb_sectors);
            if (!nb_sectors) {
                scsi_check_condition(r, SENSE_CODE(LUN_NOT_READY));
                return 0;
            }
            if ((req->cmd.buf[14] & 1) == 0 && req->cmd.lba) {
                goto illegal_request;
            }
            /* Convert from 512-byte sectors to device blocks. */
            nb_sectors /= s->qdev.blocksize / 512;
            /* Returned value is the address of the last sector.  */
            nb_sectors--;
            /* Remember the new size for read/write sanity checking. */
            s->qdev.max_lba = nb_sectors;
            outbuf[0] = (nb_sectors >> 56) & 0xff;
            outbuf[1] = (nb_sectors >> 48) & 0xff;
            outbuf[2] = (nb_sectors >> 40) & 0xff;
            outbuf[3] = (nb_sectors >> 32) & 0xff;
            outbuf[4] = (nb_sectors >> 24) & 0xff;
            outbuf[5] = (nb_sectors >> 16) & 0xff;
            outbuf[6] = (nb_sectors >> 8) & 0xff;
            outbuf[7] = nb_sectors & 0xff;
            outbuf[8] = 0;
            outbuf[9] = 0;
            outbuf[10] = s->qdev.blocksize >> 8;
            outbuf[11] = 0;
            outbuf[12] = 0;
            outbuf[13] = get_physical_block_exp(&s->qdev.conf);

            /* set TPE bit if the format supports discard */
            if (s->qdev.conf.discard_granularity) {
                outbuf[14] = 0x80;
            }

            /* Protection, exponent and lowest lba field left blank. */
            break;
        }
        DPRINTF("Unsupported Service Action In\n");
        goto illegal_request;
    case SYNCHRONIZE_CACHE:
        /* The request is used as the AIO opaque value, so add a ref.  */
        scsi_req_ref(&r->req);
        block_acct_start(blk_get_stats(s->qdev.conf.blk), &r->acct, 0,
                         BLOCK_ACCT_FLUSH);
        r->req.aiocb = blk_aio_flush(s->qdev.conf.blk, scsi_aio_complete, r);
        return 0;
    case SEEK_10:
        DPRINTF("Seek(10) (sector %" PRId64 ")\n", r->req.cmd.lba);
        if (r->req.cmd.lba > s->qdev.max_lba) {
            goto illegal_lba;
        }
        break;
    case MODE_SELECT:
        DPRINTF("Mode Select(6) (len %lu)\n", (unsigned long)r->req.cmd.xfer);
        break;
    case MODE_SELECT_10:
        DPRINTF("Mode Select(10) (len %lu)\n", (unsigned long)r->req.cmd.xfer);
        break;
    case UNMAP:
        DPRINTF("Unmap (len %lu)\n", (unsigned long)r->req.cmd.xfer);
        break;
    case VERIFY_10:
    case VERIFY_12:
    case VERIFY_16:
        DPRINTF("Verify (bytchk %d)\n", (req->cmd.buf[1] >> 1) & 3);
        if (req->cmd.buf[1] & 6) {
            goto illegal_request;
        }
        break;
    case WRITE_SAME_10:
    case WRITE_SAME_16:
        DPRINTF("WRITE SAME %d (len %lu)\n",
                req->cmd.buf[0] == WRITE_SAME_10 ? 10 : 16,
                (unsigned long)r->req.cmd.xfer);
        break;
    default:
        DPRINTF("Unknown SCSI command (%2.2x=%s)\n", buf[0],
                scsi_command_name(buf[0]));
        scsi_check_condition(r, SENSE_CODE(INVALID_OPCODE));
        return 0;
    }
    assert(!r->req.aiocb);
    r->iov.iov_len = MIN(r->buflen, req->cmd.xfer);
    /* Nothing to transfer: the command is finished right away. */
    if (r->iov.iov_len == 0) {
        scsi_req_complete(&r->req, GOOD);
    }
    if (r->req.cmd.mode == SCSI_XFER_TO_DEV) {
        assert(r->iov.iov_len == req->cmd.xfer);
        return -r->iov.iov_len;
    } else {
        return r->iov.iov_len;
    }

illegal_request:
    /* Do not overwrite a status that a helper has already set. */
    if (r->req.status == -1) {
        scsi_check_condition(r, SENSE_CODE(INVALID_FIELD));
    }
    return 0;

illegal_lba:
    scsi_check_condition(r, SENSE_CODE(LBA_OUT_OF_RANGE));
    return 0;
}

P
pbrook 已提交
2115 2116 2117 2118 2119
/* Execute a scsi command.  Returns the length of the data expected by the
   command.  This will be Positive for data transfers from the device
   (eg. disk reads), negative for transfers to the device (eg. disk writes),
   and zero if the command does not transfer any data.  */

2120
static int32_t scsi_disk_dma_command(SCSIRequest *req, uint8_t *buf)
P
pbrook 已提交
2121
{
2122 2123
    SCSIDiskReq *r = DO_UPCAST(SCSIDiskReq, req, req);
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, req->dev);
2124
    uint32_t len;
P
pbrook 已提交
2125 2126 2127
    uint8_t command;

    command = buf[0];
2128

2129
    if (s->tray_open || !blk_is_inserted(s->qdev.conf.blk)) {
2130 2131
        scsi_check_condition(r, SENSE_CODE(NO_MEDIUM));
        return 0;
2132 2133
    }

2134
    len = scsi_data_cdb_xfer(r->req.cmd.buf);
P
pbrook 已提交
2135
    switch (command) {
2136 2137
    case READ_6:
    case READ_10:
G
Gerd Hoffmann 已提交
2138 2139
    case READ_12:
    case READ_16:
2140
        DPRINTF("Read (sector %" PRId64 ", count %u)\n", r->req.cmd.lba, len);
2141 2142 2143
        if (r->req.cmd.buf[1] & 0xe0) {
            goto illegal_request;
        }
2144
        if (!check_lba_range(s, r->req.cmd.lba, len)) {
2145
            goto illegal_lba;
2146
        }
P
Paolo Bonzini 已提交
2147 2148
        r->sector = r->req.cmd.lba * (s->qdev.blocksize / 512);
        r->sector_count = len * (s->qdev.blocksize / 512);
P
pbrook 已提交
2149
        break;
2150 2151
    case WRITE_6:
    case WRITE_10:
G
Gerd Hoffmann 已提交
2152 2153
    case WRITE_12:
    case WRITE_16:
2154
    case WRITE_VERIFY_10:
2155 2156
    case WRITE_VERIFY_12:
    case WRITE_VERIFY_16:
2157
        if (blk_is_read_only(s->qdev.conf.blk)) {
2158 2159 2160
            scsi_check_condition(r, SENSE_CODE(WRITE_PROTECTED));
            return 0;
        }
2161
        DPRINTF("Write %s(sector %" PRId64 ", count %u)\n",
2162 2163
                (command & 0xe) == 0xe ? "And Verify " : "",
                r->req.cmd.lba, len);
2164 2165 2166
        if (r->req.cmd.buf[1] & 0xe0) {
            goto illegal_request;
        }
2167
        if (!check_lba_range(s, r->req.cmd.lba, len)) {
2168
            goto illegal_lba;
2169
        }
P
Paolo Bonzini 已提交
2170 2171
        r->sector = r->req.cmd.lba * (s->qdev.blocksize / 512);
        r->sector_count = len * (s->qdev.blocksize / 512);
P
pbrook 已提交
2172
        break;
2173
    default:
2174
        abort();
2175 2176 2177
    illegal_request:
        scsi_check_condition(r, SENSE_CODE(INVALID_FIELD));
        return 0;
2178
    illegal_lba:
2179
        scsi_check_condition(r, SENSE_CODE(LBA_OUT_OF_RANGE));
2180
        return 0;
P
pbrook 已提交
2181
    }
2182
    if (r->sector_count == 0) {
2183
        scsi_req_complete(&r->req, GOOD);
P
pbrook 已提交
2184
    }
2185
    assert(r->iov.iov_len == 0);
2186
    if (r->req.cmd.mode == SCSI_XFER_TO_DEV) {
2187
        return -r->sector_count * 512;
P
pbrook 已提交
2188
    } else {
2189
        return r->sector_count * 512;
P
pbrook 已提交
2190 2191 2192
    }
}

J
Jan Kiszka 已提交
2193 2194 2195 2196 2197
/*
 * Device reset handler: purge outstanding requests with RESET sense,
 * recompute max_lba from the current backend geometry and clear the tray
 * state.
 */
static void scsi_disk_reset(DeviceState *dev)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev.qdev, dev);
    uint64_t nb_sectors;

    scsi_device_purge_requests(&s->qdev, SENSE_CODE(RESET));

    blk_get_geometry(s->qdev.conf.blk, &nb_sectors);
    /* Convert from 512-byte sectors to device blocks. */
    nb_sectors /= s->qdev.blocksize / 512;
    /* max_lba is the address of the last block; keep 0 for an empty disk. */
    if (nb_sectors) {
        nb_sectors--;
    }
    s->qdev.max_lba = nb_sectors;
    /* reset tray statuses */
    s->tray_locked = 0;
    s->tray_open = 0;
}

2211 2212 2213 2214 2215 2216 2217 2218
static void scsi_disk_resize_cb(void *opaque)
{
    SCSIDiskState *s = opaque;

    /* SPC lists this sense code as available only for
     * direct-access devices.
     */
    if (s->qdev.type == TYPE_DISK) {
2219
        scsi_device_report_change(&s->qdev, SENSE_CODE(CAPACITY_CHANGED));
2220 2221 2222
    }
}

2223
static void scsi_cd_change_media_cb(void *opaque, bool load)
2224
{
2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238
    SCSIDiskState *s = opaque;

    /*
     * When a CD gets changed, we have to report an ejected state and
     * then a loaded state to guests so that they detect tray
     * open/close and media change events.  Guests that do not use
     * GET_EVENT_STATUS_NOTIFICATION to detect such tray open/close
     * states rely on this behavior.
     *
     * media_changed governs the state machine used for unit attention
     * report.  media_event is used by GET EVENT STATUS NOTIFICATION.
     */
    s->media_changed = load;
    s->tray_open = !load;
2239
    scsi_device_set_ua(&s->qdev, SENSE_CODE(UNIT_ATTENTION_NO_MEDIUM));
2240
    s->media_event = true;
2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251
    s->eject_request = false;
}

/*
 * BlockDevOps eject-request callback; opaque is the SCSIDiskState.
 * Records the pending eject request and, when force is set, also drops
 * the tray lock.
 */
static void scsi_cd_eject_request_cb(void *opaque, bool force)
{
    SCSIDiskState *s = opaque;

    s->eject_request = true;
    if (force) {
        s->tray_locked = false;
    }
}

2254 2255 2256 2257 2258
static bool scsi_cd_is_tray_open(void *opaque)
{
    return ((SCSIDiskState *)opaque)->tray_open;
}

2259 2260 2261 2262 2263
static bool scsi_cd_is_medium_locked(void *opaque)
{
    return ((SCSIDiskState *)opaque)->tray_locked;
}

2264
static const BlockDevOps scsi_disk_removable_block_ops = {
2265
    .change_media_cb = scsi_cd_change_media_cb,
2266
    .eject_request_cb = scsi_cd_eject_request_cb,
2267
    .is_tray_open = scsi_cd_is_tray_open,
2268
    .is_medium_locked = scsi_cd_is_medium_locked,
2269 2270 2271 2272 2273 2274

    .resize_cb = scsi_disk_resize_cb,
};

/*
 * Block device callbacks installed by scsi_realize() for all other
 * devices: only resize notifications are handled.
 */
static const BlockDevOps scsi_disk_block_ops = {
    .resize_cb = scsi_disk_resize_cb,
};

2277 2278 2279 2280 2281
/*
 * unit_attention_reported hook: if a media change is still pending
 * (media_changed, set by scsi_cd_change_media_cb on load), clear the flag
 * and queue a MEDIUM_CHANGED unit attention.
 */
static void scsi_disk_unit_attention_reported(SCSIDevice *dev)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, dev);
    if (s->media_changed) {
        s->media_changed = false;
        scsi_device_set_ua(&s->qdev, SENSE_CODE(MEDIUM_CHANGED));
    }
}

2286
/*
 * Common realize step shared by the scsi-hd, scsi-cd and scsi-block
 * realize functions.  The caller must have set qdev.blocksize and
 * qdev.type beforehand.
 *
 * Validates the backend, fills in default block configuration and
 * identification strings, and installs the block device callbacks.
 * On failure an error is stored in errp and the function returns early.
 */
static void scsi_realize(SCSIDevice *dev, Error **errp)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, dev);
    Error *err = NULL;

    if (!s->qdev.conf.blk) {
        error_setg(errp, "drive property not set");
        return;
    }

    /* Only removable devices may start without a medium. */
    if (!(s->features & (1 << SCSI_DISK_F_REMOVABLE)) &&
        !blk_is_inserted(s->qdev.conf.blk)) {
        error_setg(errp, "Device needs media, but drive is empty");
        return;
    }

    blkconf_serial(&s->qdev.conf, &s->serial);
    blkconf_blocksizes(&s->qdev.conf);
    if (dev->type == TYPE_DISK) {
        blkconf_geometry(&dev->conf, NULL, 65535, 255, 255, &err);
        if (err) {
            error_propagate(errp, err);
            return;
        }
    }

    /* -1 means "not configured": pick a default granularity. */
    if (s->qdev.conf.discard_granularity == -1) {
        s->qdev.conf.discard_granularity =
            MAX(s->qdev.conf.logical_block_size, DEFAULT_DISCARD_GRANULARITY);
    }

    if (!s->version) {
        s->version = g_strdup(qemu_get_version());
    }
    if (!s->vendor) {
        s->vendor = g_strdup("QEMU");
    }

    if (blk_is_sg(s->qdev.conf.blk)) {
        error_setg(errp, "unwanted /dev/sg*");
        return;
    }

    if ((s->features & (1 << SCSI_DISK_F_REMOVABLE)) &&
            !(s->features & (1 << SCSI_DISK_F_NO_REMOVABLE_DEVOPS))) {
        blk_set_dev_ops(s->qdev.conf.blk, &scsi_disk_removable_block_ops, s);
    } else {
        blk_set_dev_ops(s->qdev.conf.blk, &scsi_disk_block_ops, s);
    }
    blk_set_guest_block_size(s->qdev.conf.blk, s->qdev.blocksize);

    blk_iostatus_enable(s->qdev.conf.blk);
}

2340
/*
 * Realize a scsi-hd device: block size taken from the configured logical
 * block size, type TYPE_DISK, default product string "QEMU HARDDISK".
 * The remaining setup is delegated to scsi_realize().
 */
static void scsi_hd_realize(SCSIDevice *dev, Error **errp)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, dev);
    /* can happen for devices without drive. The error message for missing
     * backend will be issued in scsi_realize
     */
    if (s->qdev.conf.blk) {
        blkconf_blocksizes(&s->qdev.conf);
    }
    s->qdev.blocksize = s->qdev.conf.logical_block_size;
    s->qdev.type = TYPE_DISK;
    if (!s->product) {
        s->product = g_strdup("QEMU HARDDISK");
    }
    scsi_realize(&s->qdev, errp);
}

2357
/*
 * Realize a scsi-cd device: fixed 2048-byte blocks, type TYPE_ROM, always
 * removable, default product string "QEMU CD-ROM".  The remaining setup
 * is delegated to scsi_realize().
 */
static void scsi_cd_realize(SCSIDevice *dev, Error **errp)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, dev);
    s->qdev.blocksize = 2048;
    s->qdev.type = TYPE_ROM;
    s->features |= 1 << SCSI_DISK_F_REMOVABLE;
    if (!s->product) {
        s->product = g_strdup("QEMU CD-ROM");
    }
    scsi_realize(&s->qdev, errp);
}

2369
/*
 * Realize function that picks CD-ROM or hard disk behaviour from the
 * legacy drive info of the backend (media_cd set means CD-ROM).
 */
static void scsi_disk_realize(SCSIDevice *dev, Error **errp)
{
    DriveInfo *dinfo;
    Error *local_err = NULL;

    if (!dev->conf.blk) {
        /* Without a backend scsi_realize() always fails; call it only
         * to obtain its error for the caller. */
        scsi_realize(dev, &local_err);
        assert(local_err);
        error_propagate(errp, local_err);
        return;
    }

    dinfo = blk_legacy_dinfo(dev->conf.blk);
    if (dinfo && dinfo->media_cd) {
        scsi_cd_realize(dev, errp);
    } else {
        scsi_hd_realize(dev, errp);
    }
}

2389
static const SCSIReqOps scsi_disk_emulate_reqops = {
P
Paolo Bonzini 已提交
2390
    .size         = sizeof(SCSIDiskReq),
2391
    .free_req     = scsi_free_request,
2392
    .send_command = scsi_disk_emulate_command,
2393 2394
    .read_data    = scsi_disk_emulate_read_data,
    .write_data   = scsi_disk_emulate_write_data,
2395 2396 2397 2398 2399 2400 2401
    .get_buf      = scsi_get_buf,
};

static const SCSIReqOps scsi_disk_dma_reqops = {
    .size         = sizeof(SCSIDiskReq),
    .free_req     = scsi_free_request,
    .send_command = scsi_disk_dma_command,
2402 2403 2404
    .read_data    = scsi_read_data,
    .write_data   = scsi_write_data,
    .get_buf      = scsi_get_buf,
P
Paolo Bonzini 已提交
2405 2406
    .load_request = scsi_disk_load_request,
    .save_request = scsi_disk_save_request,
P
Paolo Bonzini 已提交
2407 2408
};

2409 2410 2411 2412 2413 2414 2415 2416 2417 2418 2419 2420 2421 2422 2423 2424 2425 2426 2427 2428
static const SCSIReqOps *const scsi_disk_reqops_dispatch[256] = {
    [TEST_UNIT_READY]                 = &scsi_disk_emulate_reqops,
    [INQUIRY]                         = &scsi_disk_emulate_reqops,
    [MODE_SENSE]                      = &scsi_disk_emulate_reqops,
    [MODE_SENSE_10]                   = &scsi_disk_emulate_reqops,
    [START_STOP]                      = &scsi_disk_emulate_reqops,
    [ALLOW_MEDIUM_REMOVAL]            = &scsi_disk_emulate_reqops,
    [READ_CAPACITY_10]                = &scsi_disk_emulate_reqops,
    [READ_TOC]                        = &scsi_disk_emulate_reqops,
    [READ_DVD_STRUCTURE]              = &scsi_disk_emulate_reqops,
    [READ_DISC_INFORMATION]           = &scsi_disk_emulate_reqops,
    [GET_CONFIGURATION]               = &scsi_disk_emulate_reqops,
    [GET_EVENT_STATUS_NOTIFICATION]   = &scsi_disk_emulate_reqops,
    [MECHANISM_STATUS]                = &scsi_disk_emulate_reqops,
    [SERVICE_ACTION_IN_16]            = &scsi_disk_emulate_reqops,
    [REQUEST_SENSE]                   = &scsi_disk_emulate_reqops,
    [SYNCHRONIZE_CACHE]               = &scsi_disk_emulate_reqops,
    [SEEK_10]                         = &scsi_disk_emulate_reqops,
    [MODE_SELECT]                     = &scsi_disk_emulate_reqops,
    [MODE_SELECT_10]                  = &scsi_disk_emulate_reqops,
2429
    [UNMAP]                           = &scsi_disk_emulate_reqops,
2430 2431
    [WRITE_SAME_10]                   = &scsi_disk_emulate_reqops,
    [WRITE_SAME_16]                   = &scsi_disk_emulate_reqops,
P
Paolo Bonzini 已提交
2432 2433 2434
    [VERIFY_10]                       = &scsi_disk_emulate_reqops,
    [VERIFY_12]                       = &scsi_disk_emulate_reqops,
    [VERIFY_16]                       = &scsi_disk_emulate_reqops,
2435 2436 2437 2438 2439 2440 2441 2442 2443 2444 2445 2446 2447 2448

    [READ_6]                          = &scsi_disk_dma_reqops,
    [READ_10]                         = &scsi_disk_dma_reqops,
    [READ_12]                         = &scsi_disk_dma_reqops,
    [READ_16]                         = &scsi_disk_dma_reqops,
    [WRITE_6]                         = &scsi_disk_dma_reqops,
    [WRITE_10]                        = &scsi_disk_dma_reqops,
    [WRITE_12]                        = &scsi_disk_dma_reqops,
    [WRITE_16]                        = &scsi_disk_dma_reqops,
    [WRITE_VERIFY_10]                 = &scsi_disk_dma_reqops,
    [WRITE_VERIFY_12]                 = &scsi_disk_dma_reqops,
    [WRITE_VERIFY_16]                 = &scsi_disk_dma_reqops,
};

P
Paolo Bonzini 已提交
2449 2450
/*
 * Allocate a request for the CDB in buf, choosing the request operations
 * from scsi_disk_reqops_dispatch by opcode (buf[0]).  Opcodes without a
 * table entry use scsi_disk_emulate_reqops.
 *
 * Returns the request obtained from scsi_req_alloc().
 */
static SCSIRequest *scsi_new_request(SCSIDevice *d, uint32_t tag, uint32_t lun,
                                     uint8_t *buf, void *hba_private)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, d);
    SCSIRequest *req;
    const SCSIReqOps *ops;
    uint8_t command;

    command = buf[0];
    ops = scsi_disk_reqops_dispatch[command];
    if (!ops) {
        ops = &scsi_disk_emulate_reqops;
    }
    req = scsi_req_alloc(ops, &s->qdev, tag, lun, hba_private);

#ifdef DEBUG_SCSI
    /* Dump the whole CDB: opcode first, then the remaining bytes. */
    DPRINTF("Command: lun=%d tag=0x%x data=0x%02x", lun, tag, buf[0]);
    {
        int i;
        for (i = 1; i < scsi_cdb_length(buf); i++) {
            printf(" 0x%02x", buf[i]);
        }
        printf("\n");
    }
#endif

    return req;
}

2478 2479 2480 2481 2482 2483 2484 2485 2486 2487 2488 2489 2490 2491 2492 2493 2494 2495 2496 2497 2498 2499 2500 2501 2502
#ifdef __linux__
/*
 * Send an INQUIRY to the backend through SG_IO and record the result:
 * byte 0 of the response becomes s->qdev.type, and bit 7 of byte 1 sets
 * SCSI_DISK_F_REMOVABLE.
 *
 * Returns 0 on success, -1 if the ioctl fails or any of the SCSI, driver
 * or host status fields reports a problem.
 */
static int get_device_type(SCSIDiskState *s)
{
    uint8_t cmd[16];
    uint8_t buf[36];
    uint8_t sensebuf[8];
    sg_io_hdr_t io_header;
    int ret;

    memset(cmd, 0, sizeof(cmd));
    memset(buf, 0, sizeof(buf));
    cmd[0] = INQUIRY;
    cmd[4] = sizeof(buf);   /* allocation length */

    memset(&io_header, 0, sizeof(io_header));
    io_header.interface_id = 'S';
    io_header.dxfer_direction = SG_DXFER_FROM_DEV;
    io_header.dxfer_len = sizeof(buf);
    io_header.dxferp = buf;
    io_header.cmdp = cmd;
    io_header.cmd_len = sizeof(cmd);
    io_header.mx_sb_len = sizeof(sensebuf);
    io_header.sbp = sensebuf;
    io_header.timeout = 6000; /* XXX */

    ret = blk_ioctl(s->qdev.conf.blk, SG_IO, &io_header);
    /*
     * A non-zero SCSI status means the INQUIRY itself did not succeed,
     * in which case buf still holds the zeros written above and must not
     * be interpreted as a device type.
     */
    if (ret < 0 || io_header.status || io_header.driver_status ||
        io_header.host_status) {
        return -1;
    }
    s->qdev.type = buf[0];
    if (buf[1] & 0x80) {
        s->features |= 1 << SCSI_DISK_F_REMOVABLE;
    }
    return 0;
}

2514
/*
 * Realize a scsi-block device: check that the backend speaks SG_IO
 * version 3 or later, read the device type via INQUIRY, guess the block
 * size from the type and finish with the common scsi_realize().
 * On failure an error is stored in errp and the function returns early.
 */
static void scsi_block_realize(SCSIDevice *dev, Error **errp)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, dev);
    int sg_version;
    int rc;

    if (!s->qdev.conf.blk) {
        error_setg(errp, "drive property not set");
        return;
    }

    /* check we are using a driver managing SG_IO (version 3 and after) */
    rc = blk_ioctl(s->qdev.conf.blk, SG_GET_VERSION_NUM, &sg_version);
    if (rc < 0) {
        error_setg(errp, "cannot get SG_IO version number: %s.  "
                     "Is this a SCSI device?",
                     strerror(-rc));
        return;
    }
    if (sg_version < 30000) {
        error_setg(errp, "scsi generic interface too old");
        return;
    }

    /* get device type from INQUIRY data */
    rc = get_device_type(s);
    if (rc < 0) {
        error_setg(errp, "INQUIRY failed");
        return;
    }

    /* Make a guess for the block size, we'll fix it when the guest sends
     * READ CAPACITY.  If they don't, they likely would assume these sizes
     * anyway. (TODO: check in /sys).
     */
    if (s->qdev.type == TYPE_ROM || s->qdev.type == TYPE_WORM) {
        s->qdev.blocksize = 2048;
    } else {
        s->qdev.blocksize = 512;
    }

    /* Makes the scsi-block device not removable by using HMP and QMP eject
     * command.
     */
    s->features |= (1 << SCSI_DISK_F_NO_REMOVABLE_DEVOPS);

    scsi_realize(&s->qdev, errp);
}

2563
/*
 * Decide whether the CDB in buf must be passed through via SG_IO.
 *
 * Returns false only for the READ/VERIFY/WRITE opcodes listed below, and
 * only when the backend was opened with BDRV_O_NOCACHE and the device is
 * not TYPE_ROM.  Returns true for everything else.
 */
static bool scsi_block_is_passthrough(SCSIDiskState *s, uint8_t *buf)
{
    switch (buf[0]) {
    case READ_6:
    case READ_10:
    case READ_12:
    case READ_16:
    case VERIFY_10:
    case VERIFY_12:
    case VERIFY_16:
    case WRITE_6:
    case WRITE_10:
    case WRITE_12:
    case WRITE_16:
    case WRITE_VERIFY_10:
    case WRITE_VERIFY_12:
    case WRITE_VERIFY_16:
        /* If we are not using O_DIRECT, we might read stale data from the
         * host cache if writes were made using other commands than these
         * ones (such as WRITE SAME or EXTENDED COPY, etc.).  So, without
         * O_DIRECT everything must go through SG_IO.
         */
        if (!(blk_get_flags(s->qdev.conf.blk) & BDRV_O_NOCACHE)) {
            break;
        }

        /* MMC writing cannot be done via pread/pwrite, because it sometimes
         * involves writing beyond the maximum LBA or to negative LBA (lead-in).
         * And once you do these writes, reading from the block device is
         * unreliable, too.  It is even possible that reads deliver random data
         * from the host page cache (this is probably a Linux bug).
         *
         * We might use scsi_disk_dma_reqops as long as no writing commands are
         * seen, but performance usually isn't paramount on optical media.  So,
         * just make scsi-block operate the same as scsi-generic for them.
         */
        if (s->qdev.type != TYPE_ROM) {
            return false;
        }
        break;

    default:
        break;
    }

    return true;
}


/*
 * Allocate a request for scsi-block: commands that must be passed through
 * get scsi_generic_req_ops, all others get scsi_disk_dma_reqops.
 */
static SCSIRequest *scsi_block_new_request(SCSIDevice *d, uint32_t tag,
                                           uint32_t lun, uint8_t *buf,
                                           void *hba_private)
{
    SCSIDiskState *s = DO_UPCAST(SCSIDiskState, qdev, d);

    if (scsi_block_is_passthrough(s, buf)) {
        return scsi_req_alloc(&scsi_generic_req_ops, &s->qdev, tag, lun,
                              hba_private);
    } else {
        return scsi_req_alloc(&scsi_disk_dma_reqops, &s->qdev, tag, lun,
                              hba_private);
    }
}
2626 2627 2628 2629 2630 2631 2632 2633 2634 2635 2636 2637 2638

/*
 * Parse the CDB in buf into cmd for a scsi-block device.  Passthrough
 * commands are parsed by scsi_bus_parse_cdb(), the rest by
 * scsi_req_parse_cdb(); the chosen parser's return value is passed on.
 */
static int scsi_block_parse_cdb(SCSIDevice *d, SCSICommand *cmd,
                                  uint8_t *buf, void *hba_private)
{
    SCSIDiskState *disk = DO_UPCAST(SCSIDiskState, qdev, d);

    if (!scsi_block_is_passthrough(disk, buf)) {
        return scsi_req_parse_cdb(&disk->qdev, cmd, buf);
    }

    return scsi_bus_parse_cdb(&disk->qdev, cmd, buf, hba_private);
}

2639 2640
#endif

2641 2642 2643 2644 2645 2646
/*
 * Property entries common to the scsi-hd and scsi-cd property lists: the
 * block properties of qdev.conf plus the "ver", "serial", "vendor" and
 * "product" strings.  Expands to a comma-separated list without a
 * trailing comma.
 */
#define DEFINE_SCSI_DISK_PROPERTIES()                                \
    DEFINE_BLOCK_PROPERTIES(SCSIDiskState, qdev.conf),               \
    DEFINE_PROP_STRING("ver", SCSIDiskState, version),               \
    DEFINE_PROP_STRING("serial", SCSIDiskState, serial),             \
    DEFINE_PROP_STRING("vendor", SCSIDiskState, vendor),             \
    DEFINE_PROP_STRING("product", SCSIDiskState, product)
2647

2648 2649
static Property scsi_hd_properties[] = {
    DEFINE_SCSI_DISK_PROPERTIES(),
2650 2651
    DEFINE_PROP_BIT("removable", SCSIDiskState, features,
                    SCSI_DISK_F_REMOVABLE, false),
P
Paolo Bonzini 已提交
2652 2653
    DEFINE_PROP_BIT("dpofua", SCSIDiskState, features,
                    SCSI_DISK_F_DPOFUA, false),
2654
    DEFINE_PROP_UINT64("wwn", SCSIDiskState, wwn, 0),
2655 2656
    DEFINE_PROP_UINT64("port_wwn", SCSIDiskState, port_wwn, 0),
    DEFINE_PROP_UINT16("port_index", SCSIDiskState, port_index, 0),
2657 2658
    DEFINE_PROP_UINT64("max_unmap_size", SCSIDiskState, max_unmap_size,
                       DEFAULT_MAX_UNMAP_SIZE),
2659 2660
    DEFINE_PROP_UINT64("max_io_size", SCSIDiskState, max_io_size,
                       DEFAULT_MAX_IO_SIZE),
2661
    DEFINE_BLOCK_CHS_PROPERTIES(SCSIDiskState, qdev.conf),
2662 2663 2664
    DEFINE_PROP_END_OF_LIST(),
};

P
Paolo Bonzini 已提交
2665 2666 2667 2668 2669 2670 2671 2672 2673 2674 2675 2676 2677 2678 2679
/*
 * VMState description for SCSIDiskState, named "scsi-disk", version 1
 * (minimum accepted version 1).  It is installed as dc->vmsd by the
 * scsi-hd, scsi-cd, scsi-block and scsi-disk class initializers.
 *
 * Covered fields: the embedded SCSI device (qdev) and the boolean
 * media/tray flags listed below.
 */
static const VMStateDescription vmstate_scsi_disk_state = {
    .name = "scsi-disk",
    .version_id = 1,
    .minimum_version_id = 1,
    .fields = (VMStateField[]) {
        VMSTATE_SCSI_DEVICE(qdev, SCSIDiskState),
        VMSTATE_BOOL(media_changed, SCSIDiskState),
        VMSTATE_BOOL(media_event, SCSIDiskState),
        VMSTATE_BOOL(eject_request, SCSIDiskState),
        VMSTATE_BOOL(tray_open, SCSIDiskState),
        VMSTATE_BOOL(tray_locked, SCSIDiskState),
        VMSTATE_END_OF_LIST()
    }
};

2680 2681
/*
 * Class initializer for the "scsi-hd" type (see scsi_hd_info).
 *
 * Installs the SCSI device hooks (realize, request allocation, unit
 * attention reporting) and fills in the generic device class: firmware
 * name, description, reset handler, property table and vmstate.
 *
 * @klass: class being initialized
 * @data:  unused
 */
static void scsi_hd_class_initfn(ObjectClass *klass, void *data)
{
    DeviceClass *dc = DEVICE_CLASS(klass);
    SCSIDeviceClass *sc = SCSI_DEVICE_CLASS(klass);

    sc->realize      = scsi_hd_realize;
    sc->alloc_req    = scsi_new_request;
    sc->unit_attention_reported = scsi_disk_unit_attention_reported;
    dc->fw_name = "disk";
    dc->desc = "virtual SCSI disk";
    dc->reset = scsi_disk_reset;
    dc->props = scsi_hd_properties;
    dc->vmsd  = &vmstate_scsi_disk_state;
}

2695
static const TypeInfo scsi_hd_info = {
2696 2697 2698 2699 2700 2701 2702 2703
    .name          = "scsi-hd",
    .parent        = TYPE_SCSI_DEVICE,
    .instance_size = sizeof(SCSIDiskState),
    .class_init    = scsi_hd_class_initfn,
};

static Property scsi_cd_properties[] = {
    DEFINE_SCSI_DISK_PROPERTIES(),
2704
    DEFINE_PROP_UINT64("wwn", SCSIDiskState, wwn, 0),
2705 2706
    DEFINE_PROP_UINT64("port_wwn", SCSIDiskState, port_wwn, 0),
    DEFINE_PROP_UINT16("port_index", SCSIDiskState, port_index, 0),
2707 2708
    DEFINE_PROP_UINT64("max_io_size", SCSIDiskState, max_io_size,
                       DEFAULT_MAX_IO_SIZE),
2709
    DEFINE_PROP_END_OF_LIST(),
2710 2711 2712 2713
};

/*
 * Class initializer for the "scsi-cd" type (see scsi_cd_info).
 *
 * Installs the SCSI device hooks (realize, request allocation, unit
 * attention reporting) and fills in the generic device class: firmware
 * name, description, reset handler, property table and vmstate.
 *
 * @klass: class being initialized
 * @data:  unused
 */
static void scsi_cd_class_initfn(ObjectClass *klass, void *data)
{
    DeviceClass *dc = DEVICE_CLASS(klass);
    SCSIDeviceClass *sc = SCSI_DEVICE_CLASS(klass);

    sc->realize      = scsi_cd_realize;
    sc->alloc_req    = scsi_new_request;
    sc->unit_attention_reported = scsi_disk_unit_attention_reported;
    dc->fw_name = "disk";
    dc->desc = "virtual SCSI CD-ROM";
    dc->reset = scsi_disk_reset;
    dc->props = scsi_cd_properties;
    dc->vmsd  = &vmstate_scsi_disk_state;
}

2727
static const TypeInfo scsi_cd_info = {
2728 2729 2730 2731
    .name          = "scsi-cd",
    .parent        = TYPE_SCSI_DEVICE,
    .instance_size = sizeof(SCSIDiskState),
    .class_init    = scsi_cd_class_initfn,
2732 2733
};

2734
#ifdef __linux__
2735
static Property scsi_block_properties[] = {
2736
    DEFINE_PROP_DRIVE("drive", SCSIDiskState, qdev.conf.blk),
2737 2738 2739
    DEFINE_PROP_END_OF_LIST(),
};

2740 2741
/*
 * Class initializer for the "scsi-block" type (see scsi_block_info).
 *
 * Unlike the other class initializers in this file it installs its own
 * request allocator and a parse_cdb hook, and does not set
 * unit_attention_reported.  The generic device class gets the firmware
 * name, description, reset handler, property table and vmstate.
 *
 * @klass: class being initialized
 * @data:  unused
 */
static void scsi_block_class_initfn(ObjectClass *klass, void *data)
{
    DeviceClass *dc = DEVICE_CLASS(klass);
    SCSIDeviceClass *sc = SCSI_DEVICE_CLASS(klass);

    sc->realize      = scsi_block_realize;
    sc->alloc_req    = scsi_block_new_request;
    sc->parse_cdb    = scsi_block_parse_cdb;
    dc->fw_name = "disk";
    dc->desc = "SCSI block device passthrough";
    dc->reset = scsi_disk_reset;
    dc->props = scsi_block_properties;
    dc->vmsd  = &vmstate_scsi_disk_state;
}

2755
static const TypeInfo scsi_block_info = {
2756 2757 2758 2759
    .name          = "scsi-block",
    .parent        = TYPE_SCSI_DEVICE,
    .instance_size = sizeof(SCSIDiskState),
    .class_init    = scsi_block_class_initfn,
2760
};
2761
#endif
2762

2763 2764
static Property scsi_disk_properties[] = {
    DEFINE_SCSI_DISK_PROPERTIES(),
2765 2766
    DEFINE_PROP_BIT("removable", SCSIDiskState, features,
                    SCSI_DISK_F_REMOVABLE, false),
P
Paolo Bonzini 已提交
2767 2768
    DEFINE_PROP_BIT("dpofua", SCSIDiskState, features,
                    SCSI_DISK_F_DPOFUA, false),
2769
    DEFINE_PROP_UINT64("wwn", SCSIDiskState, wwn, 0),
2770 2771
    DEFINE_PROP_UINT64("port_wwn", SCSIDiskState, port_wwn, 0),
    DEFINE_PROP_UINT16("port_index", SCSIDiskState, port_index, 0),
2772 2773
    DEFINE_PROP_UINT64("max_unmap_size", SCSIDiskState, max_unmap_size,
                       DEFAULT_MAX_UNMAP_SIZE),
2774 2775
    DEFINE_PROP_UINT64("max_io_size", SCSIDiskState, max_io_size,
                       DEFAULT_MAX_IO_SIZE),
2776 2777 2778
    DEFINE_PROP_END_OF_LIST(),
};

2779 2780
/*
 * Class initializer for the legacy "scsi-disk" type (see scsi_disk_info).
 *
 * Installs the SCSI device hooks (realize, request allocation, unit
 * attention reporting) and fills in the generic device class: firmware
 * name, description, reset handler, property table and vmstate.
 *
 * @klass: class being initialized
 * @data:  unused
 */
static void scsi_disk_class_initfn(ObjectClass *klass, void *data)
{
    DeviceClass *dc = DEVICE_CLASS(klass);
    SCSIDeviceClass *sc = SCSI_DEVICE_CLASS(klass);

    sc->realize      = scsi_disk_realize;
    sc->alloc_req    = scsi_new_request;
    sc->unit_attention_reported = scsi_disk_unit_attention_reported;
    dc->fw_name = "disk";
    dc->desc = "virtual SCSI disk or CD-ROM (legacy)";
    dc->reset = scsi_disk_reset;
    dc->props = scsi_disk_properties;
    dc->vmsd  = &vmstate_scsi_disk_state;
}

2794
static const TypeInfo scsi_disk_info = {
2795 2796 2797 2798
    .name          = "scsi-disk",
    .parent        = TYPE_SCSI_DEVICE,
    .instance_size = sizeof(SCSIDiskState),
    .class_init    = scsi_disk_class_initfn,
2799 2800
};

A
Andreas Färber 已提交
2801
static void scsi_disk_register_types(void)
2802
{
2803 2804
    type_register_static(&scsi_hd_info);
    type_register_static(&scsi_cd_info);
2805
#ifdef __linux__
2806
    type_register_static(&scsi_block_info);
2807
#endif
2808
    type_register_static(&scsi_disk_info);
T
ths 已提交
2809
}
A
Andreas Färber 已提交
2810 2811

/*
 * Hand scsi_disk_register_types() to the type_init() macro.
 * NOTE(review): type_init() is defined outside this file; presumably it
 * arranges for the function to run during type registration -- confirm.
 */
type_init(scsi_disk_register_types)