提交 c34688f9 编写于 作者: A Anthony Liguori

Merge remote-tracking branch 'stefanha/block' into staging

# By Liu Yuan (4) and others
# Via Stefan Hajnoczi
* stefanha/block:
  sheepdog: fix loadvm operation
  sheepdog: resend write requests when SD_RES_READONLY is received
  sheepdog: add helper function to reload inode
  sheepdog: add SD_RES_READONLY result code
  sheepdog: cleanup find_vdi_name
  rbd: Fix use after free in rbd_open()
  block: Disable driver-specific options for 1.5
  sheepdog: implement .bdrv_co_is_allocated()
  sheepdog: use BDRV_SECTOR_SIZE
  sheepdog: add discard/trim support for sheepdog
  block/ssh: Require libssh2 >= 1.2.8.

Message-id: 1366976682-10251-1-git-send-email-stefanha@redhat.com
Signed-off-by: NAnthony Liguori <aliguori@us.ibm.com>
...@@ -478,20 +478,20 @@ static int qemu_rbd_open(BlockDriverState *bs, QDict *options, int flags) ...@@ -478,20 +478,20 @@ static int qemu_rbd_open(BlockDriverState *bs, QDict *options, int flags)
} }
filename = qemu_opt_get(opts, "filename"); filename = qemu_opt_get(opts, "filename");
qemu_opts_del(opts);
if (qemu_rbd_parsename(filename, pool, sizeof(pool), if (qemu_rbd_parsename(filename, pool, sizeof(pool),
snap_buf, sizeof(snap_buf), snap_buf, sizeof(snap_buf),
s->name, sizeof(s->name), s->name, sizeof(s->name),
conf, sizeof(conf)) < 0) { conf, sizeof(conf)) < 0) {
return -EINVAL; r = -EINVAL;
goto failed_opts;
} }
clientname = qemu_rbd_parse_clientname(conf, clientname_buf); clientname = qemu_rbd_parse_clientname(conf, clientname_buf);
r = rados_create(&s->cluster, clientname); r = rados_create(&s->cluster, clientname);
if (r < 0) { if (r < 0) {
error_report("error initializing"); error_report("error initializing");
return r; goto failed_opts;
} }
s->snap = NULL; s->snap = NULL;
...@@ -557,6 +557,7 @@ static int qemu_rbd_open(BlockDriverState *bs, QDict *options, int flags) ...@@ -557,6 +557,7 @@ static int qemu_rbd_open(BlockDriverState *bs, QDict *options, int flags)
NULL, qemu_rbd_aio_flush_cb, s); NULL, qemu_rbd_aio_flush_cb, s);
qemu_opts_del(opts);
return 0; return 0;
failed: failed:
...@@ -566,6 +567,8 @@ failed_open: ...@@ -566,6 +567,8 @@ failed_open:
failed_shutdown: failed_shutdown:
rados_shutdown(s->cluster); rados_shutdown(s->cluster);
g_free(s->snap); g_free(s->snap);
failed_opts:
qemu_opts_del(opts);
return r; return r;
} }
......
...@@ -27,6 +27,8 @@ ...@@ -27,6 +27,8 @@
#define SD_OP_CREATE_AND_WRITE_OBJ 0x01 #define SD_OP_CREATE_AND_WRITE_OBJ 0x01
#define SD_OP_READ_OBJ 0x02 #define SD_OP_READ_OBJ 0x02
#define SD_OP_WRITE_OBJ 0x03 #define SD_OP_WRITE_OBJ 0x03
/* 0x04 is used internally by Sheepdog */
#define SD_OP_DISCARD_OBJ 0x05
#define SD_OP_NEW_VDI 0x11 #define SD_OP_NEW_VDI 0x11
#define SD_OP_LOCK_VDI 0x12 #define SD_OP_LOCK_VDI 0x12
...@@ -34,6 +36,7 @@ ...@@ -34,6 +36,7 @@
#define SD_OP_GET_VDI_INFO 0x14 #define SD_OP_GET_VDI_INFO 0x14
#define SD_OP_READ_VDIS 0x15 #define SD_OP_READ_VDIS 0x15
#define SD_OP_FLUSH_VDI 0x16 #define SD_OP_FLUSH_VDI 0x16
#define SD_OP_DEL_VDI 0x17
#define SD_FLAG_CMD_WRITE 0x01 #define SD_FLAG_CMD_WRITE 0x01
#define SD_FLAG_CMD_COW 0x02 #define SD_FLAG_CMD_COW 0x02
...@@ -66,6 +69,7 @@ ...@@ -66,6 +69,7 @@
#define SD_RES_WAIT_FOR_JOIN 0x17 /* Waiting for other nodes joining */ #define SD_RES_WAIT_FOR_JOIN 0x17 /* Waiting for other nodes joining */
#define SD_RES_JOIN_FAILED 0x18 /* Target node had failed to join sheepdog */ #define SD_RES_JOIN_FAILED 0x18 /* Target node had failed to join sheepdog */
#define SD_RES_HALT 0x19 /* Sheepdog is stopped serving IO request */ #define SD_RES_HALT 0x19 /* Sheepdog is stopped serving IO request */
#define SD_RES_READONLY 0x1A /* Object is read-only */
/* /*
* Object ID rules * Object ID rules
...@@ -87,7 +91,6 @@ ...@@ -87,7 +91,6 @@
#define SD_NR_VDIS (1U << 24) #define SD_NR_VDIS (1U << 24)
#define SD_DATA_OBJ_SIZE (UINT64_C(1) << 22) #define SD_DATA_OBJ_SIZE (UINT64_C(1) << 22)
#define SD_MAX_VDI_SIZE (SD_DATA_OBJ_SIZE * MAX_DATA_OBJS) #define SD_MAX_VDI_SIZE (SD_DATA_OBJ_SIZE * MAX_DATA_OBJS)
#define SECTOR_SIZE 512
#define SD_INODE_SIZE (sizeof(SheepdogInode)) #define SD_INODE_SIZE (sizeof(SheepdogInode))
#define CURRENT_VDI_ID 0 #define CURRENT_VDI_ID 0
...@@ -269,6 +272,7 @@ enum AIOCBState { ...@@ -269,6 +272,7 @@ enum AIOCBState {
AIOCB_WRITE_UDATA, AIOCB_WRITE_UDATA,
AIOCB_READ_UDATA, AIOCB_READ_UDATA,
AIOCB_FLUSH_CACHE, AIOCB_FLUSH_CACHE,
AIOCB_DISCARD_OBJ,
}; };
struct SheepdogAIOCB { struct SheepdogAIOCB {
...@@ -298,6 +302,7 @@ typedef struct BDRVSheepdogState { ...@@ -298,6 +302,7 @@ typedef struct BDRVSheepdogState {
char name[SD_MAX_VDI_LEN]; char name[SD_MAX_VDI_LEN];
bool is_snapshot; bool is_snapshot;
uint32_t cache_flags; uint32_t cache_flags;
bool discard_supported;
char *host_spec; char *host_spec;
bool is_unix; bool is_unix;
...@@ -346,6 +351,7 @@ static const char * sd_strerror(int err) ...@@ -346,6 +351,7 @@ static const char * sd_strerror(int err)
{SD_RES_WAIT_FOR_JOIN, "Sheepdog is waiting for other nodes joining"}, {SD_RES_WAIT_FOR_JOIN, "Sheepdog is waiting for other nodes joining"},
{SD_RES_JOIN_FAILED, "Target node had failed to join sheepdog"}, {SD_RES_JOIN_FAILED, "Target node had failed to join sheepdog"},
{SD_RES_HALT, "Sheepdog is stopped serving IO request"}, {SD_RES_HALT, "Sheepdog is stopped serving IO request"},
{SD_RES_READONLY, "Object is read-only"},
}; };
for (i = 0; i < ARRAY_SIZE(errors); ++i) { for (i = 0; i < ARRAY_SIZE(errors); ++i) {
...@@ -600,6 +606,7 @@ static int do_req(int sockfd, SheepdogReq *hdr, void *data, ...@@ -600,6 +606,7 @@ static int do_req(int sockfd, SheepdogReq *hdr, void *data,
static int coroutine_fn add_aio_request(BDRVSheepdogState *s, AIOReq *aio_req, static int coroutine_fn add_aio_request(BDRVSheepdogState *s, AIOReq *aio_req,
struct iovec *iov, int niov, bool create, struct iovec *iov, int niov, bool create,
enum AIOCBState aiocb_type); enum AIOCBState aiocb_type);
static int coroutine_fn resend_aioreq(BDRVSheepdogState *s, AIOReq *aio_req);
static AIOReq *find_pending_req(BDRVSheepdogState *s, uint64_t oid) static AIOReq *find_pending_req(BDRVSheepdogState *s, uint64_t oid)
...@@ -656,7 +663,7 @@ static void coroutine_fn aio_read_response(void *opaque) ...@@ -656,7 +663,7 @@ static void coroutine_fn aio_read_response(void *opaque)
int ret; int ret;
AIOReq *aio_req = NULL; AIOReq *aio_req = NULL;
SheepdogAIOCB *acb; SheepdogAIOCB *acb;
unsigned long idx; uint64_t idx;
if (QLIST_EMPTY(&s->inflight_aio_head)) { if (QLIST_EMPTY(&s->inflight_aio_head)) {
goto out; goto out;
...@@ -727,11 +734,36 @@ static void coroutine_fn aio_read_response(void *opaque) ...@@ -727,11 +734,36 @@ static void coroutine_fn aio_read_response(void *opaque)
rsp.result = SD_RES_SUCCESS; rsp.result = SD_RES_SUCCESS;
} }
break; break;
case AIOCB_DISCARD_OBJ:
switch (rsp.result) {
case SD_RES_INVALID_PARMS:
error_report("sheep(%s) doesn't support discard command",
s->host_spec);
rsp.result = SD_RES_SUCCESS;
s->discard_supported = false;
break;
case SD_RES_SUCCESS:
idx = data_oid_to_idx(aio_req->oid);
s->inode.data_vdi_id[idx] = 0;
break;
default:
break;
}
} }
if (rsp.result != SD_RES_SUCCESS) { switch (rsp.result) {
case SD_RES_SUCCESS:
break;
case SD_RES_READONLY:
ret = resend_aioreq(s, aio_req);
if (ret == SD_RES_SUCCESS) {
goto out;
}
/* fall through */
default:
acb->ret = -EIO; acb->ret = -EIO;
error_report("%s", sd_strerror(rsp.result)); error_report("%s", sd_strerror(rsp.result));
break;
} }
free_aio_req(s, aio_req); free_aio_req(s, aio_req);
...@@ -923,8 +955,9 @@ static int parse_vdiname(BDRVSheepdogState *s, const char *filename, ...@@ -923,8 +955,9 @@ static int parse_vdiname(BDRVSheepdogState *s, const char *filename,
return ret; return ret;
} }
static int find_vdi_name(BDRVSheepdogState *s, char *filename, uint32_t snapid, static int find_vdi_name(BDRVSheepdogState *s, const char *filename,
char *tag, uint32_t *vid, int for_snapshot) uint32_t snapid, const char *tag, uint32_t *vid,
bool lock)
{ {
int ret, fd; int ret, fd;
SheepdogVdiReq hdr; SheepdogVdiReq hdr;
...@@ -945,10 +978,10 @@ static int find_vdi_name(BDRVSheepdogState *s, char *filename, uint32_t snapid, ...@@ -945,10 +978,10 @@ static int find_vdi_name(BDRVSheepdogState *s, char *filename, uint32_t snapid,
strncpy(buf + SD_MAX_VDI_LEN, tag, SD_MAX_VDI_TAG_LEN); strncpy(buf + SD_MAX_VDI_LEN, tag, SD_MAX_VDI_TAG_LEN);
memset(&hdr, 0, sizeof(hdr)); memset(&hdr, 0, sizeof(hdr));
if (for_snapshot) { if (lock) {
hdr.opcode = SD_OP_GET_VDI_INFO;
} else {
hdr.opcode = SD_OP_LOCK_VDI; hdr.opcode = SD_OP_LOCK_VDI;
} else {
hdr.opcode = SD_OP_GET_VDI_INFO;
} }
wlen = SD_MAX_VDI_LEN + SD_MAX_VDI_TAG_LEN; wlen = SD_MAX_VDI_LEN + SD_MAX_VDI_TAG_LEN;
hdr.proto_ver = SD_PROTO_VER; hdr.proto_ver = SD_PROTO_VER;
...@@ -1016,6 +1049,9 @@ static int coroutine_fn add_aio_request(BDRVSheepdogState *s, AIOReq *aio_req, ...@@ -1016,6 +1049,9 @@ static int coroutine_fn add_aio_request(BDRVSheepdogState *s, AIOReq *aio_req,
wlen = datalen; wlen = datalen;
hdr.flags = SD_FLAG_CMD_WRITE | flags; hdr.flags = SD_FLAG_CMD_WRITE | flags;
break; break;
case AIOCB_DISCARD_OBJ:
hdr.opcode = SD_OP_DISCARD_OBJ;
break;
} }
if (s->cache_flags) { if (s->cache_flags) {
...@@ -1126,6 +1162,89 @@ static int write_object(int fd, char *buf, uint64_t oid, int copies, ...@@ -1126,6 +1162,89 @@ static int write_object(int fd, char *buf, uint64_t oid, int copies,
create, cache_flags); create, cache_flags);
} }
/* update inode with the latest state */
static int reload_inode(BDRVSheepdogState *s, uint32_t snapid, const char *tag)
{
SheepdogInode *inode;
int ret = 0, fd;
uint32_t vid = 0;
fd = connect_to_sdog(s);
if (fd < 0) {
return -EIO;
}
inode = g_malloc(sizeof(s->inode));
ret = find_vdi_name(s, s->name, snapid, tag, &vid, false);
if (ret) {
goto out;
}
ret = read_object(fd, (char *)inode, vid_to_vdi_oid(vid),
s->inode.nr_copies, sizeof(*inode), 0, s->cache_flags);
if (ret < 0) {
goto out;
}
if (inode->vdi_id != s->inode.vdi_id) {
memcpy(&s->inode, inode, sizeof(s->inode));
}
out:
g_free(inode);
closesocket(fd);
return ret;
}
static int coroutine_fn resend_aioreq(BDRVSheepdogState *s, AIOReq *aio_req)
{
SheepdogAIOCB *acb = aio_req->aiocb;
bool create = false;
int ret;
ret = reload_inode(s, 0, "");
if (ret < 0) {
return ret;
}
aio_req->oid = vid_to_data_oid(s->inode.vdi_id,
data_oid_to_idx(aio_req->oid));
/* check whether this request becomes a CoW one */
if (acb->aiocb_type == AIOCB_WRITE_UDATA) {
int idx = data_oid_to_idx(aio_req->oid);
AIOReq *areq;
if (s->inode.data_vdi_id[idx] == 0) {
create = true;
goto out;
}
if (is_data_obj_writable(&s->inode, idx)) {
goto out;
}
/* link to the pending list if there is another CoW request to
* the same object */
QLIST_FOREACH(areq, &s->inflight_aio_head, aio_siblings) {
if (areq != aio_req && areq->oid == aio_req->oid) {
dprintf("simultaneous CoW to %" PRIx64 "\n", aio_req->oid);
QLIST_REMOVE(aio_req, aio_siblings);
QLIST_INSERT_HEAD(&s->pending_aio_head, aio_req, aio_siblings);
return SD_RES_SUCCESS;
}
}
aio_req->base_oid = vid_to_data_oid(s->inode.data_vdi_id[idx], idx);
aio_req->flags |= SD_FLAG_CMD_COW;
create = true;
}
out:
return add_aio_request(s, aio_req, acb->qiov->iov, acb->qiov->niov,
create, acb->aiocb_type);
}
/* TODO Convert to fine grained options */ /* TODO Convert to fine grained options */
static QemuOptsList runtime_opts = { static QemuOptsList runtime_opts = {
.name = "sheepdog", .name = "sheepdog",
...@@ -1184,7 +1303,7 @@ static int sd_open(BlockDriverState *bs, QDict *options, int flags) ...@@ -1184,7 +1303,7 @@ static int sd_open(BlockDriverState *bs, QDict *options, int flags)
goto out; goto out;
} }
ret = find_vdi_name(s, vdi, snapid, tag, &vid, 0); ret = find_vdi_name(s, vdi, snapid, tag, &vid, true);
if (ret) { if (ret) {
goto out; goto out;
} }
...@@ -1197,6 +1316,7 @@ static int sd_open(BlockDriverState *bs, QDict *options, int flags) ...@@ -1197,6 +1316,7 @@ static int sd_open(BlockDriverState *bs, QDict *options, int flags)
if (flags & BDRV_O_NOCACHE) { if (flags & BDRV_O_NOCACHE) {
s->cache_flags = SD_FLAG_CMD_DIRECT; s->cache_flags = SD_FLAG_CMD_DIRECT;
} }
s->discard_supported = true;
if (snapid || tag[0] != '\0') { if (snapid || tag[0] != '\0') {
dprintf("%" PRIx32 " snapshot inode was open.\n", vid); dprintf("%" PRIx32 " snapshot inode was open.\n", vid);
...@@ -1223,7 +1343,7 @@ static int sd_open(BlockDriverState *bs, QDict *options, int flags) ...@@ -1223,7 +1343,7 @@ static int sd_open(BlockDriverState *bs, QDict *options, int flags)
s->min_dirty_data_idx = UINT32_MAX; s->min_dirty_data_idx = UINT32_MAX;
s->max_dirty_data_idx = 0; s->max_dirty_data_idx = 0;
bs->total_sectors = s->inode.vdi_size / SECTOR_SIZE; bs->total_sectors = s->inode.vdi_size / BDRV_SECTOR_SIZE;
pstrcpy(s->name, sizeof(s->name), vdi); pstrcpy(s->name, sizeof(s->name), vdi);
qemu_co_mutex_init(&s->lock); qemu_co_mutex_init(&s->lock);
qemu_opts_del(opts); qemu_opts_del(opts);
...@@ -1547,6 +1667,43 @@ out: ...@@ -1547,6 +1667,43 @@ out:
sd_finish_aiocb(acb); sd_finish_aiocb(acb);
} }
/* Delete current working VDI on the snapshot chain */
static bool sd_delete(BDRVSheepdogState *s)
{
unsigned int wlen = SD_MAX_VDI_LEN, rlen = 0;
SheepdogVdiReq hdr = {
.opcode = SD_OP_DEL_VDI,
.vdi_id = s->inode.vdi_id,
.data_length = wlen,
.flags = SD_FLAG_CMD_WRITE,
};
SheepdogVdiRsp *rsp = (SheepdogVdiRsp *)&hdr;
int fd, ret;
fd = connect_to_sdog(s);
if (fd < 0) {
return false;
}
ret = do_req(fd, (SheepdogReq *)&hdr, s->name, &wlen, &rlen);
closesocket(fd);
if (ret) {
return false;
}
switch (rsp->result) {
case SD_RES_NO_VDI:
error_report("%s was already deleted", s->name);
/* fall through */
case SD_RES_SUCCESS:
break;
default:
error_report("%s, %s", sd_strerror(rsp->result), s->name);
return false;
}
return true;
}
/* /*
* Create a writable VDI from a snapshot * Create a writable VDI from a snapshot
*/ */
...@@ -1555,12 +1712,20 @@ static int sd_create_branch(BDRVSheepdogState *s) ...@@ -1555,12 +1712,20 @@ static int sd_create_branch(BDRVSheepdogState *s)
int ret, fd; int ret, fd;
uint32_t vid; uint32_t vid;
char *buf; char *buf;
bool deleted;
dprintf("%" PRIx32 " is snapshot.\n", s->inode.vdi_id); dprintf("%" PRIx32 " is snapshot.\n", s->inode.vdi_id);
buf = g_malloc(SD_INODE_SIZE); buf = g_malloc(SD_INODE_SIZE);
ret = do_sd_create(s, s->name, s->inode.vdi_size, s->inode.vdi_id, &vid, 1); /*
* Even If deletion fails, we will just create extra snapshot based on
* the workding VDI which was supposed to be deleted. So no need to
* false bail out.
*/
deleted = sd_delete(s);
ret = do_sd_create(s, s->name, s->inode.vdi_size, s->inode.vdi_id, &vid,
!deleted);
if (ret) { if (ret) {
goto out; goto out;
} }
...@@ -1610,10 +1775,10 @@ static int coroutine_fn sd_co_rw_vector(void *p) ...@@ -1610,10 +1775,10 @@ static int coroutine_fn sd_co_rw_vector(void *p)
{ {
SheepdogAIOCB *acb = p; SheepdogAIOCB *acb = p;
int ret = 0; int ret = 0;
unsigned long len, done = 0, total = acb->nb_sectors * SECTOR_SIZE; unsigned long len, done = 0, total = acb->nb_sectors * BDRV_SECTOR_SIZE;
unsigned long idx = acb->sector_num * SECTOR_SIZE / SD_DATA_OBJ_SIZE; unsigned long idx = acb->sector_num * BDRV_SECTOR_SIZE / SD_DATA_OBJ_SIZE;
uint64_t oid; uint64_t oid;
uint64_t offset = (acb->sector_num * SECTOR_SIZE) % SD_DATA_OBJ_SIZE; uint64_t offset = (acb->sector_num * BDRV_SECTOR_SIZE) % SD_DATA_OBJ_SIZE;
BDRVSheepdogState *s = acb->common.bs->opaque; BDRVSheepdogState *s = acb->common.bs->opaque;
SheepdogInode *inode = &s->inode; SheepdogInode *inode = &s->inode;
AIOReq *aio_req; AIOReq *aio_req;
...@@ -1662,6 +1827,15 @@ static int coroutine_fn sd_co_rw_vector(void *p) ...@@ -1662,6 +1827,15 @@ static int coroutine_fn sd_co_rw_vector(void *p)
flags = SD_FLAG_CMD_COW; flags = SD_FLAG_CMD_COW;
} }
break; break;
case AIOCB_DISCARD_OBJ:
/*
* We discard the object only when the whole object is
* 1) allocated 2) trimmed. Otherwise, simply skip it.
*/
if (len != SD_DATA_OBJ_SIZE || inode->data_vdi_id[idx] == 0) {
goto done;
}
break;
default: default:
break; break;
} }
...@@ -1723,7 +1897,7 @@ static coroutine_fn int sd_co_writev(BlockDriverState *bs, int64_t sector_num, ...@@ -1723,7 +1897,7 @@ static coroutine_fn int sd_co_writev(BlockDriverState *bs, int64_t sector_num,
int ret; int ret;
if (bs->growable && sector_num + nb_sectors > bs->total_sectors) { if (bs->growable && sector_num + nb_sectors > bs->total_sectors) {
ret = sd_truncate(bs, (sector_num + nb_sectors) * SECTOR_SIZE); ret = sd_truncate(bs, (sector_num + nb_sectors) * BDRV_SECTOR_SIZE);
if (ret < 0) { if (ret < 0) {
return ret; return ret;
} }
...@@ -1867,22 +2041,24 @@ cleanup: ...@@ -1867,22 +2041,24 @@ cleanup:
return ret; return ret;
} }
/*
* We implement rollback(loadvm) operation to the specified snapshot by
* 1) switch to the snapshot
* 2) rely on sd_create_branch to delete working VDI and
* 3) create a new working VDI based on the speicified snapshot
*/
static int sd_snapshot_goto(BlockDriverState *bs, const char *snapshot_id) static int sd_snapshot_goto(BlockDriverState *bs, const char *snapshot_id)
{ {
BDRVSheepdogState *s = bs->opaque; BDRVSheepdogState *s = bs->opaque;
BDRVSheepdogState *old_s; BDRVSheepdogState *old_s;
char vdi[SD_MAX_VDI_LEN], tag[SD_MAX_VDI_TAG_LEN]; char tag[SD_MAX_VDI_TAG_LEN];
char *buf = NULL;
uint32_t vid;
uint32_t snapid = 0; uint32_t snapid = 0;
int ret = 0, fd; int ret = 0;
old_s = g_malloc(sizeof(BDRVSheepdogState)); old_s = g_malloc(sizeof(BDRVSheepdogState));
memcpy(old_s, s, sizeof(BDRVSheepdogState)); memcpy(old_s, s, sizeof(BDRVSheepdogState));
pstrcpy(vdi, sizeof(vdi), s->name);
snapid = strtoul(snapshot_id, NULL, 10); snapid = strtoul(snapshot_id, NULL, 10);
if (snapid) { if (snapid) {
tag[0] = 0; tag[0] = 0;
...@@ -1890,30 +2066,11 @@ static int sd_snapshot_goto(BlockDriverState *bs, const char *snapshot_id) ...@@ -1890,30 +2066,11 @@ static int sd_snapshot_goto(BlockDriverState *bs, const char *snapshot_id)
pstrcpy(tag, sizeof(tag), s->name); pstrcpy(tag, sizeof(tag), s->name);
} }
ret = find_vdi_name(s, vdi, snapid, tag, &vid, 1); ret = reload_inode(s, snapid, tag);
if (ret) {
error_report("Failed to find_vdi_name");
goto out;
}
fd = connect_to_sdog(s);
if (fd < 0) {
ret = fd;
goto out;
}
buf = g_malloc(SD_INODE_SIZE);
ret = read_object(fd, buf, vid_to_vdi_oid(vid), s->inode.nr_copies,
SD_INODE_SIZE, 0, s->cache_flags);
closesocket(fd);
if (ret) { if (ret) {
goto out; goto out;
} }
memcpy(&s->inode, buf, sizeof(s->inode));
if (!s->inode.vm_state_size) { if (!s->inode.vm_state_size) {
error_report("Invalid snapshot"); error_report("Invalid snapshot");
ret = -ENOENT; ret = -ENOENT;
...@@ -1922,14 +2079,12 @@ static int sd_snapshot_goto(BlockDriverState *bs, const char *snapshot_id) ...@@ -1922,14 +2079,12 @@ static int sd_snapshot_goto(BlockDriverState *bs, const char *snapshot_id)
s->is_snapshot = true; s->is_snapshot = true;
g_free(buf);
g_free(old_s); g_free(old_s);
return 0; return 0;
out: out:
/* recover bdrv_sd_state */ /* recover bdrv_sd_state */
memcpy(s, old_s, sizeof(BDRVSheepdogState)); memcpy(s, old_s, sizeof(BDRVSheepdogState));
g_free(buf);
g_free(old_s); g_free(old_s);
error_report("failed to open. recover old bdrv_sd_state."); error_report("failed to open. recover old bdrv_sd_state.");
...@@ -2107,6 +2262,67 @@ static int sd_load_vmstate(BlockDriverState *bs, uint8_t *data, ...@@ -2107,6 +2262,67 @@ static int sd_load_vmstate(BlockDriverState *bs, uint8_t *data,
} }
static coroutine_fn int sd_co_discard(BlockDriverState *bs, int64_t sector_num,
int nb_sectors)
{
SheepdogAIOCB *acb;
QEMUIOVector dummy;
BDRVSheepdogState *s = bs->opaque;
int ret;
if (!s->discard_supported) {
return 0;
}
acb = sd_aio_setup(bs, &dummy, sector_num, nb_sectors);
acb->aiocb_type = AIOCB_DISCARD_OBJ;
acb->aio_done_func = sd_finish_aiocb;
ret = sd_co_rw_vector(acb);
if (ret <= 0) {
qemu_aio_release(acb);
return ret;
}
qemu_coroutine_yield();
return acb->ret;
}
static coroutine_fn int
sd_co_is_allocated(BlockDriverState *bs, int64_t sector_num, int nb_sectors,
int *pnum)
{
BDRVSheepdogState *s = bs->opaque;
SheepdogInode *inode = &s->inode;
unsigned long start = sector_num * BDRV_SECTOR_SIZE / SD_DATA_OBJ_SIZE,
end = DIV_ROUND_UP((sector_num + nb_sectors) *
BDRV_SECTOR_SIZE, SD_DATA_OBJ_SIZE);
unsigned long idx;
int ret = 1;
for (idx = start; idx < end; idx++) {
if (inode->data_vdi_id[idx] == 0) {
break;
}
}
if (idx == start) {
/* Get the longest length of unallocated sectors */
ret = 0;
for (idx = start + 1; idx < end; idx++) {
if (inode->data_vdi_id[idx] != 0) {
break;
}
}
}
*pnum = (idx - start) * SD_DATA_OBJ_SIZE / BDRV_SECTOR_SIZE;
if (*pnum > nb_sectors) {
*pnum = nb_sectors;
}
return ret;
}
static QEMUOptionParameter sd_create_options[] = { static QEMUOptionParameter sd_create_options[] = {
{ {
.name = BLOCK_OPT_SIZE, .name = BLOCK_OPT_SIZE,
...@@ -2139,6 +2355,8 @@ static BlockDriver bdrv_sheepdog = { ...@@ -2139,6 +2355,8 @@ static BlockDriver bdrv_sheepdog = {
.bdrv_co_readv = sd_co_readv, .bdrv_co_readv = sd_co_readv,
.bdrv_co_writev = sd_co_writev, .bdrv_co_writev = sd_co_writev,
.bdrv_co_flush_to_disk = sd_co_flush_to_disk, .bdrv_co_flush_to_disk = sd_co_flush_to_disk,
.bdrv_co_discard = sd_co_discard,
.bdrv_co_is_allocated = sd_co_is_allocated,
.bdrv_snapshot_create = sd_snapshot_create, .bdrv_snapshot_create = sd_snapshot_create,
.bdrv_snapshot_goto = sd_snapshot_goto, .bdrv_snapshot_goto = sd_snapshot_goto,
...@@ -2164,6 +2382,8 @@ static BlockDriver bdrv_sheepdog_tcp = { ...@@ -2164,6 +2382,8 @@ static BlockDriver bdrv_sheepdog_tcp = {
.bdrv_co_readv = sd_co_readv, .bdrv_co_readv = sd_co_readv,
.bdrv_co_writev = sd_co_writev, .bdrv_co_writev = sd_co_writev,
.bdrv_co_flush_to_disk = sd_co_flush_to_disk, .bdrv_co_flush_to_disk = sd_co_flush_to_disk,
.bdrv_co_discard = sd_co_discard,
.bdrv_co_is_allocated = sd_co_is_allocated,
.bdrv_snapshot_create = sd_snapshot_create, .bdrv_snapshot_create = sd_snapshot_create,
.bdrv_snapshot_goto = sd_snapshot_goto, .bdrv_snapshot_goto = sd_snapshot_goto,
...@@ -2189,6 +2409,8 @@ static BlockDriver bdrv_sheepdog_unix = { ...@@ -2189,6 +2409,8 @@ static BlockDriver bdrv_sheepdog_unix = {
.bdrv_co_readv = sd_co_readv, .bdrv_co_readv = sd_co_readv,
.bdrv_co_writev = sd_co_writev, .bdrv_co_writev = sd_co_writev,
.bdrv_co_flush_to_disk = sd_co_flush_to_disk, .bdrv_co_flush_to_disk = sd_co_flush_to_disk,
.bdrv_co_discard = sd_co_discard,
.bdrv_co_is_allocated = sd_co_is_allocated,
.bdrv_snapshot_create = sd_snapshot_create, .bdrv_snapshot_create = sd_snapshot_create,
.bdrv_snapshot_goto = sd_snapshot_goto, .bdrv_snapshot_goto = sd_snapshot_goto,
......
...@@ -1656,10 +1656,120 @@ QemuOptsList qemu_drive_opts = { ...@@ -1656,10 +1656,120 @@ QemuOptsList qemu_drive_opts = {
.name = "drive", .name = "drive",
.head = QTAILQ_HEAD_INITIALIZER(qemu_drive_opts.head), .head = QTAILQ_HEAD_INITIALIZER(qemu_drive_opts.head),
.desc = { .desc = {
/* {
* no elements => accept any params .name = "bus",
* validation will happen later .type = QEMU_OPT_NUMBER,
*/ .help = "bus number",
},{
.name = "unit",
.type = QEMU_OPT_NUMBER,
.help = "unit number (i.e. lun for scsi)",
},{
.name = "if",
.type = QEMU_OPT_STRING,
.help = "interface (ide, scsi, sd, mtd, floppy, pflash, virtio)",
},{
.name = "index",
.type = QEMU_OPT_NUMBER,
.help = "index number",
},{
.name = "cyls",
.type = QEMU_OPT_NUMBER,
.help = "number of cylinders (ide disk geometry)",
},{
.name = "heads",
.type = QEMU_OPT_NUMBER,
.help = "number of heads (ide disk geometry)",
},{
.name = "secs",
.type = QEMU_OPT_NUMBER,
.help = "number of sectors (ide disk geometry)",
},{
.name = "trans",
.type = QEMU_OPT_STRING,
.help = "chs translation (auto, lba. none)",
},{
.name = "media",
.type = QEMU_OPT_STRING,
.help = "media type (disk, cdrom)",
},{
.name = "snapshot",
.type = QEMU_OPT_BOOL,
.help = "enable/disable snapshot mode",
},{
.name = "file",
.type = QEMU_OPT_STRING,
.help = "disk image",
},{
.name = "discard",
.type = QEMU_OPT_STRING,
.help = "discard operation (ignore/off, unmap/on)",
},{
.name = "cache",
.type = QEMU_OPT_STRING,
.help = "host cache usage (none, writeback, writethrough, "
"directsync, unsafe)",
},{
.name = "aio",
.type = QEMU_OPT_STRING,
.help = "host AIO implementation (threads, native)",
},{
.name = "format",
.type = QEMU_OPT_STRING,
.help = "disk format (raw, qcow2, ...)",
},{
.name = "serial",
.type = QEMU_OPT_STRING,
.help = "disk serial number",
},{
.name = "rerror",
.type = QEMU_OPT_STRING,
.help = "read error action",
},{
.name = "werror",
.type = QEMU_OPT_STRING,
.help = "write error action",
},{
.name = "addr",
.type = QEMU_OPT_STRING,
.help = "pci address (virtio only)",
},{
.name = "readonly",
.type = QEMU_OPT_BOOL,
.help = "open drive file as read-only",
},{
.name = "iops",
.type = QEMU_OPT_NUMBER,
.help = "limit total I/O operations per second",
},{
.name = "iops_rd",
.type = QEMU_OPT_NUMBER,
.help = "limit read operations per second",
},{
.name = "iops_wr",
.type = QEMU_OPT_NUMBER,
.help = "limit write operations per second",
},{
.name = "bps",
.type = QEMU_OPT_NUMBER,
.help = "limit total bytes per second",
},{
.name = "bps_rd",
.type = QEMU_OPT_NUMBER,
.help = "limit read bytes per second",
},{
.name = "bps_wr",
.type = QEMU_OPT_NUMBER,
.help = "limit write bytes per second",
},{
.name = "copy-on-read",
.type = QEMU_OPT_BOOL,
.help = "copy read data from backing file into image file",
},{
.name = "boot",
.type = QEMU_OPT_BOOL,
.help = "(deprecated, ignored)",
},
{ /* end of list */ } { /* end of list */ }
}, },
}; };
...@@ -2364,35 +2364,19 @@ fi ...@@ -2364,35 +2364,19 @@ fi
########################################## ##########################################
# libssh2 probe # libssh2 probe
min_libssh2_version=1.2.8
if test "$libssh2" != "no" ; then if test "$libssh2" != "no" ; then
cat > $TMPC <<EOF if $pkg_config --atleast-version=$min_libssh2_version libssh2 >/dev/null 2>&1
#include <stdio.h> then
#include <libssh2.h>
#include <libssh2_sftp.h>
int main(void) {
LIBSSH2_SESSION *session;
session = libssh2_session_init ();
(void) libssh2_sftp_init (session);
return 0;
}
EOF
if $pkg_config libssh2 --modversion >/dev/null 2>&1; then
libssh2_cflags=`$pkg_config libssh2 --cflags` libssh2_cflags=`$pkg_config libssh2 --cflags`
libssh2_libs=`$pkg_config libssh2 --libs` libssh2_libs=`$pkg_config libssh2 --libs`
else
libssh2_cflags=
libssh2_libs="-lssh2"
fi
if compile_prog "$libssh2_cflags" "$libssh2_libs" ; then
libssh2=yes libssh2=yes
libs_tools="$libssh2_libs $libs_tools" libs_tools="$libssh2_libs $libs_tools"
libs_softmmu="$libssh2_libs $libs_softmmu" libs_softmmu="$libssh2_libs $libs_softmmu"
QEMU_CFLAGS="$QEMU_CFLAGS $libssh2_cflags" QEMU_CFLAGS="$QEMU_CFLAGS $libssh2_cflags"
else else
if test "$libssh2" = "yes" ; then if test "$libssh2" = "yes" ; then
feature_not_found "libssh2" error_exit "libssh2 >= $min_libssh2_version required for --enable-libssh2"
fi fi
libssh2=no libssh2=no
fi fi
......
...@@ -57,6 +57,6 @@ ...@@ -57,6 +57,6 @@
048 img auto quick 048 img auto quick
049 rw auto 049 rw auto
050 rw auto backing quick 050 rw auto backing quick
051 rw auto #051 rw auto
052 rw auto backing 052 rw auto backing
053 rw auto 053 rw auto
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册