Merge remote-tracking branch 'bonzini/nbd-next' into staging

* bonzini/nbd-next:
  nbd: obey FUA on reads
  nbd: do not include block_int.h
  nbd: do not block in nbd_wr_sync if no data at all is available
  nbd: consistently return negative errno values
  nbd: consistently check for <0 or >=0
  nbd: consistently use ssize_t
  nbd: avoid out of bounds access to recv_coroutine array
This commit is contained in:
Anthony Liguori 2012-04-23 09:58:01 -05:00
commit bec8eb8136
4 changed files with 212 additions and 159 deletions

View File

@ -150,11 +150,19 @@ static int nbd_have_request(void *opaque)
static void nbd_reply_ready(void *opaque) static void nbd_reply_ready(void *opaque)
{ {
BDRVNBDState *s = opaque; BDRVNBDState *s = opaque;
int i; uint64_t i;
int ret;
if (s->reply.handle == 0) { if (s->reply.handle == 0) {
/* No reply already in flight. Fetch a header. */ /* No reply already in flight. Fetch a header. It is possible
if (nbd_receive_reply(s->sock, &s->reply) < 0) { * that another thread has done the same thing in parallel, so
* the socket is not readable anymore.
*/
ret = nbd_receive_reply(s->sock, &s->reply);
if (ret == -EAGAIN) {
return;
}
if (ret < 0) {
s->reply.handle = 0; s->reply.handle = 0;
goto fail; goto fail;
} }
@ -164,6 +172,10 @@ static void nbd_reply_ready(void *opaque)
* handler acts as a synchronization point and ensures that only * handler acts as a synchronization point and ensures that only
* one coroutine is called until the reply finishes. */ * one coroutine is called until the reply finishes. */
i = HANDLE_TO_INDEX(s, s->reply.handle); i = HANDLE_TO_INDEX(s, s->reply.handle);
if (i >= MAX_NBD_REQUESTS) {
goto fail;
}
if (s->recv_coroutine[i]) { if (s->recv_coroutine[i]) {
qemu_coroutine_enter(s->recv_coroutine[i], NULL); qemu_coroutine_enter(s->recv_coroutine[i], NULL);
return; return;
@ -193,11 +205,10 @@ static int nbd_co_send_request(BDRVNBDState *s, struct nbd_request *request,
qemu_aio_set_fd_handler(s->sock, nbd_reply_ready, nbd_restart_write, qemu_aio_set_fd_handler(s->sock, nbd_reply_ready, nbd_restart_write,
nbd_have_request, NULL, s); nbd_have_request, NULL, s);
rc = nbd_send_request(s->sock, request); rc = nbd_send_request(s->sock, request);
if (rc != -1 && iov) { if (rc >= 0 && iov) {
ret = qemu_co_sendv(s->sock, iov, request->len, offset); ret = qemu_co_sendv(s->sock, iov, request->len, offset);
if (ret != request->len) { if (ret != request->len) {
errno = -EIO; return -EIO;
rc = -1;
} }
} }
qemu_aio_set_fd_handler(s->sock, nbd_reply_ready, NULL, qemu_aio_set_fd_handler(s->sock, nbd_reply_ready, NULL,
@ -256,7 +267,7 @@ static int nbd_establish_connection(BlockDriverState *bs)
} }
/* Failed to establish connection */ /* Failed to establish connection */
if (sock == -1) { if (sock < 0) {
logout("Failed to establish connection to NBD server\n"); logout("Failed to establish connection to NBD server\n");
return -errno; return -errno;
} }
@ -264,10 +275,10 @@ static int nbd_establish_connection(BlockDriverState *bs)
/* NBD handshake */ /* NBD handshake */
ret = nbd_receive_negotiate(sock, s->export_name, &s->nbdflags, &size, ret = nbd_receive_negotiate(sock, s->export_name, &s->nbdflags, &size,
&blocksize); &blocksize);
if (ret == -1) { if (ret < 0) {
logout("Failed to negotiate with the NBD server\n"); logout("Failed to negotiate with the NBD server\n");
closesocket(sock); closesocket(sock);
return -errno; return ret;
} }
/* Now that we're connected, set the socket to be non-blocking and /* Now that we're connected, set the socket to be non-blocking and
@ -327,14 +338,16 @@ static int nbd_co_readv_1(BlockDriverState *bs, int64_t sector_num,
BDRVNBDState *s = bs->opaque; BDRVNBDState *s = bs->opaque;
struct nbd_request request; struct nbd_request request;
struct nbd_reply reply; struct nbd_reply reply;
ssize_t ret;
request.type = NBD_CMD_READ; request.type = NBD_CMD_READ;
request.from = sector_num * 512; request.from = sector_num * 512;
request.len = nb_sectors * 512; request.len = nb_sectors * 512;
nbd_coroutine_start(s, &request); nbd_coroutine_start(s, &request);
if (nbd_co_send_request(s, &request, NULL, 0) == -1) { ret = nbd_co_send_request(s, &request, NULL, 0);
reply.error = errno; if (ret < 0) {
reply.error = -ret;
} else { } else {
nbd_co_receive_reply(s, &request, &reply, qiov->iov, offset); nbd_co_receive_reply(s, &request, &reply, qiov->iov, offset);
} }
@ -350,6 +363,7 @@ static int nbd_co_writev_1(BlockDriverState *bs, int64_t sector_num,
BDRVNBDState *s = bs->opaque; BDRVNBDState *s = bs->opaque;
struct nbd_request request; struct nbd_request request;
struct nbd_reply reply; struct nbd_reply reply;
ssize_t ret;
request.type = NBD_CMD_WRITE; request.type = NBD_CMD_WRITE;
if (!bdrv_enable_write_cache(bs) && (s->nbdflags & NBD_FLAG_SEND_FUA)) { if (!bdrv_enable_write_cache(bs) && (s->nbdflags & NBD_FLAG_SEND_FUA)) {
@ -360,8 +374,9 @@ static int nbd_co_writev_1(BlockDriverState *bs, int64_t sector_num,
request.len = nb_sectors * 512; request.len = nb_sectors * 512;
nbd_coroutine_start(s, &request); nbd_coroutine_start(s, &request);
if (nbd_co_send_request(s, &request, qiov->iov, offset) == -1) { ret = nbd_co_send_request(s, &request, qiov->iov, offset);
reply.error = errno; if (ret < 0) {
reply.error = -ret;
} else { } else {
nbd_co_receive_reply(s, &request, &reply, NULL, 0); nbd_co_receive_reply(s, &request, &reply, NULL, 0);
} }
@ -412,6 +427,7 @@ static int nbd_co_flush(BlockDriverState *bs)
BDRVNBDState *s = bs->opaque; BDRVNBDState *s = bs->opaque;
struct nbd_request request; struct nbd_request request;
struct nbd_reply reply; struct nbd_reply reply;
ssize_t ret;
if (!(s->nbdflags & NBD_FLAG_SEND_FLUSH)) { if (!(s->nbdflags & NBD_FLAG_SEND_FLUSH)) {
return 0; return 0;
@ -426,8 +442,9 @@ static int nbd_co_flush(BlockDriverState *bs)
request.len = 0; request.len = 0;
nbd_coroutine_start(s, &request); nbd_coroutine_start(s, &request);
if (nbd_co_send_request(s, &request, NULL, 0) == -1) { ret = nbd_co_send_request(s, &request, NULL, 0);
reply.error = errno; if (ret < 0) {
reply.error = -ret;
} else { } else {
nbd_co_receive_reply(s, &request, &reply, NULL, 0); nbd_co_receive_reply(s, &request, &reply, NULL, 0);
} }
@ -441,6 +458,7 @@ static int nbd_co_discard(BlockDriverState *bs, int64_t sector_num,
BDRVNBDState *s = bs->opaque; BDRVNBDState *s = bs->opaque;
struct nbd_request request; struct nbd_request request;
struct nbd_reply reply; struct nbd_reply reply;
ssize_t ret;
if (!(s->nbdflags & NBD_FLAG_SEND_TRIM)) { if (!(s->nbdflags & NBD_FLAG_SEND_TRIM)) {
return 0; return 0;
@ -450,8 +468,9 @@ static int nbd_co_discard(BlockDriverState *bs, int64_t sector_num,
request.len = nb_sectors * 512; request.len = nb_sectors * 512;
nbd_coroutine_start(s, &request); nbd_coroutine_start(s, &request);
if (nbd_co_send_request(s, &request, NULL, 0) == -1) { ret = nbd_co_send_request(s, &request, NULL, 0);
reply.error = errno; if (ret < 0) {
reply.error = -ret;
} else { } else {
nbd_co_receive_reply(s, &request, &reply, NULL, 0); nbd_co_receive_reply(s, &request, &reply, NULL, 0);
} }

267
nbd.c
View File

@ -18,7 +18,6 @@
#include "nbd.h" #include "nbd.h"
#include "block.h" #include "block.h"
#include "block_int.h"
#include "qemu-coroutine.h" #include "qemu-coroutine.h"
@ -78,12 +77,10 @@
/* That's all folks */ /* That's all folks */
#define read_sync(fd, buffer, size) nbd_wr_sync(fd, buffer, size, true) ssize_t nbd_wr_sync(int fd, void *buffer, size_t size, bool do_read)
#define write_sync(fd, buffer, size) nbd_wr_sync(fd, buffer, size, false)
size_t nbd_wr_sync(int fd, void *buffer, size_t size, bool do_read)
{ {
size_t offset = 0; size_t offset = 0;
int err;
if (qemu_in_coroutine()) { if (qemu_in_coroutine()) {
if (do_read) { if (do_read) {
@ -102,12 +99,16 @@ size_t nbd_wr_sync(int fd, void *buffer, size_t size, bool do_read)
len = send(fd, buffer + offset, size - offset, 0); len = send(fd, buffer + offset, size - offset, 0);
} }
if (len == -1) if (len < 0) {
errno = socket_error(); err = socket_error();
/* recoverable error */ /* recoverable error */
if (len == -1 && (errno == EAGAIN || errno == EINTR)) { if (err == EINTR || (offset > 0 && err == EAGAIN)) {
continue; continue;
}
/* unrecoverable error */
return -err;
} }
/* eof */ /* eof */
@ -115,17 +116,32 @@ size_t nbd_wr_sync(int fd, void *buffer, size_t size, bool do_read)
break; break;
} }
/* unrecoverable error */
if (len == -1) {
return 0;
}
offset += len; offset += len;
} }
return offset; return offset;
} }
static ssize_t read_sync(int fd, void *buffer, size_t size)
{
/* Sockets are kept in blocking mode in the negotiation phase. After
* that, a non-readable socket simply means that another thread stole
* our request/reply. Synchronization is done with recv_coroutine, so
* that this is coroutine-safe.
*/
return nbd_wr_sync(fd, buffer, size, true);
}
static ssize_t write_sync(int fd, void *buffer, size_t size)
{
int ret;
do {
/* For writes, we do expect the socket to be writable. */
ret = nbd_wr_sync(fd, buffer, size, false);
} while (ret == -EAGAIN);
return ret;
}
static void combine_addr(char *buf, size_t len, const char* address, static void combine_addr(char *buf, size_t len, const char* address,
uint16_t port) uint16_t port)
{ {
@ -193,6 +209,7 @@ int unix_socket_outgoing(const char *path)
static int nbd_send_negotiate(int csock, off_t size, uint32_t flags) static int nbd_send_negotiate(int csock, off_t size, uint32_t flags)
{ {
char buf[8 + 8 + 8 + 128]; char buf[8 + 8 + 8 + 128];
int rc;
/* Negotiate /* Negotiate
[ 0 .. 7] passwd ("NBDMAGIC") [ 0 .. 7] passwd ("NBDMAGIC")
@ -202,6 +219,9 @@ static int nbd_send_negotiate(int csock, off_t size, uint32_t flags)
[28 .. 151] reserved (0) [28 .. 151] reserved (0)
*/ */
socket_set_block(csock);
rc = -EINVAL;
TRACE("Beginning negotiation."); TRACE("Beginning negotiation.");
memcpy(buf, "NBDMAGIC", 8); memcpy(buf, "NBDMAGIC", 8);
cpu_to_be64w((uint64_t*)(buf + 8), 0x00420281861253LL); cpu_to_be64w((uint64_t*)(buf + 8), 0x00420281861253LL);
@ -213,13 +233,14 @@ static int nbd_send_negotiate(int csock, off_t size, uint32_t flags)
if (write_sync(csock, buf, sizeof(buf)) != sizeof(buf)) { if (write_sync(csock, buf, sizeof(buf)) != sizeof(buf)) {
LOG("write failed"); LOG("write failed");
errno = EINVAL; goto fail;
return -1;
} }
TRACE("Negotiation succeeded."); TRACE("Negotiation succeeded.");
rc = 0;
return 0; fail:
socket_set_nonblock(csock);
return rc;
} }
int nbd_receive_negotiate(int csock, const char *name, uint32_t *flags, int nbd_receive_negotiate(int csock, const char *name, uint32_t *flags,
@ -228,20 +249,22 @@ int nbd_receive_negotiate(int csock, const char *name, uint32_t *flags,
char buf[256]; char buf[256];
uint64_t magic, s; uint64_t magic, s;
uint16_t tmp; uint16_t tmp;
int rc;
TRACE("Receiving negotiation."); TRACE("Receiving negotiation.");
socket_set_block(csock);
rc = -EINVAL;
if (read_sync(csock, buf, 8) != 8) { if (read_sync(csock, buf, 8) != 8) {
LOG("read failed"); LOG("read failed");
errno = EINVAL; goto fail;
return -1;
} }
buf[8] = '\0'; buf[8] = '\0';
if (strlen(buf) == 0) { if (strlen(buf) == 0) {
LOG("server connection closed"); LOG("server connection closed");
errno = EINVAL; goto fail;
return -1;
} }
TRACE("Magic is %c%c%c%c%c%c%c%c", TRACE("Magic is %c%c%c%c%c%c%c%c",
@ -256,14 +279,12 @@ int nbd_receive_negotiate(int csock, const char *name, uint32_t *flags,
if (memcmp(buf, "NBDMAGIC", 8) != 0) { if (memcmp(buf, "NBDMAGIC", 8) != 0) {
LOG("Invalid magic received"); LOG("Invalid magic received");
errno = EINVAL; goto fail;
return -1;
} }
if (read_sync(csock, &magic, sizeof(magic)) != sizeof(magic)) { if (read_sync(csock, &magic, sizeof(magic)) != sizeof(magic)) {
LOG("read failed"); LOG("read failed");
errno = EINVAL; goto fail;
return -1;
} }
magic = be64_to_cpu(magic); magic = be64_to_cpu(magic);
TRACE("Magic is 0x%" PRIx64, magic); TRACE("Magic is 0x%" PRIx64, magic);
@ -276,61 +297,52 @@ int nbd_receive_negotiate(int csock, const char *name, uint32_t *flags,
TRACE("Checking magic (opts_magic)"); TRACE("Checking magic (opts_magic)");
if (magic != 0x49484156454F5054LL) { if (magic != 0x49484156454F5054LL) {
LOG("Bad magic received"); LOG("Bad magic received");
errno = EINVAL; goto fail;
return -1;
} }
if (read_sync(csock, &tmp, sizeof(tmp)) != sizeof(tmp)) { if (read_sync(csock, &tmp, sizeof(tmp)) != sizeof(tmp)) {
LOG("flags read failed"); LOG("flags read failed");
errno = EINVAL; goto fail;
return -1;
} }
*flags = be16_to_cpu(tmp) << 16; *flags = be16_to_cpu(tmp) << 16;
/* reserved for future use */ /* reserved for future use */
if (write_sync(csock, &reserved, sizeof(reserved)) != if (write_sync(csock, &reserved, sizeof(reserved)) !=
sizeof(reserved)) { sizeof(reserved)) {
LOG("write failed (reserved)"); LOG("write failed (reserved)");
errno = EINVAL; goto fail;
return -1;
} }
/* write the export name */ /* write the export name */
magic = cpu_to_be64(magic); magic = cpu_to_be64(magic);
if (write_sync(csock, &magic, sizeof(magic)) != sizeof(magic)) { if (write_sync(csock, &magic, sizeof(magic)) != sizeof(magic)) {
LOG("write failed (magic)"); LOG("write failed (magic)");
errno = EINVAL; goto fail;
return -1;
} }
opt = cpu_to_be32(NBD_OPT_EXPORT_NAME); opt = cpu_to_be32(NBD_OPT_EXPORT_NAME);
if (write_sync(csock, &opt, sizeof(opt)) != sizeof(opt)) { if (write_sync(csock, &opt, sizeof(opt)) != sizeof(opt)) {
LOG("write failed (opt)"); LOG("write failed (opt)");
errno = EINVAL; goto fail;
return -1;
} }
namesize = cpu_to_be32(strlen(name)); namesize = cpu_to_be32(strlen(name));
if (write_sync(csock, &namesize, sizeof(namesize)) != if (write_sync(csock, &namesize, sizeof(namesize)) !=
sizeof(namesize)) { sizeof(namesize)) {
LOG("write failed (namesize)"); LOG("write failed (namesize)");
errno = EINVAL; goto fail;
return -1;
} }
if (write_sync(csock, (char*)name, strlen(name)) != strlen(name)) { if (write_sync(csock, (char*)name, strlen(name)) != strlen(name)) {
LOG("write failed (name)"); LOG("write failed (name)");
errno = EINVAL; goto fail;
return -1;
} }
} else { } else {
TRACE("Checking magic (cli_magic)"); TRACE("Checking magic (cli_magic)");
if (magic != 0x00420281861253LL) { if (magic != 0x00420281861253LL) {
LOG("Bad magic received"); LOG("Bad magic received");
errno = EINVAL; goto fail;
return -1;
} }
} }
if (read_sync(csock, &s, sizeof(s)) != sizeof(s)) { if (read_sync(csock, &s, sizeof(s)) != sizeof(s)) {
LOG("read failed"); LOG("read failed");
errno = EINVAL; goto fail;
return -1;
} }
*size = be64_to_cpu(s); *size = be64_to_cpu(s);
*blocksize = 1024; *blocksize = 1024;
@ -339,24 +351,25 @@ int nbd_receive_negotiate(int csock, const char *name, uint32_t *flags,
if (!name) { if (!name) {
if (read_sync(csock, flags, sizeof(*flags)) != sizeof(*flags)) { if (read_sync(csock, flags, sizeof(*flags)) != sizeof(*flags)) {
LOG("read failed (flags)"); LOG("read failed (flags)");
errno = EINVAL; goto fail;
return -1;
} }
*flags = be32_to_cpup(flags); *flags = be32_to_cpup(flags);
} else { } else {
if (read_sync(csock, &tmp, sizeof(tmp)) != sizeof(tmp)) { if (read_sync(csock, &tmp, sizeof(tmp)) != sizeof(tmp)) {
LOG("read failed (tmp)"); LOG("read failed (tmp)");
errno = EINVAL; goto fail;
return -1;
} }
*flags |= be32_to_cpu(tmp); *flags |= be32_to_cpu(tmp);
} }
if (read_sync(csock, &buf, 124) != 124) { if (read_sync(csock, &buf, 124) != 124) {
LOG("read failed (buf)"); LOG("read failed (buf)");
errno = EINVAL; goto fail;
return -1;
} }
return 0; rc = 0;
fail:
socket_set_nonblock(csock);
return rc;
} }
#ifdef __linux__ #ifdef __linux__
@ -364,29 +377,26 @@ int nbd_init(int fd, int csock, uint32_t flags, off_t size, size_t blocksize)
{ {
TRACE("Setting NBD socket"); TRACE("Setting NBD socket");
if (ioctl(fd, NBD_SET_SOCK, csock) == -1) { if (ioctl(fd, NBD_SET_SOCK, csock) < 0) {
int serrno = errno; int serrno = errno;
LOG("Failed to set NBD socket"); LOG("Failed to set NBD socket");
errno = serrno; return -serrno;
return -1;
} }
TRACE("Setting block size to %lu", (unsigned long)blocksize); TRACE("Setting block size to %lu", (unsigned long)blocksize);
if (ioctl(fd, NBD_SET_BLKSIZE, blocksize) == -1) { if (ioctl(fd, NBD_SET_BLKSIZE, blocksize) < 0) {
int serrno = errno; int serrno = errno;
LOG("Failed setting NBD block size"); LOG("Failed setting NBD block size");
errno = serrno; return -serrno;
return -1;
} }
TRACE("Setting size to %zd block(s)", (size_t)(size / blocksize)); TRACE("Setting size to %zd block(s)", (size_t)(size / blocksize));
if (ioctl(fd, NBD_SET_SIZE_BLOCKS, size / blocksize) == -1) { if (ioctl(fd, NBD_SET_SIZE_BLOCKS, size / blocksize) < 0) {
int serrno = errno; int serrno = errno;
LOG("Failed setting size (in blocks)"); LOG("Failed setting size (in blocks)");
errno = serrno; return -serrno;
return -1;
} }
if (flags & NBD_FLAG_READ_ONLY) { if (flags & NBD_FLAG_READ_ONLY) {
@ -396,8 +406,7 @@ int nbd_init(int fd, int csock, uint32_t flags, off_t size, size_t blocksize)
if (ioctl(fd, BLKROSET, (unsigned long) &read_only) < 0) { if (ioctl(fd, BLKROSET, (unsigned long) &read_only) < 0) {
int serrno = errno; int serrno = errno;
LOG("Failed setting read-only attribute"); LOG("Failed setting read-only attribute");
errno = serrno; return -serrno;
return -1;
} }
} }
@ -405,8 +414,7 @@ int nbd_init(int fd, int csock, uint32_t flags, off_t size, size_t blocksize)
&& errno != ENOTTY) { && errno != ENOTTY) {
int serrno = errno; int serrno = errno;
LOG("Failed setting flags"); LOG("Failed setting flags");
errno = serrno; return -serrno;
return -1;
} }
TRACE("Negotiation ended"); TRACE("Negotiation ended");
@ -430,7 +438,7 @@ int nbd_client(int fd)
TRACE("Doing NBD loop"); TRACE("Doing NBD loop");
ret = ioctl(fd, NBD_DO_IT); ret = ioctl(fd, NBD_DO_IT);
if (ret == -1 && errno == EPIPE) { if (ret < 0 && errno == EPIPE) {
/* NBD_DO_IT normally returns EPIPE when someone has disconnected /* NBD_DO_IT normally returns EPIPE when someone has disconnected
* the socket via NBD_DISCONNECT. We do not want to return 1 in * the socket via NBD_DISCONNECT. We do not want to return 1 in
* that case. * that case.
@ -453,26 +461,24 @@ int nbd_client(int fd)
#else #else
int nbd_init(int fd, int csock, uint32_t flags, off_t size, size_t blocksize) int nbd_init(int fd, int csock, uint32_t flags, off_t size, size_t blocksize)
{ {
errno = ENOTSUP; return -ENOTSUP;
return -1;
} }
int nbd_disconnect(int fd) int nbd_disconnect(int fd)
{ {
errno = ENOTSUP; return -ENOTSUP;
return -1;
} }
int nbd_client(int fd) int nbd_client(int fd)
{ {
errno = ENOTSUP; return -ENOTSUP;
return -1;
} }
#endif #endif
int nbd_send_request(int csock, struct nbd_request *request) ssize_t nbd_send_request(int csock, struct nbd_request *request)
{ {
uint8_t buf[4 + 4 + 8 + 8 + 4]; uint8_t buf[4 + 4 + 8 + 8 + 4];
ssize_t ret;
cpu_to_be32w((uint32_t*)buf, NBD_REQUEST_MAGIC); cpu_to_be32w((uint32_t*)buf, NBD_REQUEST_MAGIC);
cpu_to_be32w((uint32_t*)(buf + 4), request->type); cpu_to_be32w((uint32_t*)(buf + 4), request->type);
@ -484,23 +490,32 @@ int nbd_send_request(int csock, struct nbd_request *request)
"{ .from = %" PRIu64", .len = %u, .handle = %" PRIu64", .type=%i}", "{ .from = %" PRIu64", .len = %u, .handle = %" PRIu64", .type=%i}",
request->from, request->len, request->handle, request->type); request->from, request->len, request->handle, request->type);
if (write_sync(csock, buf, sizeof(buf)) != sizeof(buf)) { ret = write_sync(csock, buf, sizeof(buf));
if (ret < 0) {
return ret;
}
if (ret != sizeof(buf)) {
LOG("writing to socket failed"); LOG("writing to socket failed");
errno = EINVAL; return -EINVAL;
return -1;
} }
return 0; return 0;
} }
static int nbd_receive_request(int csock, struct nbd_request *request) static ssize_t nbd_receive_request(int csock, struct nbd_request *request)
{ {
uint8_t buf[4 + 4 + 8 + 8 + 4]; uint8_t buf[4 + 4 + 8 + 8 + 4];
uint32_t magic; uint32_t magic;
ssize_t ret;
if (read_sync(csock, buf, sizeof(buf)) != sizeof(buf)) { ret = read_sync(csock, buf, sizeof(buf));
if (ret < 0) {
return ret;
}
if (ret != sizeof(buf)) {
LOG("read failed"); LOG("read failed");
errno = EINVAL; return -EINVAL;
return -1;
} }
/* Request /* Request
@ -523,23 +538,25 @@ static int nbd_receive_request(int csock, struct nbd_request *request)
if (magic != NBD_REQUEST_MAGIC) { if (magic != NBD_REQUEST_MAGIC) {
LOG("invalid magic (got 0x%x)", magic); LOG("invalid magic (got 0x%x)", magic);
errno = EINVAL; return -EINVAL;
return -1;
} }
return 0; return 0;
} }
int nbd_receive_reply(int csock, struct nbd_reply *reply) ssize_t nbd_receive_reply(int csock, struct nbd_reply *reply)
{ {
uint8_t buf[NBD_REPLY_SIZE]; uint8_t buf[NBD_REPLY_SIZE];
uint32_t magic; uint32_t magic;
ssize_t ret;
memset(buf, 0xAA, sizeof(buf)); ret = read_sync(csock, buf, sizeof(buf));
if (ret < 0) {
return ret;
}
if (read_sync(csock, buf, sizeof(buf)) != sizeof(buf)) { if (ret != sizeof(buf)) {
LOG("read failed"); LOG("read failed");
errno = EINVAL; return -EINVAL;
return -1;
} }
/* Reply /* Reply
@ -558,15 +575,15 @@ int nbd_receive_reply(int csock, struct nbd_reply *reply)
if (magic != NBD_REPLY_MAGIC) { if (magic != NBD_REPLY_MAGIC) {
LOG("invalid magic (got 0x%x)", magic); LOG("invalid magic (got 0x%x)", magic);
errno = EINVAL; return -EINVAL;
return -1;
} }
return 0; return 0;
} }
static int nbd_send_reply(int csock, struct nbd_reply *reply) static ssize_t nbd_send_reply(int csock, struct nbd_reply *reply)
{ {
uint8_t buf[4 + 4 + 8]; uint8_t buf[4 + 4 + 8];
ssize_t ret;
/* Reply /* Reply
[ 0 .. 3] magic (NBD_REPLY_MAGIC) [ 0 .. 3] magic (NBD_REPLY_MAGIC)
@ -579,10 +596,14 @@ static int nbd_send_reply(int csock, struct nbd_reply *reply)
TRACE("Sending response to client"); TRACE("Sending response to client");
if (write_sync(csock, buf, sizeof(buf)) != sizeof(buf)) { ret = write_sync(csock, buf, sizeof(buf));
if (ret < 0) {
return ret;
}
if (ret != sizeof(buf)) {
LOG("writing to socket failed"); LOG("writing to socket failed");
errno = EINVAL; return -EINVAL;
return -1;
} }
return 0; return 0;
} }
@ -681,7 +702,7 @@ NBDExport *nbd_export_new(BlockDriverState *bs, off_t dev_offset,
exp->bs = bs; exp->bs = bs;
exp->dev_offset = dev_offset; exp->dev_offset = dev_offset;
exp->nbdflags = nbdflags; exp->nbdflags = nbdflags;
exp->size = size == -1 ? exp->bs->total_sectors * 512 : size; exp->size = size == -1 ? bdrv_getlength(bs) : size;
return exp; return exp;
} }
@ -702,12 +723,12 @@ static int nbd_can_read(void *opaque);
static void nbd_read(void *opaque); static void nbd_read(void *opaque);
static void nbd_restart_write(void *opaque); static void nbd_restart_write(void *opaque);
static int nbd_co_send_reply(NBDRequest *req, struct nbd_reply *reply, static ssize_t nbd_co_send_reply(NBDRequest *req, struct nbd_reply *reply,
int len) int len)
{ {
NBDClient *client = req->client; NBDClient *client = req->client;
int csock = client->sock; int csock = client->sock;
int rc, ret; ssize_t rc, ret;
qemu_co_mutex_lock(&client->send_lock); qemu_co_mutex_lock(&client->send_lock);
qemu_set_fd_handler2(csock, nbd_can_read, nbd_read, qemu_set_fd_handler2(csock, nbd_can_read, nbd_read,
@ -716,22 +737,15 @@ static int nbd_co_send_reply(NBDRequest *req, struct nbd_reply *reply,
if (!len) { if (!len) {
rc = nbd_send_reply(csock, reply); rc = nbd_send_reply(csock, reply);
if (rc == -1) {
rc = -errno;
}
} else { } else {
socket_set_cork(csock, 1); socket_set_cork(csock, 1);
rc = nbd_send_reply(csock, reply); rc = nbd_send_reply(csock, reply);
if (rc != -1) { if (rc >= 0) {
ret = qemu_co_send(csock, req->data, len); ret = qemu_co_send(csock, req->data, len);
if (ret != len) { if (ret != len) {
errno = EIO; rc = -EIO;
rc = -1;
} }
} }
if (rc == -1) {
rc = -errno;
}
socket_set_cork(csock, 0); socket_set_cork(csock, 0);
} }
@ -741,15 +755,18 @@ static int nbd_co_send_reply(NBDRequest *req, struct nbd_reply *reply,
return rc; return rc;
} }
static int nbd_co_receive_request(NBDRequest *req, struct nbd_request *request) static ssize_t nbd_co_receive_request(NBDRequest *req, struct nbd_request *request)
{ {
NBDClient *client = req->client; NBDClient *client = req->client;
int csock = client->sock; int csock = client->sock;
int rc; ssize_t rc;
client->recv_coroutine = qemu_coroutine_self(); client->recv_coroutine = qemu_coroutine_self();
if (nbd_receive_request(csock, request) == -1) { rc = nbd_receive_request(csock, request);
rc = -EIO; if (rc < 0) {
if (rc != -EAGAIN) {
rc = -EIO;
}
goto out; goto out;
} }
@ -792,11 +809,14 @@ static void nbd_trip(void *opaque)
NBDExport *exp = client->exp; NBDExport *exp = client->exp;
struct nbd_request request; struct nbd_request request;
struct nbd_reply reply; struct nbd_reply reply;
int ret; ssize_t ret;
TRACE("Reading request."); TRACE("Reading request.");
ret = nbd_co_receive_request(req, &request); ret = nbd_co_receive_request(req, &request);
if (ret == -EAGAIN) {
goto done;
}
if (ret == -EIO) { if (ret == -EIO) {
goto out; goto out;
} }
@ -822,6 +842,15 @@ static void nbd_trip(void *opaque)
case NBD_CMD_READ: case NBD_CMD_READ:
TRACE("Request type is READ"); TRACE("Request type is READ");
if (request.type & NBD_CMD_FLAG_FUA) {
ret = bdrv_co_flush(exp->bs);
if (ret < 0) {
LOG("flush failed");
reply.error = -ret;
goto error_reply;
}
}
ret = bdrv_read(exp->bs, (request.from + exp->dev_offset) / 512, ret = bdrv_read(exp->bs, (request.from + exp->dev_offset) / 512,
req->data, request.len / 512); req->data, request.len / 512);
if (ret < 0) { if (ret < 0) {
@ -862,8 +891,9 @@ static void nbd_trip(void *opaque)
} }
} }
if (nbd_co_send_reply(req, &reply, 0) < 0) if (nbd_co_send_reply(req, &reply, 0) < 0) {
goto out; goto out;
}
break; break;
case NBD_CMD_DISC: case NBD_CMD_DISC:
TRACE("Request type is DISCONNECT"); TRACE("Request type is DISCONNECT");
@ -877,9 +907,9 @@ static void nbd_trip(void *opaque)
LOG("flush failed"); LOG("flush failed");
reply.error = -ret; reply.error = -ret;
} }
if (nbd_co_send_reply(req, &reply, 0) < 0) {
if (nbd_co_send_reply(req, &reply, 0) < 0)
goto out; goto out;
}
break; break;
case NBD_CMD_TRIM: case NBD_CMD_TRIM:
TRACE("Request type is TRIM"); TRACE("Request type is TRIM");
@ -889,21 +919,24 @@ static void nbd_trip(void *opaque)
LOG("discard failed"); LOG("discard failed");
reply.error = -ret; reply.error = -ret;
} }
if (nbd_co_send_reply(req, &reply, 0) < 0) if (nbd_co_send_reply(req, &reply, 0) < 0) {
goto out; goto out;
}
break; break;
default: default:
LOG("invalid request type (%u) received", request.type); LOG("invalid request type (%u) received", request.type);
invalid_request: invalid_request:
reply.error = -EINVAL; reply.error = -EINVAL;
error_reply: error_reply:
if (nbd_co_send_reply(req, &reply, 0) == -1) if (nbd_co_send_reply(req, &reply, 0) < 0) {
goto out; goto out;
}
break; break;
} }
TRACE("Request/Reply complete"); TRACE("Request/Reply complete");
done:
nbd_request_put(req); nbd_request_put(req);
return; return;
@ -941,7 +974,7 @@ NBDClient *nbd_client_new(NBDExport *exp, int csock,
void (*close)(NBDClient *)) void (*close)(NBDClient *))
{ {
NBDClient *client; NBDClient *client;
if (nbd_send_negotiate(csock, exp->size, exp->nbdflags) == -1) { if (nbd_send_negotiate(csock, exp->size, exp->nbdflags) < 0) {
return NULL; return NULL;
} }
client = g_malloc0(sizeof(NBDClient)); client = g_malloc0(sizeof(NBDClient));

6
nbd.h
View File

@ -59,7 +59,7 @@ enum {
#define NBD_BUFFER_SIZE (1024*1024) #define NBD_BUFFER_SIZE (1024*1024)
size_t nbd_wr_sync(int fd, void *buffer, size_t size, bool do_read); ssize_t nbd_wr_sync(int fd, void *buffer, size_t size, bool do_read);
int tcp_socket_outgoing(const char *address, uint16_t port); int tcp_socket_outgoing(const char *address, uint16_t port);
int tcp_socket_incoming(const char *address, uint16_t port); int tcp_socket_incoming(const char *address, uint16_t port);
int tcp_socket_outgoing_spec(const char *address_and_port); int tcp_socket_outgoing_spec(const char *address_and_port);
@ -70,8 +70,8 @@ int unix_socket_incoming(const char *path);
int nbd_receive_negotiate(int csock, const char *name, uint32_t *flags, int nbd_receive_negotiate(int csock, const char *name, uint32_t *flags,
off_t *size, size_t *blocksize); off_t *size, size_t *blocksize);
int nbd_init(int fd, int csock, uint32_t flags, off_t size, size_t blocksize); int nbd_init(int fd, int csock, uint32_t flags, off_t size, size_t blocksize);
int nbd_send_request(int csock, struct nbd_request *request); ssize_t nbd_send_request(int csock, struct nbd_request *request);
int nbd_receive_reply(int csock, struct nbd_reply *reply); ssize_t nbd_receive_reply(int csock, struct nbd_reply *reply);
int nbd_client(int fd); int nbd_client(int fd);
int nbd_disconnect(int fd); int nbd_disconnect(int fd);

View File

@ -17,7 +17,7 @@
*/ */
#include "qemu-common.h" #include "qemu-common.h"
#include "block_int.h" #include "block.h"
#include "nbd.h" #include "nbd.h"
#include <stdarg.h> #include <stdarg.h>
@ -126,8 +126,7 @@ static int find_partition(BlockDriverState *bs, int partition,
} }
if (data[510] != 0x55 || data[511] != 0xaa) { if (data[510] != 0x55 || data[511] != 0xaa) {
errno = -EINVAL; return -EINVAL;
return -1;
} }
for (i = 0; i < 4; i++) { for (i = 0; i < 4; i++) {
@ -165,8 +164,7 @@ static int find_partition(BlockDriverState *bs, int partition,
} }
} }
errno = -ENOENT; return -ENOENT;
return -1;
} }
static void termsig_handler(int signum) static void termsig_handler(int signum)
@ -186,7 +184,7 @@ static void *show_parts(void *arg)
* modprobe nbd max_part=63 * modprobe nbd max_part=63
*/ */
nbd = open(device, O_RDWR); nbd = open(device, O_RDWR);
if (nbd != -1) { if (nbd >= 0) {
close(nbd); close(nbd);
} }
return NULL; return NULL;
@ -203,25 +201,25 @@ static void *nbd_client_thread(void *arg)
pthread_t show_parts_thread; pthread_t show_parts_thread;
sock = unix_socket_outgoing(sockpath); sock = unix_socket_outgoing(sockpath);
if (sock == -1) { if (sock < 0) {
goto out; goto out;
} }
ret = nbd_receive_negotiate(sock, NULL, &nbdflags, ret = nbd_receive_negotiate(sock, NULL, &nbdflags,
&size, &blocksize); &size, &blocksize);
if (ret == -1) { if (ret < 0) {
goto out; goto out;
} }
fd = open(device, O_RDWR); fd = open(device, O_RDWR);
if (fd == -1) { if (fd < 0) {
/* Linux-only, we can use %m in printf. */ /* Linux-only, we can use %m in printf. */
fprintf(stderr, "Failed to open %s: %m", device); fprintf(stderr, "Failed to open %s: %m", device);
goto out; goto out;
} }
ret = nbd_init(fd, sock, nbdflags, size, blocksize); ret = nbd_init(fd, sock, nbdflags, size, blocksize);
if (ret == -1) { if (ret < 0) {
goto out; goto out;
} }
@ -268,7 +266,7 @@ static void nbd_accept(void *opaque)
int fd = accept(server_fd, (struct sockaddr *)&addr, &addr_len); int fd = accept(server_fd, (struct sockaddr *)&addr, &addr_len);
nbd_started = true; nbd_started = true;
if (fd != -1 && nbd_client_new(exp, fd, nbd_client_closed)) { if (fd >= 0 && nbd_client_new(exp, fd, nbd_client_closed)) {
nb_fds++; nb_fds++;
} }
} }
@ -410,9 +408,9 @@ int main(int argc, char **argv)
if (disconnect) { if (disconnect) {
fd = open(argv[optind], O_RDWR); fd = open(argv[optind], O_RDWR);
if (fd == -1) if (fd < 0) {
err(EXIT_FAILURE, "Cannot open %s", argv[optind]); err(EXIT_FAILURE, "Cannot open %s", argv[optind]);
}
nbd_disconnect(fd); nbd_disconnect(fd);
close(fd); close(fd);
@ -427,7 +425,7 @@ int main(int argc, char **argv)
pid_t pid; pid_t pid;
int ret; int ret;
if (qemu_pipe(stderr_fd) == -1) { if (qemu_pipe(stderr_fd) < 0) {
err(EXIT_FAILURE, "Error setting up communication pipe"); err(EXIT_FAILURE, "Error setting up communication pipe");
} }
@ -441,7 +439,7 @@ int main(int argc, char **argv)
/* Temporarily redirect stderr to the parent's pipe... */ /* Temporarily redirect stderr to the parent's pipe... */
dup2(stderr_fd[1], STDERR_FILENO); dup2(stderr_fd[1], STDERR_FILENO);
if (ret == -1) { if (ret < 0) {
err(EXIT_FAILURE, "Failed to daemonize"); err(EXIT_FAILURE, "Failed to daemonize");
} }
@ -459,11 +457,11 @@ int main(int argc, char **argv)
while ((ret = read(stderr_fd[0], buf, 1024)) > 0) { while ((ret = read(stderr_fd[0], buf, 1024)) > 0) {
errors = true; errors = true;
ret = qemu_write_full(STDERR_FILENO, buf, ret); ret = qemu_write_full(STDERR_FILENO, buf, ret);
if (ret == -1) { if (ret < 0) {
exit(EXIT_FAILURE); exit(EXIT_FAILURE);
} }
} }
if (ret == -1) { if (ret < 0) {
err(EXIT_FAILURE, "Cannot read from daemon"); err(EXIT_FAILURE, "Cannot read from daemon");
} }
@ -489,11 +487,14 @@ int main(int argc, char **argv)
err(EXIT_FAILURE, "Failed to bdrv_open '%s'", argv[optind]); err(EXIT_FAILURE, "Failed to bdrv_open '%s'", argv[optind]);
} }
fd_size = bs->total_sectors * 512; fd_size = bdrv_getlength(bs);
if (partition != -1 && if (partition != -1) {
find_partition(bs, partition, &dev_offset, &fd_size)) { ret = find_partition(bs, partition, &dev_offset, &fd_size);
err(EXIT_FAILURE, "Could not find partition %d", partition); if (ret < 0) {
errno = -ret;
err(EXIT_FAILURE, "Could not find partition %d", partition);
}
} }
exp = nbd_export_new(bs, dev_offset, fd_size, nbdflags); exp = nbd_export_new(bs, dev_offset, fd_size, nbdflags);
@ -504,7 +505,7 @@ int main(int argc, char **argv)
fd = tcp_socket_incoming(bindto, port); fd = tcp_socket_incoming(bindto, port);
} }
if (fd == -1) { if (fd < 0) {
return 1; return 1;
} }