/* * buse - block-device userspace extensions * Copyright (C) 2013 Adam Cozzette * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License along * with this program; if not, write to the Free Software Foundation, Inc., * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. */ #include #include #include #include #include #include #include #include #include #include #include #include #include "buse.h" /* * These helper functions were taken from cliserv.h in the nbd distribution. */ #ifdef WORDS_BIGENDIAN u_int64_t ntohll(u_int64_t a) { return a; } #else u_int64_t ntohll(u_int64_t a) { u_int32_t lo = a & 0xffffffff; u_int32_t hi = a >> 32U; lo = ntohl(lo); hi = ntohl(hi); return ((u_int64_t) lo) << 32U | hi; } #endif #define htonll ntohll static int read_all(int fd, void *buf, size_t count) { int bytes_read; while (count > 0) { bytes_read = read(fd, buf, count); assert(bytes_read > 0); buf = (char *)buf + bytes_read; count -= bytes_read; } assert(count == 0); return 0; } static int write_all(int fd, const void *buf, size_t count) { int bytes_written; while (count > 0) { bytes_written = write(fd, buf, count); assert(bytes_written > 0); buf = (char *)buf + bytes_written; count -= bytes_written; } assert(count == 0); return 0; } int buse_main(int argc, char *argv[], const struct buse_operations *aop, void *userdata) { int sp[2]; int nbd, sk, err, tmp_fd; u_int64_t from; u_int32_t len, bytes_read; char *dev_file; struct nbd_request request; struct nbd_reply reply; void *chunk; (void) userdata; assert(argc == 3); dev_file = argv[2]; assert(!socketpair(AF_UNIX, SOCK_STREAM, 0, sp)); nbd = open(dev_file, O_RDWR); assert(nbd != -1); assert(ioctl(nbd, NBD_SET_SIZE, aop->size) != -1); assert(ioctl(nbd, NBD_CLEAR_SOCK) != -1); if (!fork()) { /* The child needs to continue setting things up. */ close(sp[0]); sk = sp[1]; assert(ioctl(nbd, NBD_SET_SOCK, sk) != -1); err = ioctl(nbd, NBD_DO_IT); fprintf(stderr, "nbd device terminated with code %d\n", err); if (err == -1) fprintf(stderr, "%s\n", strerror(errno)); assert(ioctl(nbd, NBD_CLEAR_QUE) != -1); assert(ioctl(nbd, NBD_CLEAR_SOCK) != -1); exit(0); } /* The parent opens the device file at least once, to make sure the * partition table is updated. Then it closes it and starts serving up * requests. */ tmp_fd = open(dev_file, O_RDONLY); assert(tmp_fd != -1); close(tmp_fd); close(sp[1]); sk = sp[0]; reply.magic = htonl(NBD_REPLY_MAGIC); reply.error = htonl(0); while (1) { bytes_read = read(sk, &request, sizeof(request)); assert(bytes_read == sizeof(request)); memcpy(reply.handle, request.handle, sizeof(reply.handle)); len = ntohl(request.len); from = ntohll(request.from); assert(request.magic == htonl(NBD_REQUEST_MAGIC)); switch(ntohl(request.type)) { /* I may at some point need to deal with the the fact that the * official nbd server has a maximum buffer size, and divides up * oversized requests into multiple pieces. This applies to reads * and writes. */ case NBD_CMD_READ: /* fprintf(stderr, "Request for read of size %d\n", len); */ chunk = malloc(len + sizeof(struct nbd_reply)); aop->read((char *)chunk + sizeof(struct nbd_reply), len, from); memcpy(chunk, &reply, sizeof(struct nbd_reply)); write_all(sk, chunk, len + sizeof(struct nbd_reply)); free(chunk); break; case NBD_CMD_WRITE: /* fprintf(stderr, "Request for write of size %d\n", len); */ chunk = malloc(len); read_all(sk, chunk, len); aop->write(chunk, len, from); free(chunk); write_all(sk, &reply, sizeof(struct nbd_reply)); break; case NBD_CMD_DISC: /* Handle a disconnect request. */ aop->disc(); return 0; case NBD_CMD_FLUSH: aop->flush(); break; case NBD_CMD_TRIM: aop->trim(from, len); break; default: assert(0); } } return 0; }