carlwgeorge / rpms / qemu

Forked from rpms/qemu a year ago
Clone
0fb2b27
From: Paolo Bonzini <pbonzini@redhat.com>
0fb2b27
Date: Mon, 21 Aug 2017 18:58:56 +0200
59eb7ad
Subject: [PATCH] scsi: add persistent reservation manager using qemu-pr-helper
0fb2b27
0fb2b27
This adds a concrete subclass of pr-manager that talks to qemu-pr-helper.
0fb2b27
0fb2b27
Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
0fb2b27
---
0fb2b27
 scsi/Makefile.objs       |   2 +-
a056f39
 scsi/pr-manager-helper.c | 302 +++++++++++++++++++++++++++++++++++++++
0fb2b27
 2 files changed, 303 insertions(+), 1 deletion(-)
0fb2b27
 create mode 100644 scsi/pr-manager-helper.c
0fb2b27
0fb2b27
diff --git a/scsi/Makefile.objs b/scsi/Makefile.objs
0fb2b27
index 5496d2ae6a..4d25e476cf 100644
0fb2b27
--- a/scsi/Makefile.objs
0fb2b27
+++ b/scsi/Makefile.objs
0fb2b27
@@ -1,3 +1,3 @@
0fb2b27
 block-obj-y += utils.o
0fb2b27
 
0fb2b27
-block-obj-$(CONFIG_LINUX) += pr-manager.o
0fb2b27
+block-obj-$(CONFIG_LINUX) += pr-manager.o pr-manager-helper.o
0fb2b27
diff --git a/scsi/pr-manager-helper.c b/scsi/pr-manager-helper.c
0fb2b27
new file mode 100644
0fb2b27
index 0000000000..82ff6b6123
0fb2b27
--- /dev/null
0fb2b27
+++ b/scsi/pr-manager-helper.c
0fb2b27
@@ -0,0 +1,302 @@
0fb2b27
+/*
0fb2b27
+ * Persistent reservation manager that talks to qemu-pr-helper
0fb2b27
+ *
0fb2b27
+ * Copyright (c) 2017 Red Hat, Inc.
0fb2b27
+ *
0fb2b27
+ * Author: Paolo Bonzini <pbonzini@redhat.com>
0fb2b27
+ *
0fb2b27
+ * This code is licensed under the LGPL v2.1 or later.
0fb2b27
+ *
0fb2b27
+ */
0fb2b27
+
0fb2b27
+#include "qemu/osdep.h"
0fb2b27
+#include "qapi/error.h"
0fb2b27
+#include "scsi/constants.h"
0fb2b27
+#include "scsi/pr-manager.h"
0fb2b27
+#include "scsi/utils.h"
0fb2b27
+#include "io/channel.h"
0fb2b27
+#include "io/channel-socket.h"
0fb2b27
+#include "pr-helper.h"
0fb2b27
+
0fb2b27
+#include <scsi/sg.h>
0fb2b27
+
0fb2b27
+#define PR_MAX_RECONNECT_ATTEMPTS 5 /* connect/send tries per command */
0fb2b27
+
0fb2b27
+#define TYPE_PR_MANAGER_HELPER "pr-manager-helper" /* QOM type name */
0fb2b27
+/* Cast an object pointer to PRManagerHelper through OBJECT_CHECK.  */
0fb2b27
+#define PR_MANAGER_HELPER(obj) \
0fb2b27
+     OBJECT_CHECK(PRManagerHelper, (obj), \
0fb2b27
+                  TYPE_PR_MANAGER_HELPER)
0fb2b27
+
0fb2b27
+typedef struct PRManagerHelper {
0fb2b27
+    /* <private> */
0fb2b27
+    PRManager parent;
0fb2b27
+
0fb2b27
+    char *path; /* UNIX socket path used to reach the helper */
0fb2b27
+
0fb2b27
+    QemuMutex lock; /* held by run/complete while ioc is in use */
0fb2b27
+    QIOChannel *ioc; /* connection to the helper; NULL when not connected */
0fb2b27
+} PRManagerHelper;
0fb2b27
+
0fb2b27
+/* Called with lock held.  Returns 0, or -EINVAL after dropping the channel.  */
0fb2b27
+static int pr_manager_helper_read(PRManagerHelper *pr_mgr,
0fb2b27
+                                  void *buf, int sz, Error **errp)
0fb2b27
+{
0fb2b27
+    ssize_t r = qio_channel_read_all(pr_mgr->ioc, buf, sz, errp);
0fb2b27
+
0fb2b27
+    if (r < 0) {
0fb2b27
+        object_unref(OBJECT(pr_mgr->ioc));
0fb2b27
+        pr_mgr->ioc = NULL; /* makes the next command reconnect */
0fb2b27
+        return -EINVAL;
0fb2b27
+    }
0fb2b27
+
0fb2b27
+    return 0;
0fb2b27
+}
0fb2b27
+
0fb2b27
+/* Called with lock held.  On failure pr_mgr->ioc is released and cleared.  */
0fb2b27
+static int pr_manager_helper_write(PRManagerHelper *pr_mgr,
0fb2b27
+                                   int fd,
0fb2b27
+                                   const void *buf, int sz, Error **errp)
0fb2b27
+{
0fb2b27
+    size_t nfds = (fd != -1); /* fd == -1 means no descriptor to pass */
0fb2b27
+    while (sz > 0) {
0fb2b27
+        struct iovec iov = { .iov_base = (void *)buf, .iov_len = sz };
0fb2b27
+        ssize_t n_written;
0fb2b27
+
0fb2b27
+        n_written = qio_channel_writev_full(QIO_CHANNEL(pr_mgr->ioc), &iov, 1,
0fb2b27
+                                            nfds ? &fd : NULL, nfds, errp);
0fb2b27
+
0fb2b27
+        if (n_written <= 0) {
0fb2b27
+            assert(n_written != QIO_CHANNEL_ERR_BLOCK);
0fb2b27
+            /* Clear ioc so callers reconnect instead of reusing it.  */
0fb2b27
+            object_unref(OBJECT(pr_mgr->ioc));
0fb2b27
+            pr_mgr->ioc = NULL;
0fb2b27
+            return -EINVAL; /* a zero-length write is a failure too */
0fb2b27
+        }
0fb2b27
+
0fb2b27
+        nfds = 0; /* the descriptor goes out with the first chunk only */
0fb2b27
+        buf += n_written;
0fb2b27
+        sz -= n_written;
0fb2b27
+    }
0fb2b27
+
0fb2b27
+    return 0;
0fb2b27
+}
0fb2b27
+
0fb2b27
+/* Called with lock held.  Connects to the helper and negotiates features.  */
0fb2b27
+static int pr_manager_helper_initialize(PRManagerHelper *pr_mgr,
0fb2b27
+                                        Error **errp)
0fb2b27
+{
0fb2b27
+    char *path = g_strdup(pr_mgr->path);
0fb2b27
+    SocketAddress saddr = {
0fb2b27
+        .type = SOCKET_ADDRESS_TYPE_UNIX,
0fb2b27
+        .u.q_unix.path = path
0fb2b27
+    };
0fb2b27
+    QIOChannelSocket *sioc = qio_channel_socket_new();
0fb2b27
+    Error *local_err = NULL;
0fb2b27
+
0fb2b27
+    uint32_t flags;
0fb2b27
+    int r;
0fb2b27
+
0fb2b27
+    assert(!pr_mgr->ioc);
0fb2b27
+    qio_channel_set_name(QIO_CHANNEL(sioc), "pr-manager-helper");
0fb2b27
+    qio_channel_socket_connect_sync(sioc,
0fb2b27
+                                    &saddr,
0fb2b27
+                                    &local_err);
0fb2b27
+    g_free(path);
0fb2b27
+    if (local_err) {
0fb2b27
+        object_unref(OBJECT(sioc));
0fb2b27
+        error_propagate(errp, local_err);
0fb2b27
+        return -ENOTCONN; /* connect failed; pr_mgr->ioc stays NULL */
0fb2b27
+    }
0fb2b27
+
0fb2b27
+    qio_channel_set_delay(QIO_CHANNEL(sioc), false);
0fb2b27
+    pr_mgr->ioc = QIO_CHANNEL(sioc);
0fb2b27
+
0fb2b27
+    /* A simple feature negotiation protocol, even though there is
0fb2b27
+     * no optional feature right now: read the helper's flags, reply with 0.
0fb2b27
+     */
0fb2b27
+    r = pr_manager_helper_read(pr_mgr, &flags, sizeof(flags), errp);
0fb2b27
+    if (r < 0) {
0fb2b27
+        goto out_close;
0fb2b27
+    }
0fb2b27
+
0fb2b27
+    flags = 0;
0fb2b27
+    r = pr_manager_helper_write(pr_mgr, -1, &flags, sizeof(flags), errp);
0fb2b27
+    if (r < 0) {
0fb2b27
+        goto out_close;
0fb2b27
+    }
0fb2b27
+
0fb2b27
+    return 0;
0fb2b27
+
0fb2b27
+out_close: /* NOTE(review): read/write already unref ioc on failure */
0fb2b27
+    object_unref(OBJECT(pr_mgr->ioc));
0fb2b27
+    pr_mgr->ioc = NULL;
0fb2b27
+    return r;
0fb2b27
+}
0fb2b27
+
0fb2b27
+static int pr_manager_helper_run(PRManager *p,
0fb2b27
+                                 int fd, struct sg_io_hdr *io_hdr)
0fb2b27
+{
0fb2b27
+    PRManagerHelper *pr_mgr = PR_MANAGER_HELPER(p);
0fb2b27
+    /* Forwards one PERSISTENT RESERVE IN/OUT SG_IO request to the helper.  */
0fb2b27
+    uint32_t len;
0fb2b27
+    PRHelperResponse resp;
0fb2b27
+    int ret;
0fb2b27
+    int expected_dir;
0fb2b27
+    int attempts;
0fb2b27
+    uint8_t cdb[PR_HELPER_CDB_SIZE] = { 0 };
0fb2b27
+
0fb2b27
+    if (!io_hdr->cmd_len || io_hdr->cmd_len > PR_HELPER_CDB_SIZE) {
0fb2b27
+        return -EINVAL;
0fb2b27
+    }
0fb2b27
+
0fb2b27
+    memcpy(cdb, io_hdr->cmdp, io_hdr->cmd_len);
0fb2b27
+    assert(cdb[0] == PERSISTENT_RESERVE_OUT || cdb[0] == PERSISTENT_RESERVE_IN);
0fb2b27
+    expected_dir =
0fb2b27
+        (cdb[0] == PERSISTENT_RESERVE_OUT ? SG_DXFER_TO_DEV : SG_DXFER_FROM_DEV);
0fb2b27
+    if (io_hdr->dxfer_direction != expected_dir) {
0fb2b27
+        return -EINVAL;
0fb2b27
+    }
0fb2b27
+
0fb2b27
+    len = scsi_cdb_xfer(cdb);
0fb2b27
+    if (io_hdr->dxfer_len < len || len > PR_HELPER_DATA_SIZE) {
0fb2b27
+        return -EINVAL;
0fb2b27
+    }
0fb2b27
+
0fb2b27
+    qemu_mutex_lock(&pr_mgr->lock);
0fb2b27
+
0fb2b27
+    /* Try to reconnect while sending the CDB; fd is passed along with it.  */
0fb2b27
+    for (attempts = 0; attempts < PR_MAX_RECONNECT_ATTEMPTS; attempts++) {
0fb2b27
+        if (!pr_mgr->ioc) {
0fb2b27
+            ret = pr_manager_helper_initialize(pr_mgr, NULL);
0fb2b27
+            if (ret < 0) {
0fb2b27
+                qemu_mutex_unlock(&pr_mgr->lock);
0fb2b27
+                g_usleep(G_USEC_PER_SEC); /* back off with lock released */
0fb2b27
+                qemu_mutex_lock(&pr_mgr->lock);
0fb2b27
+                continue;
0fb2b27
+            }
0fb2b27
+        }
0fb2b27
+
0fb2b27
+        ret = pr_manager_helper_write(pr_mgr, fd, cdb, ARRAY_SIZE(cdb), NULL);
0fb2b27
+        if (ret >= 0) {
0fb2b27
+            break;
0fb2b27
+        }
0fb2b27
+    }
0fb2b27
+    if (ret < 0) {
0fb2b27
+        goto out;
0fb2b27
+    }
0fb2b27
+
0fb2b27
+    /* After sending the CDB, any communications failure causes the
0fb2b27
+     * command to fail.  The failure is transient, retrying the command
0fb2b27
+     * will invoke pr_manager_helper_initialize again.
0fb2b27
+     */
0fb2b27
+    if (expected_dir == SG_DXFER_TO_DEV) {
0fb2b27
+        io_hdr->resid = io_hdr->dxfer_len - len;
0fb2b27
+        ret = pr_manager_helper_write(pr_mgr, -1, io_hdr->dxferp, len, NULL);
0fb2b27
+        if (ret < 0) {
0fb2b27
+            goto out;
0fb2b27
+        }
0fb2b27
+    }
0fb2b27
+    ret = pr_manager_helper_read(pr_mgr, &resp, sizeof(resp), NULL);
0fb2b27
+    if (ret < 0) {
0fb2b27
+        goto out;
0fb2b27
+    }
0fb2b27
+
0fb2b27
+    resp.result = be32_to_cpu(resp.result); /* big-endian on the wire */
0fb2b27
+    resp.sz = be32_to_cpu(resp.sz);
0fb2b27
+    if (io_hdr->dxfer_direction == SG_DXFER_FROM_DEV) {
0fb2b27
+        assert(resp.sz <= io_hdr->dxfer_len); /* helper is trusted here */
0fb2b27
+        ret = pr_manager_helper_read(pr_mgr, io_hdr->dxferp, resp.sz, NULL);
0fb2b27
+        if (ret < 0) {
0fb2b27
+            goto out;
0fb2b27
+        }
0fb2b27
+        io_hdr->resid = io_hdr->dxfer_len - resp.sz;
0fb2b27
+    } else {
0fb2b27
+        assert(resp.sz == 0);
0fb2b27
+    }
0fb2b27
+
0fb2b27
+    io_hdr->status = resp.result;
0fb2b27
+    if (resp.result == CHECK_CONDITION) {
0fb2b27
+        io_hdr->driver_status = SG_ERR_DRIVER_SENSE;
0fb2b27
+        io_hdr->sb_len_wr = MIN(io_hdr->mx_sb_len, PR_HELPER_SENSE_SIZE);
0fb2b27
+        memcpy(io_hdr->sbp, resp.sense, io_hdr->sb_len_wr);
0fb2b27
+    }
0fb2b27
+
0fb2b27
+out: /* transport failures are reported as LUN_COMM_FAILURE sense data */
0fb2b27
+    if (ret < 0) {
0fb2b27
+        int sense_len = scsi_build_sense(io_hdr->sbp,
0fb2b27
+                                         SENSE_CODE(LUN_COMM_FAILURE));
0fb2b27
+        io_hdr->driver_status = SG_ERR_DRIVER_SENSE;
0fb2b27
+        io_hdr->sb_len_wr = MIN(io_hdr->mx_sb_len, sense_len);
0fb2b27
+        io_hdr->status = CHECK_CONDITION;
0fb2b27
+    }
0fb2b27
+    qemu_mutex_unlock(&pr_mgr->lock);
0fb2b27
+    return ret;
0fb2b27
+}
0fb2b27
+
0fb2b27
+static void pr_manager_helper_complete(UserCreatable *uc, Error **errp)
0fb2b27
+{
0fb2b27
+    PRManagerHelper *pr_mgr = PR_MANAGER_HELPER(uc);
0fb2b27
+    /* Connect to the helper now; a failure is reported through errp.  */
0fb2b27
+    qemu_mutex_lock(&pr_mgr->lock);
0fb2b27
+    pr_manager_helper_initialize(pr_mgr, errp);
0fb2b27
+    qemu_mutex_unlock(&pr_mgr->lock);
0fb2b27
+}
0fb2b27
+
0fb2b27
+static char *get_path(Object *obj, Error **errp)
0fb2b27
+{
0fb2b27
+    PRManagerHelper *pr_mgr = PR_MANAGER_HELPER(obj);
0fb2b27
+    /* "path" property getter: hands back a newly allocated copy.  */
0fb2b27
+    return g_strdup(pr_mgr->path);
0fb2b27
+}
0fb2b27
+
0fb2b27
+static void set_path(Object *obj, const char *str, Error **errp)
0fb2b27
+{
0fb2b27
+    PRManagerHelper *pr_mgr = PR_MANAGER_HELPER(obj);
0fb2b27
+    /* "path" property setter: replaces any previous value with a copy.  */
0fb2b27
+    g_free(pr_mgr->path);
0fb2b27
+    pr_mgr->path = g_strdup(str); /* read by the next connect attempt */
0fb2b27
+}
0fb2b27
+
0fb2b27
+static void pr_manager_helper_instance_finalize(Object *obj)
0fb2b27
+{
0fb2b27
+    PRManagerHelper *pr_mgr = PR_MANAGER_HELPER(obj);
0fb2b27
+    /* Release everything the instance owns: channel, path copy, mutex.  */
0fb2b27
+    object_unref(OBJECT(pr_mgr->ioc));
0fb2b27
+    g_free(pr_mgr->path); /* g_strdup'd in set_path(); was leaked before */
0fb2b27
+    qemu_mutex_destroy(&pr_mgr->lock);
0fb2b27
+}
0fb2b27
+
0fb2b27
+static void pr_manager_helper_instance_init(Object *obj)
0fb2b27
+{
0fb2b27
+    PRManagerHelper *pr_mgr = PR_MANAGER_HELPER(obj);
0fb2b27
+    /* The lock is destroyed again in pr_manager_helper_instance_finalize.  */
0fb2b27
+    qemu_mutex_init(&pr_mgr->lock);
0fb2b27
+}
0fb2b27
+
0fb2b27
+static void pr_manager_helper_class_init(ObjectClass *klass,
0fb2b27
+                                         void *class_data G_GNUC_UNUSED)
0fb2b27
+{
0fb2b27
+    PRManagerClass *prmgr_klass = PR_MANAGER_CLASS(klass);
0fb2b27
+    UserCreatableClass *uc_klass = USER_CREATABLE_CLASS(klass);
0fb2b27
+    /* Expose the "path" string property and install the class callbacks.  */
0fb2b27
+    object_class_property_add_str(klass, "path", get_path, set_path,
0fb2b27
+                                  &error_abort);
0fb2b27
+    uc_klass->complete = pr_manager_helper_complete;
0fb2b27
+    prmgr_klass->run = pr_manager_helper_run;
0fb2b27
+}
0fb2b27
+
0fb2b27
+static const TypeInfo pr_manager_helper_info = {
0fb2b27
+    .parent = TYPE_PR_MANAGER, /* concrete subclass of pr-manager */
0fb2b27
+    .name = TYPE_PR_MANAGER_HELPER,
0fb2b27
+    .instance_size = sizeof(PRManagerHelper),
0fb2b27
+    .instance_init = pr_manager_helper_instance_init,
0fb2b27
+    .instance_finalize = pr_manager_helper_instance_finalize,
0fb2b27
+    .class_init = pr_manager_helper_class_init,
0fb2b27
+};
0fb2b27
+
0fb2b27
+static void pr_manager_helper_register_types(void)
0fb2b27
+{
0fb2b27
+    type_register_static(&pr_manager_helper_info); /* "pr-manager-helper" */
0fb2b27
+}
0fb2b27
+
0fb2b27
+type_init(pr_manager_helper_register_types); /* hooks the function above */