diff -up nfs-utils-1.2.3/configure.ac.orig nfs-utils-1.2.3/configure.ac
--- nfs-utils-1.2.3/configure.ac.orig 2010-10-04 15:47:06.581340251 -0400
+++ nfs-utils-1.2.3/configure.ac 2010-10-04 15:48:00.049475138 -0400
@@ -72,11 +72,15 @@ AC_ARG_ENABLE(nfsv4,
enable_nfsv4=yes)
if test "$enable_nfsv4" = yes; then
AC_DEFINE(NFS4_SUPPORTED, 1, [Define this if you want NFSv4 support compiled in])
+ BLKMAPD=blkmapd
IDMAPD=idmapd
+ SPNFSD=spnfsd
else
enable_nfsv4=
+ BLKMAPD=
IDMAPD=
fi
+ AC_SUBST(BLKMAPD)
AC_SUBST(IDMAPD)
AC_SUBST(enable_nfsv4)
AM_CONDITIONAL(CONFIG_NFSV4, [test "$enable_nfsv4" = "yes"])
@@ -439,9 +443,11 @@ AC_CONFIG_FILES([
tools/mountstats/Makefile
tools/nfs-iostat/Makefile
utils/Makefile
+ utils/blkmapd/Makefile
utils/exportfs/Makefile
utils/gssd/Makefile
utils/idmapd/Makefile
+ utils/spnfsd/Makefile
utils/mount/Makefile
utils/mountd/Makefile
utils/nfsd/Makefile
diff -up nfs-utils-1.2.3/support/include/nfslib.h.orig nfs-utils-1.2.3/support/include/nfslib.h
--- nfs-utils-1.2.3/support/include/nfslib.h.orig 2010-09-28 08:24:16.000000000 -0400
+++ nfs-utils-1.2.3/support/include/nfslib.h 2010-10-04 15:48:00.069391711 -0400
@@ -89,6 +89,7 @@ struct exportent {
char * e_fslocdata;
char * e_uuid;
struct sec_entry e_secinfo[SECFLAVOR_COUNT+1];
+ int e_pnfs;
};
struct rmtabent {
diff -up nfs-utils-1.2.3/support/include/nfs/nfs.h.orig nfs-utils-1.2.3/support/include/nfs/nfs.h
--- nfs-utils-1.2.3/support/include/nfs/nfs.h.orig 2010-09-28 08:24:16.000000000 -0400
+++ nfs-utils-1.2.3/support/include/nfs/nfs.h 2010-10-04 15:48:00.050474882 -0400
@@ -47,6 +47,7 @@ struct nfs_fh_old {
#define NFSCTL_GETFH 6 /* get an fh (used by mountd) */
#define NFSCTL_GETFD 7 /* get an fh by path (used by mountd) */
#define NFSCTL_GETFS 8 /* get an fh by path with max size (used by mountd) */
+#define NFSCTL_FD2FH 9 /* get a fh from a fd */
#define NFSCTL_UDPBIT (1 << (17 - 1))
#define NFSCTL_TCPBIT (1 << (18 - 1))
@@ -136,6 +137,11 @@ struct nfsctl_fsparm {
int gd_maxlen;
};
+/* FD2FH */
+struct nfsctl_fd2fh {
+ int fd;
+};
+
/*
* This is the argument union.
*/
@@ -149,6 +155,7 @@ struct nfsctl_arg {
struct nfsctl_fhparm u_getfh;
struct nfsctl_fdparm u_getfd;
struct nfsctl_fsparm u_getfs;
+ struct nfsctl_fd2fh u_fd2fh;
} u;
#define ca_svc u.u_svc
#define ca_client u.u_client
@@ -157,6 +164,7 @@ struct nfsctl_arg {
#define ca_getfh u.u_getfh
#define ca_getfd u.u_getfd
#define ca_getfs u.u_getfs
+#define ca_fd2fh u.u_fd2fh
#define ca_authd u.u_authd
};
diff -up nfs-utils-1.2.3/support/nfs/exports.c.orig nfs-utils-1.2.3/support/nfs/exports.c
--- nfs-utils-1.2.3/support/nfs/exports.c.orig 2010-10-04 15:47:06.589340404 -0400
+++ nfs-utils-1.2.3/support/nfs/exports.c 2010-10-04 15:48:00.070350101 -0400
@@ -107,6 +107,7 @@ static void init_exportent (struct expor
ee->e_nsquids = 0;
ee->e_nsqgids = 0;
ee->e_uuid = NULL;
+ ee->e_pnfs = 0;
}
struct exportent *
@@ -299,6 +300,8 @@ putexportent(struct exportent *ep)
}
fprintf(fp, "anonuid=%d,anongid=%d", ep->e_anonuid, ep->e_anongid);
secinfo_show(fp, ep);
+ if (ep->e_pnfs)
+ fprintf(fp, ",pnfs");
fprintf(fp, ")\n");
}
@@ -557,6 +560,10 @@ parseopts(char *cp, struct exportent *ep
clearflags(NFSEXP_NOACL, active, ep);
else if (strcmp(opt, "no_acl") == 0)
setflags(NFSEXP_NOACL, active, ep);
+ else if (strcmp(opt, "pnfs") == 0)
+ ep->e_pnfs = 1;
+ else if (strcmp(opt, "no_pnfs") == 0)
+ ep->e_pnfs = 0;
else if (strncmp(opt, "anonuid=", 8) == 0) {
char *oe;
ep->e_anonuid = strtol(opt+8, &oe, 10);
diff -up nfs-utils-1.2.3/utils/blkmapd/atomicio.c.orig nfs-utils-1.2.3/utils/blkmapd/atomicio.c
--- nfs-utils-1.2.3/utils/blkmapd/atomicio.c.orig 2010-10-04 15:48:00.071418550 -0400
+++ nfs-utils-1.2.3/utils/blkmapd/atomicio.c 2010-10-04 15:48:00.071418550 -0400
@@ -0,0 +1,54 @@
+/*
+ * Copyright (c) 2002 Marius Aamodt Eriksen <marius@monkey.org>
+ * Copyright (c) 1995,1999 Theo de Raadt. All rights reserved.
+ * All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include <sys/types.h>
+#include <unistd.h>
+#include <errno.h>
+
+/*
+ * ensure all of data on socket comes through. f==read || f==write
+ */
+ssize_t atomicio(ssize_t(*f) (int, void *, size_t), int fd, void *_s, size_t n)
+{
+ char *s = _s;
+ ssize_t res, pos = 0;
+
+ while (n > pos) {
+ res = (f) (fd, s + pos, n - pos);
+ switch (res) {
+ case -1:
+ if (errno == EINTR || errno == EAGAIN)
+ continue;
+ case 0:
+ if (pos != 0)
+ return pos;
+ return res;
+ default:
+ pos += res;
+ }
+ }
+ return pos;
+}
diff -up nfs-utils-1.2.3/utils/blkmapd/cfg.c.orig nfs-utils-1.2.3/utils/blkmapd/cfg.c
--- nfs-utils-1.2.3/utils/blkmapd/cfg.c.orig 2010-10-04 15:48:00.072379352 -0400
+++ nfs-utils-1.2.3/utils/blkmapd/cfg.c 2010-10-04 15:48:00.072379352 -0400
@@ -0,0 +1,248 @@
+/*
+ * Copyright (c) 2010 EMC Corporation, Haiying Tang <Tang_Haiying@emc.com>
+ * All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include <sys/param.h>
+#include <sys/stat.h>
+#include <linux/errno.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <unistd.h>
+#include <string.h>
+#include <fcntl.h>
+#include <ctype.h>
+
+#include "device-discovery.h"
+#include "cfg.h"
+
+char *conf_path = "/etc/blkmapd.conf";
+
+struct scan_root_list *scan_root_list_head;
+
+void bl_release_list(void)
+{
+ struct scan_root_list *root = scan_root_list_head;
+ struct scan_device_list *disk;
+
+ while (root) {
+ disk = root->disk;
+ while (disk) {
+ root->disk = disk->next;
+ free(disk->name);
+ free(disk);
+ disk = root->disk;
+ }
+ scan_root_list_head = root->next;
+ free(root->name);
+ free(root);
+ root = scan_root_list_head;
+ }
+}
+
+struct scan_root_list *bl_alloc_root_list(char *name, int all_disk)
+{
+ struct scan_root_list *root;
+
+ root = malloc(sizeof(struct scan_root_list));
+ if (!root)
+ goto nomem;
+
+ root->name = strdup(name);
+ if (!root->name)
+ goto nomem;
+ root->next = scan_root_list_head;
+ root->all_disk = all_disk;
+ scan_root_list_head = root;
+ return root;
+
+ nomem:
+ BL_LOG_ERR("%s: Out of memory!\n", __func__);
+ if (root)
+ free(root);
+ return NULL;
+}
+
+struct scan_device_list *bl_alloc_device_list(struct scan_root_list *root,
+ char *name)
+{
+ struct scan_device_list *device;
+
+ device = malloc(sizeof(struct scan_device_list));
+ if (!device)
+ goto nomem;
+
+ device->name = strdup(name);
+ if (!device->name)
+ goto nomem;
+ device->next = root->disk;
+ root->disk = device;
+ return device;
+
+ nomem:
+ BL_LOG_ERR("%s: Out of memory!\n", __func__);
+ if (device)
+ free(device);
+ return NULL;
+}
+
+struct scan_device_list *bl_insert_device_list(struct scan_root_list *root,
+ char *name)
+{
+ struct scan_device_list *device = root->disk;
+
+ /* Check whether this device has been inserted */
+ while (device) {
+ if (device->name && !strcmp(device->name, name))
+ return device;
+ device = device->next;
+ }
+
+ return bl_alloc_device_list(root, name);
+}
+
+struct scan_root_list *bl_insert_root_list(char *name, int all_disk)
+{
+ struct scan_root_list *root = scan_root_list_head;
+
+ /* Check whether this root has been inserted */
+ while (root) {
+ if (root->name && !strcmp(root->name, name))
+ return root;
+ root = root->next;
+ }
+
+ return bl_alloc_root_list(name, all_disk);
+}
+
+int bl_parse_line(char *line, struct scan_root_list **bl_root)
+{
+ char *root, *device, *end;
+
+ root = strdup(line);
+ end = root + strlen(line);
+
+ /* Skip comments */
+ if (*root == '#')
+ return 0;
+
+ /* Trim leading space */
+ while (*root != '\0' && isspace(*root))
+ root++;
+ if (*root == '\0')
+ return 0;
+
+ /* Trim trailing space and set "end" to last char */
+ while ((isspace(*end) || (*end == '\0')) && (end > root))
+ end--;
+
+ /* For lines ending with '/' or '/','*': add as a dir root */
+ if ((*end == '/') ||
+ ((*end == '*') && (end - root >= 1) && (*(end - 1) == '/'))) {
+ if (*end == '*')
+ end--;
+ if (*end == '/')
+ end--;
+ *(end + 1) = '\0';
+ *bl_root = bl_insert_root_list(root, 1);
+ return 0;
+ }
+
+ /* Other lines: add as a device */
+ device = end;
+ while ((*device != '/') && (device > root))
+ device--;
+ if (device == root) {
+ BL_LOG_ERR("%s: invalid config line\n", __func__);
+ return -1;
+ }
+ *device = '\0';
+ *bl_root = bl_insert_root_list(root, 0);
+ if (*bl_root == NULL)
+ return -ENOMEM;
+ if (*end == '*')
+ end--;
+ *(end + 1) = '\0';
+ if (bl_insert_device_list(*bl_root, device + 1) == NULL)
+ return -ENOMEM;
+
+ return 0;
+}
+
+int bl_set_default_conf(void)
+{
+ struct scan_root_list *root = NULL;
+ int rv;
+
+ bl_release_list();
+ rv = bl_parse_line("/dev/sd*", &root);
+ if (rv < 0)
+ return rv;
+ rv = bl_parse_line("/dev/mapper/", &root);
+ return rv;
+}
+
+int bl_parse_conf(char *buf)
+{
+ char *tmp = buf, *line = buf, *end = buf + strlen(buf);
+ struct scan_root_list *bl_root = NULL;
+ int rv;
+
+ while (tmp < end) {
+ if (*tmp == '\n') {
+ *tmp = '\0';
+ rv = bl_parse_line(line, &bl_root);
+ if (rv < 0)
+ return rv;
+ line = tmp + 1;
+ }
+ tmp++;
+ }
+
+ return 0;
+}
+
+int bl_cfg_init(void)
+{
+ struct scan_root_list *root = NULL;
+ FILE *f = NULL;
+ char buf[PATH_MAX];
+ int rv = 0;
+
+ f = fopen(conf_path, "r");
+ if (f == NULL)
+ rv = bl_set_default_conf();
+ else {
+ while (fgets(buf, sizeof buf, f) != NULL) {
+ rv = bl_parse_line(buf, &root);
+ if (rv < 0)
+ break;
+ }
+ }
+ if (!scan_root_list_head)
+ rv = -EINVAL;
+
+ if (f)
+ fclose(f);
+ return rv;
+}
diff -up nfs-utils-1.2.3/utils/blkmapd/cfg.h.orig nfs-utils-1.2.3/utils/blkmapd/cfg.h
--- nfs-utils-1.2.3/utils/blkmapd/cfg.h.orig 2010-10-04 15:48:00.072379352 -0400
+++ nfs-utils-1.2.3/utils/blkmapd/cfg.h 2010-10-04 15:48:00.072379352 -0400
@@ -0,0 +1,47 @@
+/*
+ * bl-cfg.h
+ *
+ * Copyright (c) 2010 EMC Corporation, Haiying Tang <Tang_Haiying@emc.com>
+ * All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+#ifndef BL_CFG_H
+#define BL_CFG_H
+
+extern char *conf_path;
+extern struct scan_root_list *scan_root_list_head;
+
+struct scan_device_list {
+ struct scan_device_list *next;
+ char *name;
+};
+
+struct scan_root_list {
+ struct scan_root_list *next;
+ unsigned int all_disk;
+ char *name;
+ struct scan_device_list *disk;
+};
+
+int bl_cfg_init(void);
+
+#endif
diff -up nfs-utils-1.2.3/utils/blkmapd/device-discovery.c.orig nfs-utils-1.2.3/utils/blkmapd/device-discovery.c
--- nfs-utils-1.2.3/utils/blkmapd/device-discovery.c.orig 2010-10-04 15:48:00.073350775 -0400
+++ nfs-utils-1.2.3/utils/blkmapd/device-discovery.c 2010-10-04 15:48:00.073350775 -0400
@@ -0,0 +1,502 @@
+/*
+ * device-discovery.c: main function, discovering device and processing
+ * pipe request from kernel.
+ *
+ * Copyright (c) 2010 EMC Corporation, Haiying Tang <Tang_Haiying@emc.com>
+ * All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include <stdlib.h>
+#include <stdio.h>
+#include <string.h>
+#include <dirent.h>
+#include <ctype.h>
+#include <linux/kdev_t.h>
+#include <sys/types.h>
+#include <sys/stat.h>
+#include <sys/ioctl.h>
+#include <sys/mount.h>
+#include <sys/select.h>
+#include <fcntl.h>
+#include <unistd.h>
+#include <libgen.h>
+#include <errno.h>
+#include <scsi/scsi.h>
+#include <scsi/scsi_ioctl.h>
+#include <scsi/sg.h>
+#include "device-discovery.h"
+#include "cfg.h"
+
+#define BL_PIPE_FILE "/var/lib/nfs/rpc_pipefs/bl_device_pipe"
+#define PID_FILE "/var/run/blkmapd.pid"
+
+struct bl_disk *visible_disk_list;
+
+struct bl_disk_path *bl_get_path(const char *filepath,
+ struct bl_disk_path *paths)
+{
+ struct bl_disk_path *tmp = paths;
+ while (tmp) {
+ if (!strcmp(tmp->full_path, filepath))
+ break;
+ tmp = tmp->next;
+ }
+ return tmp;
+}
+
+/* Check whether valid_path is a substring(partition) of path */
+int bl_is_partition(struct bl_disk_path *valid_path, struct bl_disk_path *path)
+{
+ if (!strncmp(valid_path->full_path, path->full_path,
+ strlen(valid_path->full_path)))
+ return 1;
+
+ return 0;
+}
+
+/*
+ * For multipath devices, devices state could be PASSIVE/ACTIVE/PSEUDO,
+ * where PSEUDO > ACTIVE > PASSIVE. Device with highest state is used to
+ * create pseudo device. So if state is higher, the device path needs to
+ * be updated.
+ * If device-mapper multipath support is a must, pseudo devices should
+ * exist for each multipath device. If not, active device path will be
+ * chosen for device creation.
+ * Treat partition as invalid path.
+ */
+int bl_update_path(struct bl_disk_path *path, enum bl_path_state_e state,
+ struct bl_disk *disk)
+{
+ struct bl_disk_path *valid_path = disk->valid_path;
+
+ if (valid_path) {
+ if (valid_path->state >= state) {
+ if (bl_is_partition(valid_path, path))
+ return 0;
+ }
+ }
+ return 1;
+}
+
+void bl_release_disk(void)
+{
+ struct bl_disk *disk;
+ struct bl_disk_path *path = NULL;
+
+ while (visible_disk_list) {
+ disk = visible_disk_list;
+ path = disk->paths;
+ while (path) {
+ disk->paths = path->next;
+ free(path->full_path);
+ free(path);
+ path = disk->paths;
+ }
+ if (disk->serial)
+ free(disk->serial);
+ visible_disk_list = disk->next;
+ free(disk);
+ }
+}
+
+void bl_add_disk(char *filepath)
+{
+ struct bl_disk *disk = NULL;
+ int fd = 0;
+ struct stat sb;
+ off_t size = 0;
+ struct bl_serial *serial = NULL;
+ enum bl_path_state_e ap_state = BL_PATH_STATE_PASSIVE;
+ struct bl_disk_path *diskpath = NULL, *path = NULL;
+ dev_t dev;
+
+ BL_LOG_ERR("%s: %s\n", __func__, filepath);
+
+ fd = open(filepath, O_RDONLY | O_LARGEFILE);
+ if (fd < 0)
+ return;
+
+ if (fstat(fd, &sb)) {
+ close(fd);
+ return;
+ }
+
+ if (!sb.st_size)
+ ioctl(fd, BLKGETSIZE, &size);
+ else
+ size = sb.st_size;
+
+ if (!size) {
+ close(fd);
+ return;
+ }
+
+ dev = sb.st_rdev;
+ serial = bldev_read_serial(fd, filepath);
+
+ for (disk = visible_disk_list; disk != NULL; disk = disk->next) {
+ /* Already scanned or a partition?
+ * XXX: if released each time, maybe not need to compare
+ */
+ if ((serial->len == disk->serial->len) &&
+ !memcmp(serial->data, disk->serial->data, serial->len)) {
+ diskpath = bl_get_path(filepath, disk->paths);
+ break;
+ }
+ }
+
+ if (disk && diskpath) {
+ close(fd);
+ return;
+ }
+
+ bldev_read_ap_state(fd, &ap_state);
+ close(fd);
+
+ /*
+ * Not sure how to identify a pseudo device created by
+ * device-mapper, so leave /dev/mapper for now.
+ */
+ if (strncmp(filepath, "/dev/mapper", 11) == 0)
+ ap_state = BL_PATH_STATE_PSEUDO;
+
+ /* add path */
+ path = malloc(sizeof(struct bl_disk_path));
+ if (!path) {
+ BL_LOG_ERR("%s: Out of memory!\n", __func__);
+ goto out_err;
+ }
+ path->next = NULL;
+ path->state = ap_state;
+ path->full_path = strdup(filepath);
+ if (!path->full_path)
+ goto out_err;
+
+ if (!disk) { /* add disk */
+ disk = malloc(sizeof(struct bl_disk));
+ if (!disk) {
+ BL_LOG_ERR("%s: Out of memory!\n", __func__);
+ goto out_err;
+ }
+ disk->next = visible_disk_list;
+ disk->dev = dev;
+ disk->size = size;
+ disk->serial = serial;
+ disk->valid_path = path;
+ disk->paths = path;
+ visible_disk_list = disk;
+ } else {
+ path->next = disk->paths;
+ disk->paths = path;
+ /* check whether we need to update disk info */
+ if (bl_update_path(path, path->state, disk)) {
+ disk->dev = dev;
+ disk->size = size;
+ disk->valid_path = path;
+ }
+ }
+ return;
+
+ out_err:
+ if (path) {
+ if (path->full_path)
+ free(path->full_path);
+ free(path);
+ }
+ return;
+}
+
+void bl_devicescan(const char *filename, struct scan_root_list *root)
+{
+ /* scan all disks */
+ char filepath[PATH_MAX];
+ struct scan_device_list *device;
+
+ if (!strcmp(filename, ".") || !strcmp(filename, ".."))
+ return;
+
+ memset(filepath, 0, sizeof(filepath));
+ if (strlen(filename) < (PATH_MAX - strlen(root->name) - 2))
+ sprintf(filepath, "%s/%s", root->name, filename);
+ else {
+ BL_LOG_ERR("%s: name too long\n", __func__);
+ return;
+ }
+ if (root->all_disk)
+ goto valid;
+
+ device = root->disk;
+ while (device) {
+ /* If device->name is a subset of filename, this disk should be
+ * valid for scanning.
+ * For example, device->name is "sd", filename is "sda".
+ */
+ if (device->name
+ && !memcmp(filename, device->name, strlen(device->name)))
+ goto valid;
+ device = device->next;
+ }
+
+ return;
+
+ valid:
+ /*
+ * sg device is not a real device, but a device created according
+ * to each scsi device. It won't be used for pseudo device creation.
+ * I moved it here, so that sg devices will not be scanned.
+ */
+ if (!strncmp(filepath, "/dev/sg", 7))
+ return;
+ bl_add_disk(filepath);
+ return;
+}
+
+int bl_discover_devices(void)
+{
+ DIR *dir;
+ struct dirent *dp;
+ struct scan_root_list *root = scan_root_list_head;
+
+ /* release previous list */
+ bl_release_disk();
+
+ /* scan all disks */
+ while (root) {
+ dir = opendir(root->name);
+ if (dir == NULL) {
+ root = root->next;
+ continue;
+ }
+
+ while ((dp = readdir(dir)) != NULL)
+ bl_devicescan(dp->d_name, root);
+
+ root = root->next;
+ closedir(dir);
+ }
+
+ return 0;
+}
+
+/* process kernel request
+ * return 0: request processed, and no more request waiting;
+ * return 1: request processed, and more requests waiting;
+ * return < 0: error
+ */
+int bl_disk_inquiry_process(int fd)
+{
+ int ret = 0;
+ struct pipefs_hdr *head = NULL, *tmp;
+ char *buf = NULL;
+ uint32_t major, minor;
+ uint16_t buflen;
+ unsigned int len = 0;
+
+ head = calloc(1, sizeof(struct pipefs_hdr));
+ if (!head) {
+ BL_LOG_ERR("%s: Out of memory!\n", __func__);
+ return -ENOMEM;
+ }
+
+ /* read request */
+ if (atomicio(read, fd, head, sizeof(*head)) != sizeof(*head)) {
+ /* Note that an error in this or the next read is pretty
+ * catastrophic, as there is no good way to resync into
+ * the pipe's stream.
+ */
+ BL_LOG_ERR("Read pipefs head error!\n");
+ ret = -EIO;
+ goto out;
+ }
+
+ buflen = head->totallen - sizeof(*head);
+ buf = malloc(buflen);
+ if (!buf) {
+ BL_LOG_ERR("%s: Out of memory!\n", __func__);
+ ret = -ENOMEM;
+ goto out;
+ }
+
+ if (atomicio(read, fd, buf, buflen) != buflen) {
+ BL_LOG_ERR("Read pipefs content error!\n");
+ ret = -EIO;
+ goto out;
+ }
+
+ head->status = BL_DEVICE_REQUEST_PROC;
+ switch (head->type) {
+ case BL_DEVICE_MOUNT:
+ if (!process_deviceinfo(buf, buflen, &major, &minor)) {
+ head->status = BL_DEVICE_REQUEST_ERR;
+ goto out;
+ }
+ tmp = realloc(head, sizeof(major) + sizeof(minor) +
+ sizeof(struct pipefs_hdr));
+ if (!tmp) {
+ BL_LOG_ERR("%s: Out of memory!\n", __func__);
+ ret = -ENOMEM;
+ goto out;
+ }
+ head = tmp;
+ memcpy((void *)head + sizeof(struct pipefs_hdr),
+ &major, sizeof(major));
+ memcpy((void *)head + sizeof(struct pipefs_hdr) + sizeof(major),
+ &minor, sizeof(minor));
+ len = sizeof(major) + sizeof(minor);
+ break;
+ case BL_DEVICE_UMOUNT:
+ if (!dm_device_remove_all((uint64_t *) buf))
+ head->status = BL_DEVICE_REQUEST_ERR;
+ bl_discover_devices();
+ break;
+ default:
+ head->status = BL_DEVICE_REQUEST_ERR;
+ }
+
+ head->totallen = sizeof(struct pipefs_hdr) + len;
+ /* write to pipefs */
+ if (atomicio((void *)write, fd, head, head->totallen)
+ != head->totallen) {
+ BL_LOG_ERR("Write pipefs error!\n");
+ ret = -EIO;
+ }
+
+ out:
+ if (buf)
+ free(buf);
+ if (head)
+ free(head);
+ return ret;
+}
+
+/* TODO: set bl_process_stop to 1 in command */
+unsigned int bl_process_stop;
+
+int bl_run_disk_inquiry_process(int fd)
+{
+ fd_set rset;
+ struct timeval tv;
+ int ret;
+
+ bl_process_stop = 0;
+
+ for (;;) {
+ if (bl_process_stop)
+ return 1;
+ FD_ZERO(&rset);
+ FD_SET(fd, &rset);
+ ret = 0;
+ tv.tv_sec = BL_DEVICE_DISCOVERY_INTERVAL;
+ switch (select(fd + 1, &rset, NULL, NULL, &tv)) {
+ case -1:
+ if (errno == EINTR)
+ continue;
+ else {
+ ret = -errno;
+ goto out;
+ }
+ case 0:
+ goto out;
+ default:
+ if (FD_ISSET(fd, &rset))
+ ret = bl_disk_inquiry_process(fd);
+ }
+ }
+ out:
+ return ret;
+}
+
+/* Daemon */
+int main(int argc, char **argv)
+{
+ int fd, opt, fg = 0, ret = 1;
+ struct stat statbuf;
+ char pidbuf[64];
+
+ while ((opt = getopt(argc, argv, "c:f")) != -1) {
+ switch (opt) {
+ case 'c':
+ conf_path = optarg;
+ break;
+ case 'f':
+ fg = 1;
+ break;
+ }
+ }
+
+ if (!stat(PID_FILE, &statbuf)) {
+ fprintf(stderr, "Pid file already existed\n");
+ return -1;
+ }
+
+ if (!fg && daemon(0, 0) != 0) {
+ fprintf(stderr, "Daemonize failed\n");
+ return -1;
+ }
+
+ openlog("blkmapd", LOG_PID, 0);
+ fd = open(PID_FILE, O_WRONLY | O_CREAT, 0644);
+ if (fd < 0) {
+ BL_LOG_ERR("Create pid file failed\n");
+ return -1;
+ }
+
+ if (lockf(fd, F_TLOCK, 0) < 0) {
+ BL_LOG_ERR("Lock pid file failed\n");
+ close(fd);
+ return -1;
+ }
+ ftruncate(fd, 0);
+ sprintf(pidbuf, "%d\n", getpid());
+ write(fd, pidbuf, strlen(pidbuf));
+
+ /* open pipe file */
+ fd = open(BL_PIPE_FILE, O_RDWR);
+ if (fd < 0) {
+ BL_LOG_ERR("open pipe file error\n");
+ return -1;
+ }
+
+ ret = bl_cfg_init();
+ if (ret < 0) {
+ if (ret == -ENOENT)
+ BL_LOG_WARNING("Config file not exist, use default\n");
+ else {
+ BL_LOG_ERR("Open/read Block pNFS config file error\n");
+ return -1;
+ }
+ }
+
+ while (1) {
+ /* discover device when needed */
+ bl_discover_devices();
+
+ ret = bl_run_disk_inquiry_process(fd);
+ if (ret < 0) {
+ /* what should we do with process error? */
+ BL_LOG_ERR("inquiry process return %d\n", ret);
+ }
+ }
+ close(fd);
+ return ret;
+}
diff -up nfs-utils-1.2.3/utils/blkmapd/device-discovery.h.orig nfs-utils-1.2.3/utils/blkmapd/device-discovery.h
--- nfs-utils-1.2.3/utils/blkmapd/device-discovery.h.orig 2010-10-04 15:48:00.073350775 -0400
+++ nfs-utils-1.2.3/utils/blkmapd/device-discovery.h 2010-10-04 15:48:00.073350775 -0400
@@ -0,0 +1,162 @@
+/*
+ * bl-device-discovery.h
+ *
+ * Copyright (c) 2010 EMC Corporation, Haiying Tang <Tang_Haiying@emc.com>
+ * All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+#ifndef BL_DEVICE_DISCOVERY_H
+#define BL_DEVICE_DISCOVERY_H
+
+#define BL_DEVICE_DISCOVERY_INTERVAL 60
+
+#include <stdint.h>
+#include <syslog.h>
+
+enum blk_vol_type {
+ BLOCK_VOLUME_SIMPLE = 0, /* maps to a single LU */
+ BLOCK_VOLUME_SLICE = 1, /* slice of another volume */
+ BLOCK_VOLUME_CONCAT = 2, /* concatenation of multiple volumes */
+ BLOCK_VOLUME_STRIPE = 3, /* striped across multiple volumes */
+ BLOCK_VOLUME_PSEUDO = 4,
+};
+
+/* All disk offset/lengths are stored in 512-byte sectors */
+struct bl_volume {
+ uint32_t bv_type;
+ off_t bv_size;
+ struct bl_volume **bv_vols;
+ int bv_vol_n;
+ union {
+ dev_t bv_dev; /* for BLOCK_VOLUME_SIMPLE(PSEUDO) */
+ off_t bv_stripe_unit; /* for BLOCK_VOLUME_STRIPE(CONCAT) */
+ off_t bv_offset; /* for BLOCK_VOLUME_SLICE */
+ } param;
+};
+
+struct bl_sig_comp {
+ int64_t bs_offset; /* In bytes */
+ uint32_t bs_length; /* In bytes */
+ char *bs_string;
+};
+
+/* Maximum number of signatures components in a simple volume */
+# define BLOCK_MAX_SIG_COMP 16
+
+struct bl_sig {
+ int si_num_comps;
+ struct bl_sig_comp si_comps[BLOCK_MAX_SIG_COMP];
+};
+
+/*
+ * Multipath support: ACTIVE or PSEUDO device is valid,
+ * PASSIVE is a standby for ACTIVE.
+ */
+enum bl_path_state_e {
+ BL_PATH_STATE_PASSIVE = 1,
+ BL_PATH_STATE_ACTIVE = 2,
+ BL_PATH_STATE_PSEUDO = 3,
+};
+
+struct bl_serial {
+ int len;
+ char *data;
+};
+
+struct bl_disk_path {
+ struct bl_disk_path *next;
+ char *full_path;
+ enum bl_path_state_e state;
+};
+
+struct bl_disk {
+ struct bl_disk *next;
+ struct bl_serial *serial;
+ dev_t dev;
+ off_t size;
+ struct bl_disk_path *valid_path;
+ struct bl_disk_path *paths;
+};
+
+struct bl_dev_id {
+ unsigned char type;
+ unsigned char ids;
+ unsigned char reserve;
+ unsigned char len;
+ char data[0];
+};
+
+struct pipefs_hdr {
+ uint32_t msgid;
+ uint8_t type;
+ uint8_t flags;
+ uint16_t totallen; /* length of entire message, including hdr */
+ uint32_t status;
+};
+
+#define BL_DEVICE_UMOUNT 0x0 /* Umount--delete devices */
+#define BL_DEVICE_MOUNT 0x1 /* Mount--create devices */
+#define BL_DEVICE_REQUEST_INIT 0x0 /* Start request */
+#define BL_DEVICE_REQUEST_PROC 0x1 /* User process succeeds */
+#define BL_DEVICE_REQUEST_ERR 0x2 /* User process fails */
+
+uint32_t *blk_overflow(uint32_t * p, uint32_t * end, size_t nbytes);
+
+#define BLK_READBUF(p, e, nbytes) do { \
+ p = blk_overflow(p, e, nbytes); \
+ if (!p) {\
+ goto out_err;\
+ } \
+} while (0)
+
+#define READ32(x) (x) = ntohl(*p++)
+
+#define READ64(x) do { \
+ (x) = (uint64_t)ntohl(*p++) << 32; \
+ (x) |= ntohl(*p++); \
+} while (0)
+
+#define READ_SECTOR(x) do { \
+ READ64(tmp); \
+ if (tmp & 0x1ff) { \
+ goto out_err; \
+ } \
+ (x) = tmp >> 9; \
+} while (0)
+
+extern struct bl_disk *visible_disk_list;
+uint64_t dm_device_create(struct bl_volume *vols, int num_vols);
+int dm_device_remove_all(uint64_t *dev);
+uint64_t process_deviceinfo(const char *dev_addr_buf,
+ unsigned int dev_addr_len,
+ uint32_t *major, uint32_t *minor);
+
+extern ssize_t atomicio(ssize_t(*f) (int, void *, size_t),
+ int fd, void *_s, size_t n);
+extern struct bl_serial *bldev_read_serial(int fd, const char *filename);
+extern void bldev_read_ap_state(int fd, enum bl_path_state_e *ap_state_out);
+extern int bl_discover_devices(void);
+
+#define BL_LOG_WARNING(fmt...) syslog(LOG_WARNING, fmt)
+#define BL_LOG_ERR(fmt...) syslog(LOG_ERR, fmt)
+#define BL_LOG_DEBUG(fmt...) syslog(LOG_DEBUG, fmt)
+#endif
diff -up nfs-utils-1.2.3/utils/blkmapd/device-inq.c.orig nfs-utils-1.2.3/utils/blkmapd/device-inq.c
--- nfs-utils-1.2.3/utils/blkmapd/device-inq.c.orig 2010-10-04 15:48:00.074563030 -0400
+++ nfs-utils-1.2.3/utils/blkmapd/device-inq.c 2010-10-04 15:48:00.074563030 -0400
@@ -0,0 +1,235 @@
+/*
+ * device-inq.c: inquire SCSI device information.
+ *
+ * Copyright (c) 2010 EMC Corporation, Haiying Tang <Tang_Haiying@emc.com>
+ * All rights reserved.
+ *
+ * This program refers to "SCSI Primary Commands - 3 (SPC-3)
+ * at http://www.t10.org and sg_inq.c in sg3_utils-1.26 for
+ * Linux OS SCSI subsystem, by D. Gilbert.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+#include <stdlib.h>
+#include <stdio.h>
+#include <string.h>
+#include <dirent.h>
+#include <ctype.h>
+#include <sys/types.h>
+#include <sys/stat.h>
+#include <sys/ioctl.h>
+#include <sys/mount.h>
+#include <sys/select.h>
+#include <fcntl.h>
+#include <unistd.h>
+#include <libgen.h>
+#include <errno.h>
+#include <scsi/scsi.h>
+#include <scsi/scsi_ioctl.h>
+#include <scsi/sg.h>
+#include "device-discovery.h"
+
+#define DEF_ALLOC_LEN 255
+#define MX_ALLOC_LEN (0xc000 + 0x80)
+
+struct bl_serial *bl_create_scsi_string(int len, const char *bytes)
+{
+ struct bl_serial *s;
+ s = malloc(sizeof(*s) + len);
+ if (s) {
+ s->data = (char *)&s[1];
+ s->len = len;
+ memcpy(s->data, bytes, len);
+ }
+ return s;
+}
+
+void bl_free_scsi_string(struct bl_serial *str)
+{
+ if (str)
+ free(str);
+}
+
+#define sg_io_ok(io_hdr) \
+ ((((io_hdr).status & 0x7e) == 0) && \
+ ((io_hdr).host_status == 0) && \
+ (((io_hdr).driver_status & 0x0f) == 0))
+
+static int sg_timeout = 1 * 1000;
+
+static int bldev_inquire_page(int fd, int page, char *buffer, int len)
+{
+ unsigned char cmd[] = { INQUIRY, 0, 0, 0, 0, 0 };
+ unsigned char sense_b[28];
+ struct sg_io_hdr io_hdr;
+ if (page >= 0) {
+ cmd[1] = 1;
+ cmd[2] = page;
+ }
+ cmd[3] = (unsigned char)((len >> 8) & 0xff);
+ cmd[4] = (unsigned char)(len & 0xff);
+
+ memset(&io_hdr, 0, sizeof(struct sg_io_hdr));
+ io_hdr.interface_id = 'S';
+ io_hdr.cmd_len = sizeof(cmd);
+ io_hdr.mx_sb_len = sizeof(sense_b);
+ io_hdr.dxfer_direction = SG_DXFER_FROM_DEV;
+ io_hdr.dxfer_len = len;
+ io_hdr.dxferp = buffer;
+ io_hdr.cmdp = cmd;
+ io_hdr.sbp = sense_b;
+ io_hdr.timeout = sg_timeout;
+ if (ioctl(fd, SG_IO, &io_hdr) < 0)
+ return -1;
+
+ if (sg_io_ok(io_hdr))
+ return 0;
+ return -1;
+}
+
+int bldev_inquire_pages(int fd, int page, char **buffer)
+{
+ int status = 0;
+ char *tmp;
+ int len;
+
+ *buffer = calloc(DEF_ALLOC_LEN, sizeof(char));
+ if (!*buffer) {
+ BL_LOG_ERR("%s: Out of memory!\n", __func__);
+ return -ENOMEM;
+ }
+
+ status = bldev_inquire_page(fd, page, *buffer, DEF_ALLOC_LEN);
+ if (status)
+ goto out;
+
+ status = -1;
+ if ((*(*buffer + 1) & 0xff) != page)
+ goto out;
+
+ len = (*(*buffer + 2) << 8) + *(*buffer + 3) + 4;
+ if (len > MX_ALLOC_LEN) {
+ BL_LOG_ERR("SCSI response length too long: %d\n", len);
+ goto out;
+ }
+ if (len > DEF_ALLOC_LEN) {
+ tmp = realloc(*buffer, len);
+ if (!tmp) {
+ BL_LOG_ERR("%s: Out of memory!\n", __func__);
+ status = -ENOMEM;
+ goto out;
+ }
+ *buffer = tmp;
+ status = bldev_inquire_page(fd, page, *buffer, len);
+ if (status)
+ goto out;
+ }
+ status = 0;
+ out:
+ return status;
+}
+
+/* For EMC multipath devices, use VPD page (0xc0) to get status.
+ * For other devices, return ACTIVE for now
+ */
+void bldev_read_ap_state(int fd, enum bl_path_state_e *ap_state_out)
+{
+ int status = 0;
+ char *buffer;
+
+ *ap_state_out = BL_PATH_STATE_ACTIVE;
+
+ status = bldev_inquire_pages(fd, 0xc0, &buffer);
+ if (status)
+ goto out;
+
+ if (buffer[4] < 0x02)
+ *ap_state_out = BL_PATH_STATE_PASSIVE;
+ out:
+ if (buffer)
+ free(buffer);
+ return;
+}
+
+struct bl_serial *bldev_read_serial(int fd, const char *filename)
+{
+ struct bl_serial *serial_out = NULL;
+ int status = 0, pos, len;
+ char *buffer;
+ struct bl_dev_id *dev_root, *dev_id;
+ unsigned int current_id = 0;
+
+ status = bldev_inquire_pages(fd, 0x83, &buffer);
+ if (status)
+ goto out;
+
+ dev_root = (struct bl_dev_id *)buffer;
+
+ pos = 0;
+ current_id = 0;
+ len = dev_root->len;
+ while (pos < (len - sizeof(struct bl_dev_id) + sizeof(unsigned char))) {
+ dev_id = (struct bl_dev_id *)&(dev_root->data[pos]);
+ if ((dev_id->ids & 0xf) < current_id)
+ continue;
+ switch (dev_id->ids & 0xf) {
+ /* We process SCSI ID with four ID cases: 0, 1, 2 and 3.
+ * When more than one ID is available, priority is
+ * 3>2>1>0.
+ */
+ case 2: /* EUI-64 based */
+ if ((dev_id->len != 8) && (dev_id->len != 12) &&
+ (dev_id->len != 16)) {
+ BL_LOG_ERR("EUI-64 only decodes 8, "
+ "12 and 16\n");
+ break;
+ }
+ case 3: /* NAA */
+ /* TODO: NAA validity judgement too complicated,
+ * so just ingore it here.
+ */
+ if ((dev_id->type & 0xf) != 1) {
+ BL_LOG_ERR("Binary code_set expected\n");
+ break;
+ }
+ case 0: /* vendor specific */
+ case 1: /* T10 vendor identification */
+ current_id = dev_id->ids & 0xf;
+ if (serial_out)
+ bl_free_scsi_string(serial_out);
+ serial_out = bl_create_scsi_string(dev_id->len,
+ dev_id->data);
+ break;
+ default:
+ break;
+ }
+ if (current_id == 3)
+ break;
+ pos += (dev_id->len + sizeof(struct bl_dev_id) -
+ sizeof(unsigned char));
+ }
+ out:
+ if (!serial_out)
+ serial_out = bl_create_scsi_string(strlen(filename), filename);
+ if (buffer)
+ free(buffer);
+ return serial_out;
+}
diff -up nfs-utils-1.2.3/utils/blkmapd/device-process.c.orig nfs-utils-1.2.3/utils/blkmapd/device-process.c
--- nfs-utils-1.2.3/utils/blkmapd/device-process.c.orig 2010-10-04 15:48:00.075557769 -0400
+++ nfs-utils-1.2.3/utils/blkmapd/device-process.c 2010-10-04 15:48:00.075557769 -0400
@@ -0,0 +1,394 @@
+/*
+ * device-process.c: detailed processing of device information sent
+ * from kernel.
+ *
+ * Copyright (c) 2006 The Regents of the University of Michigan.
+ * All rights reserved.
+ *
+ * Andy Adamson <andros@citi.umich.edu>
+ * Fred Isaman <iisaman@umich.edu>
+ *
+ * Copyright (c) 2010 EMC Corporation, Haiying Tang <Tang_Haiying@emc.com>
+ *
+ * Used codes in linux/fs/nfs/blocklayout/blocklayoutdev.c.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include <libdevmapper.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <unistd.h>
+#include <sys/types.h>
+#include <sys/stat.h>
+#include <sys/user.h>
+#include <fcntl.h>
+#include <errno.h>
+#include <arpa/inet.h>
+#include <linux/kdev_t.h>
+#include "device-discovery.h"
+
+uint32_t *blk_overflow(uint32_t * p, uint32_t * end, size_t nbytes)
+{
+ uint32_t *q = p + ((nbytes + 3) >> 2);
+ if (q > end || q < p)
+ return NULL;
+ return p;
+}
+
+static int decode_blk_signature(uint32_t **pp, uint32_t *end,
+ struct bl_sig *sig)
+{
+ int i, tmp;
+ uint32_t *p = *pp;
+
+ BLK_READBUF(p, end, 4);
+ READ32(sig->si_num_comps);
+ if (sig->si_num_comps == 0) {
+ BL_LOG_ERR("0 components in sig\n");
+ goto out_err;
+ }
+ if (sig->si_num_comps >= BLOCK_MAX_SIG_COMP) {
+ BL_LOG_ERR("number of sig comps %i >= BLOCK_MAX_SIG_COMP\n",
+ sig->si_num_comps);
+ goto out_err;
+ }
+ for (i = 0; i < sig->si_num_comps; i++) {
+ BLK_READBUF(p, end, 12);
+ READ64(sig->si_comps[i].bs_offset);
+ READ32(tmp);
+ sig->si_comps[i].bs_length = tmp;
+ BLK_READBUF(p, end, tmp);
+ /* Note we rely here on fact that sig is used immediately
+ * for mapping, then thrown away.
+ */
+ sig->si_comps[i].bs_string = (char *)p;
+ BL_LOG_ERR("%s: si_comps[%d]: bs_length %d, bs_string %s\n",
+ __func__, i, sig->si_comps[i].bs_length,
+ sig->si_comps[i].bs_string);
+ p += ((tmp + 3) >> 2);
+ }
+ *pp = p;
+ return 0;
+ out_err:
+ return -EIO;
+}
+
+/* Read signature from device
+ * return 0: read successfully
+ * return -1: error
+ */
+int
+read_cmp_blk_sig(const char *dev_name, struct bl_sig_comp *comp,
+ int64_t bs_offset)
+{
+ int fd, ret = -1;
+ char *sig = NULL;
+
+ fd = open(dev_name, O_RDONLY | O_LARGEFILE);
+ if (fd < 0) {
+ BL_LOG_ERR("%s could not be opened for read\n", dev_name);
+ goto error;
+ }
+
+ sig = (char *)malloc(comp->bs_length);
+ if (!sig) {
+ BL_LOG_ERR("%s: Out of memory\n", __func__);
+ goto error;
+ }
+
+ if (lseek64(fd, bs_offset, SEEK_SET) == -1) {
+ BL_LOG_ERR("File %s lseek error\n", dev_name);
+ goto error;
+ }
+
+ if (atomicio(read, fd, sig, comp->bs_length) != comp->bs_length) {
+ BL_LOG_ERR("File %s read error\n", dev_name);
+ goto error;
+ }
+
+ BL_LOG_ERR
+ ("%s: %s sig: %s, bs_string: %s, bs_length: %d, bs_offset: %lld\n",
+ __func__, dev_name, sig, comp->bs_string, comp->bs_length,
+ (long long)bs_offset);
+ ret = memcmp(sig, comp->bs_string, comp->bs_length);
+
+ error:
+ if (sig)
+ free(sig);
+ if (fd >= 0)
+ close(fd);
+ return ret;
+}
+
+/*
+ * All signatures in sig must be found on disk for verification.
+ * Returns True if sig matches, False otherwise.
+ */
+static int verify_sig(struct bl_disk *disk, struct bl_sig *sig)
+{
+ struct bl_sig_comp *comp;
+ int i, ret;
+ int64_t bs_offset;
+
+ for (i = 0; i < sig->si_num_comps; i++) {
+ comp = &sig->si_comps[i];
+ bs_offset = comp->bs_offset;
+ if (bs_offset < 0)
+ bs_offset += (((int64_t) disk->size) << 9);
+ BL_LOG_ERR("%s: bs_offset: %lld\n",
+ __func__, (long long) bs_offset);
+ ret = read_cmp_blk_sig(disk->valid_path->full_path,
+ comp, bs_offset);
+ if (ret)
+ return 0;
+ }
+ return 1;
+}
+
+/*
+ * map_sig_to_device()
+ * Given a signature, walk the list of visible disks searching for
+ * a match. Returns True if mapping was done, False otherwise.
+ *
+ * While we're at it, fill in the vol->bv_size.
+ */
+static int map_sig_to_device(struct bl_sig *sig, struct bl_volume *vol)
+{
+ int mapped = 0;
+ struct bl_disk *disk = visible_disk_list;
+ char *filepath = 0;
+ struct bl_disk *lolDisk = disk;
+
+ while (lolDisk) {
+ BL_LOG_ERR("%s: visible_disk_list: %s\n", __func__,
+ lolDisk->valid_path->full_path);
+ lolDisk = lolDisk->next;
+ }
+
+ /* scan disk list to find out match device */
+ while (disk) {
+ /* FIXME: should we use better algorithm for disk scan? */
+ mapped = verify_sig(disk, sig);
+ if (mapped) {
+ vol->param.bv_dev = disk->dev;
+ filepath = disk->valid_path->full_path;
+ vol->bv_size = disk->size;
+ break;
+ }
+ disk = disk->next;
+ }
+ return mapped;
+}
+
+/* We are given an array of XDR encoded array indices, each of which should
+ * refer to a previously decoded device. Translate into a list of pointers
+ * to the appropriate pnfs_blk_volume's.
+ */
+static int set_vol_array(uint32_t **pp, uint32_t *end,
+ struct bl_volume *vols, int working)
+{
+ int i, index;
+ uint32_t *p = *pp;
+ struct bl_volume **array = vols[working].bv_vols;
+ for (i = 0; i < vols[working].bv_vol_n; i++) {
+ BLK_READBUF(p, end, 4);
+ READ32(index);
+ if ((index < 0) || (index >= working)) {
+ BL_LOG_ERR("set_vol_array: Id %i out of range\n",
+ index);
+ goto out_err;
+ }
+ array[i] = &vols[index];
+ }
+ *pp = p;
+ return 0;
+ out_err:
+ return -EIO;
+}
+
+static uint64_t sum_subvolume_sizes(struct bl_volume *vol)
+{
+ int i;
+ uint64_t sum = 0;
+ for (i = 0; i < vol->bv_vol_n; i++)
+ sum += vol->bv_vols[i]->bv_size;
+ return sum;
+}
+
+static int decode_blk_volume(uint32_t **pp, uint32_t *end,
+ struct bl_volume *vols, int i, int *array_cnt)
+{
+ int status = 0, j;
+ struct bl_sig sig;
+ uint32_t *p = *pp;
+ struct bl_volume *vol = &vols[i];
+ uint64_t tmp, tmp_size;
+ div_t d;
+
+ BLK_READBUF(p, end, 4);
+ READ32(vol->bv_type);
+ switch (vol->bv_type) {
+ case BLOCK_VOLUME_SIMPLE:
+ *array_cnt = 0;
+ status = decode_blk_signature(&p, end, &sig);
+ if (status)
+ return status;
+ status = map_sig_to_device(&sig, vol);
+ if (!status) {
+ BL_LOG_ERR("Could not find disk for device\n");
+ return -ENXIO;
+ }
+ status = 0;
+ break;
+ case BLOCK_VOLUME_SLICE:
+ BLK_READBUF(p, end, 16);
+ READ_SECTOR(vol->param.bv_offset);
+ READ_SECTOR(vol->bv_size);
+ *array_cnt = vol->bv_vol_n = 1;
+ status = set_vol_array(&p, end, vols, i);
+ break;
+ case BLOCK_VOLUME_STRIPE:
+ BLK_READBUF(p, end, 8);
+ READ_SECTOR(vol->param.bv_stripe_unit);
+ off_t chunksize = vol->param.bv_stripe_unit;
+ if ((chunksize == 0) ||
+ ((chunksize & (chunksize - 1)) != 0) ||
+ (chunksize < (PAGE_SIZE >> 9)))
+ return -EIO;
+ BLK_READBUF(p, end, 4);
+ READ32(vol->bv_vol_n);
+ if (!vol->bv_vol_n)
+ return -EIO;
+ *array_cnt = vol->bv_vol_n;
+ status = set_vol_array(&p, end, vols, i);
+ if (status)
+ return status;
+ for (j = 1; j < vol->bv_vol_n; j++) {
+ if (vol->bv_vols[j]->bv_size !=
+ vol->bv_vols[0]->bv_size) {
+ BL_LOG_ERR("varying subvol size\n");
+ return -EIO;
+ }
+ }
+ /* Make sure total size only includes addressable areas */
+ tmp_size = vol->bv_vols[0]->bv_size;
+ d = div(tmp_size, (uint32_t) vol->param.bv_stripe_unit);
+ tmp_size = d.quot;
+ vol->bv_size = tmp_size * vol->param.bv_stripe_unit;
+ break;
+ case BLOCK_VOLUME_CONCAT:
+ BLK_READBUF(p, end, 4);
+ READ32(vol->bv_vol_n);
+ if (!vol->bv_vol_n)
+ return -EIO;
+ *array_cnt = vol->bv_vol_n;
+ status = set_vol_array(&p, end, vols, i);
+ if (status)
+ return status;
+ vol->bv_size = sum_subvolume_sizes(vol);
+ break;
+ default:
+ BL_LOG_ERR("Unknown volume type %i\n", vol->bv_type);
+ out_err:
+ return -EIO;
+ }
+ *pp = p;
+ return status;
+}
+
+uint64_t process_deviceinfo(const char *dev_addr_buf,
+ unsigned int dev_addr_len,
+ uint32_t *major, uint32_t *minor)
+{
+ int num_vols, i, status, count;
+ uint32_t *p, *end;
+ struct bl_volume *vols = NULL, **arrays = NULL, **arrays_ptr = NULL;
+ uint64_t dev = 0;
+ int tried = 0;
+
+ restart:
+ p = (uint32_t *) dev_addr_buf;
+ end = (uint32_t *) ((char *)p + dev_addr_len);
+ /* Decode block volume */
+ BLK_READBUF(p, end, 4);
+ READ32(num_vols);
+ if (num_vols <= 0) {
+ BL_LOG_WARNING("Error: number of vols: %d\n", num_vols);
+ goto out_err;
+ }
+
+ vols = (struct bl_volume *)malloc(num_vols * sizeof(struct bl_volume));
+ if (!vols) {
+ BL_LOG_ERR("%s: Out of memory\n", __func__);
+ goto out_err;
+ }
+
+ /* Each volume in vols array needs its own array. Save time by
+ * allocating them all in one large hunk. Because each volume
+ * array can only reference previous volumes, and because once
+ * a concat or stripe references a volume, it may never be
+ * referenced again, the volume arrays are guaranteed to fit
+ * in the suprisingly small space allocated.
+ */
+ arrays =
+ (struct bl_volume **)malloc(num_vols * 2 *
+ sizeof(struct bl_volume *));
+ if (!arrays) {
+ BL_LOG_ERR("%s: Out of memory\n", __func__);
+ goto out_err;
+ }
+
+ arrays_ptr = arrays;
+
+ for (i = 0; i < num_vols; i++) {
+ vols[i].bv_vols = arrays_ptr;
+ status = decode_blk_volume(&p, end, vols, i, &count);
+ if (status == -ENXIO && (tried <= 5)) {
+ sleep(1);
+ BL_LOG_DEBUG("%s: discover again!\n", __func__);
+ bl_discover_devices();
+ tried++;
+ free(vols);
+ free(arrays);
+ goto restart;
+ }
+ if (status)
+ goto out_err;
+ arrays_ptr += count;
+ }
+
+ if (p != end) {
+ BL_LOG_ERR("p is not equal to end!\n");
+ goto out_err;
+ }
+
+ dev = dm_device_create(vols, num_vols);
+ *major = MAJOR(dev);
+ *minor = MINOR(dev);
+ out_err:
+ if (vols)
+ free(vols);
+ if (arrays)
+ free(arrays);
+ return dev;
+}
diff -up nfs-utils-1.2.3/utils/blkmapd/dm-device.c.orig nfs-utils-1.2.3/utils/blkmapd/dm-device.c
--- nfs-utils-1.2.3/utils/blkmapd/dm-device.c.orig 2010-10-04 15:48:00.075557769 -0400
+++ nfs-utils-1.2.3/utils/blkmapd/dm-device.c 2010-10-04 15:48:00.076394449 -0400
@@ -0,0 +1,509 @@
+/*
+ * dm-device.c: create or remove device via device mapper API.
+ *
+ * Copyright (c) 2010 EMC Corporation, Haiying Tang <Tang_Haiying@emc.com>
+ * All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+#include <libdevmapper.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <sys/types.h>
+#include <sys/stat.h>
+#include <fcntl.h>
+#include <errno.h>
+#include <linux/kdev_t.h>
+#include "device-discovery.h"
+
+#define DM_DEV_NAME_LEN 256
+
+#ifndef DM_MAX_TYPE_NAME
+#define DM_MAX_TYPE_NAME 16
+#endif
+
+#define DM_PARAMS_LEN 512 /* XXX: is this enough for target? */
+#define DM_DIR "/dev/mapper"
+#define DM_DIR_LEN12
+#define TYPE_HAS_DEV(type) ((type == BLOCK_VOLUME_SIMPLE) || \
+ (type == BLOCK_VOLUME_PSEUDO))
+
+struct bl_dm_table {
+ uint64_t offset;
+ uint64_t size;
+ char target_type[DM_MAX_TYPE_NAME];
+ char params[DM_PARAMS_LEN];
+ struct bl_dm_table *next;
+};
+
+struct bl_dm_tree {
+ uint64_t dev;
+ struct dm_tree *tree;
+ struct bl_dm_tree *next;
+};
+
+static inline struct bl_dm_table *bl_dm_table_alloc(void)
+{
+ return (struct bl_dm_table *)calloc(1, sizeof(struct bl_dm_table));
+}
+
+void bl_dm_table_free(struct bl_dm_table *bl_table_head)
+{
+ struct bl_dm_table *p = bl_table_head;
+ while (bl_table_head) {
+ p = bl_table_head->next;
+ free(bl_table_head);
+ bl_table_head = p;
+ }
+}
+
+void add_to_bl_dm_table(struct bl_dm_table **bl_table_head,
+ struct bl_dm_table *table)
+{
+ struct bl_dm_table *pre;
+ if (!*bl_table_head) {
+ *bl_table_head = table;
+ return;
+ }
+ pre = *bl_table_head;
+ while (pre->next)
+ pre = pre->next;
+ pre->next = table;
+ return;
+}
+
+struct bl_dm_tree *bl_tree_head;
+
+struct bl_dm_tree *find_bl_dm_tree(uint64_t dev)
+{
+ struct bl_dm_tree *p = bl_tree_head;
+ while (p) {
+ if (p->dev == dev)
+ return p;
+ p = p->next;
+ }
+ return NULL;
+}
+
+void del_from_bl_dm_tree(uint64_t dev)
+{
+ struct bl_dm_tree *pre = bl_tree_head;
+ struct bl_dm_tree *p;
+
+ p = pre;
+ while (p) {
+ if (p->dev == dev) {
+ pre->next = p->next;
+ if (p == bl_tree_head)
+ bl_tree_head = bl_tree_head->next;
+ free(p);
+ break;
+ }
+ pre = p;
+ p = pre->next;
+ }
+}
+
+void add_to_bl_dm_tree(struct bl_dm_tree *tree)
+{
+ struct bl_dm_tree *pre;
+ if (!bl_tree_head) {
+ bl_tree_head = tree;
+ return;
+ }
+ pre = bl_tree_head;
+ while (pre->next)
+ pre = pre->next;
+ pre->next = tree;
+ return;
+}
+
+/* Create device via device mapper
+ * return 0 when creation failed
+ * return dev no for created device
+ */
+uint64_t dm_single_device_create(const char *dev_name, struct bl_dm_table * p)
+{
+ struct dm_task *dmt;
+ struct dm_info dminfo;
+ int ret = 0;
+
+ dmt = dm_task_create(DM_DEVICE_CREATE);
+ if (!dmt) {
+ BL_LOG_ERR("Create dm_task for %s failed\n", dev_name);
+ return 0;
+ }
+ ret = dm_task_set_name(dmt, dev_name);
+ if (!ret)
+ goto err_out;
+
+ while (p) {
+ ret = dm_task_add_target(dmt, p->offset, p->size,
+ p->target_type, p->params);
+ if (!ret)
+ goto err_out;
+ p = p->next;
+ }
+
+ ret = dm_task_run(dmt) &&
+ dm_task_get_info(dmt, &dminfo) && dminfo.exists;
+
+ if (!ret)
+ goto err_out;
+
+ dm_task_update_nodes();
+
+ err_out:
+ dm_task_destroy(dmt);
+
+ if (!ret) {
+ BL_LOG_ERR("Create device %s failed\n", dev_name);
+ return 0;
+ }
+ return MKDEV(dminfo.major, dminfo.minor);
+}
+
+int dm_device_remove_byname(const char *dev_name)
+{
+ struct dm_task *dmt;
+ int ret = 0;
+
+ dmt = dm_task_create(DM_DEVICE_REMOVE);
+ if (!dmt)
+ return -ENODEV;
+
+ ret = dm_task_set_name(dmt, dev_name) && dm_task_run(dmt);
+
+ dm_task_update_nodes();
+
+ if (dmt)
+ dm_task_destroy(dmt);
+
+ return ret;
+}
+
+int dm_device_remove(uint64_t dev)
+{
+ struct dm_task *dmt;
+ struct dm_names *dmnames;
+ char *names = NULL;
+ int ret = -1;
+
+ /* Look for dev_name via dev, if dev_name could be transferred here,
+ we could jump to DM_DEVICE_REMOVE directly */
+ dmt = dm_task_create(DM_DEVICE_LIST);
+ if (!dmt) {
+ BL_LOG_ERR("dm_task creation failed\n");
+ return -ENODEV;
+ }
+
+ ret = dm_task_run(dmt);
+ if (!ret) {
+ BL_LOG_ERR("dm_task_run failed\n");
+ goto error;
+ }
+
+ dmnames = dm_task_get_names(dmt);
+ if (!dmnames || !dmnames->dev) {
+ BL_LOG_ERR("dm_task_get_names failed\n");
+ goto error;
+ }
+
+ do {
+ if (dmnames->dev == dev) {
+ names = dmnames->name;
+ break;
+ }
+ dmnames = (void *)dmnames + dmnames->next;
+ } while (dmnames);
+
+ if (!names) {
+ BL_LOG_ERR("Could not find device\n");
+ goto error;
+ }
+
+ dm_task_update_nodes();
+
+ error:
+ dm_task_destroy(dmt);
+
+ /* Start to remove device */
+ if (names)
+ ret = dm_device_remove_byname(names);
+ return ret;
+}
+
+static unsigned long dev_count;
+
+void dm_devicelist_remove(unsigned long start, unsigned long end)
+{
+ char dev_name[DM_DEV_NAME_LEN];
+ unsigned long count;
+
+ if ((start >= dev_count) || (end <= 1) || (start >= end - 1))
+ return;
+
+ for (count = end - 1; count > start; count--) {
+ sprintf(dev_name, "pnfs_vol_%lu", count - 1);
+ dm_device_remove_byname(dev_name);
+ }
+
+ return;
+}
+
+void bl_dm_remove_tree(uint64_t dev)
+{
+ struct bl_dm_tree *p;
+
+ p = find_bl_dm_tree(dev);
+ if (!p)
+ return;
+
+ dm_tree_free(p->tree);
+ del_from_bl_dm_tree(dev);
+}
+
+void bl_dm_create_tree(uint64_t dev)
+{
+ struct dm_tree *tree;
+ struct bl_dm_tree *bl_tree;
+
+ bl_tree = find_bl_dm_tree(dev);
+ if (bl_tree)
+ return; /* XXX: error? */
+
+ tree = dm_tree_create();
+ if (!tree)
+ return;
+
+ if (!dm_tree_add_dev(tree, MAJOR(dev), MINOR(dev))) {
+ dm_tree_free(tree);
+ return;
+ }
+
+ bl_tree = malloc(sizeof(struct bl_dm_tree));
+ if (!bl_tree) {
+ dm_tree_free(tree);
+ return;
+ }
+
+ bl_tree->dev = dev;
+ bl_tree->tree = tree;
+ bl_tree->next = NULL;
+ add_to_bl_dm_tree(bl_tree);
+
+ return;
+}
+
+uint64_t dm_device_nametodev(char *dev_name)
+{
+ struct dm_task *dmt;
+ int ret = 0;
+ struct dm_info dminfo;
+
+ dmt = dm_task_create(DM_DEVICE_INFO);
+ if (!dmt)
+ return -ENODEV;
+
+ ret = dm_task_set_name(dmt, dev_name) &&
+ dm_task_run(dmt) && dm_task_get_info(dmt, &dminfo);
+
+ if (dmt)
+ dm_task_destroy(dmt);
+
+ if (!ret)
+ return 0;
+
+ return MKDEV(dminfo.major, dminfo.minor);
+}
+
+int dm_device_remove_all(uint64_t *dev)
+{
+ struct bl_dm_tree *p;
+ struct dm_tree_node *node;
+ const char *uuid;
+ int ret = 0;
+ uint32_t major, minor;
+ uint64_t bl_dev;
+
+ memcpy(&major, dev, sizeof(uint32_t));
+ memcpy(&minor, (void *)dev + sizeof(uint32_t), sizeof(uint32_t));
+ bl_dev = MKDEV(major, minor);
+ p = find_bl_dm_tree(bl_dev);
+ if (!p)
+ return ret;
+
+ node = dm_tree_find_node(p->tree, MAJOR(bl_dev), MINOR(bl_dev));
+ if (!node)
+ return ret;
+
+ uuid = dm_tree_node_get_uuid(node);
+ if (!uuid)
+ return ret;
+
+ dm_device_remove(bl_dev);
+ ret = dm_tree_deactivate_children(node, uuid, strlen(uuid));
+ dm_task_update_nodes();
+ bl_dm_remove_tree(bl_dev);
+ return ret;
+}
+
+/* TODO: check the value for DM_DEV_NAME_LEN, DM_TYPE_LEN, DM_PARAMS_LEN */
+uint64_t dm_device_create(struct bl_volume *vols, int num_vols)
+{
+ uint64_t size, dev = 0;
+ unsigned long count = dev_count;
+ int number = 0, i, pos;
+ struct bl_volume *node;
+ char *tmp;
+ struct bl_dm_table *table = NULL;
+ struct bl_dm_table *bl_table_head = NULL;
+ unsigned int len;
+ char *dev_name = NULL;
+ /* Create pseudo device here */
+ while (number < num_vols) {
+ node = &vols[number];
+ switch (node->bv_type) {
+ case BLOCK_VOLUME_SIMPLE:
+ /* Do not need to create device here */
+ dev = node->param.bv_dev;
+ goto continued;
+ case BLOCK_VOLUME_SLICE:
+ table = bl_dm_table_alloc();
+ if (!table)
+ goto out;
+ table->offset = 0;
+ table->size = node->bv_size;
+ strcpy(table->target_type, "linear");
+ if (!TYPE_HAS_DEV(node->bv_vols[0]->bv_type)) {
+ free(table);
+ goto out;
+ }
+ dev = node->bv_vols[0]->param.bv_dev;
+ tmp = table->params;
+ if (!dm_format_dev(tmp, DM_PARAMS_LEN,
+ MAJOR(dev), MINOR(dev))) {
+ free(table);
+ goto out;
+ }
+ tmp += strlen(tmp);
+ sprintf(tmp, " %lu", node->param.bv_offset);
+ add_to_bl_dm_table(&bl_table_head, table);
+ break;
+ case BLOCK_VOLUME_STRIPE:
+ table = bl_dm_table_alloc();
+ if (!table)
+ goto out;
+ table->offset = 0;
+ table->size = node->bv_size;
+ strcpy(table->target_type, "striped");
+ sprintf(table->params, "%d %lu %n", node->bv_vol_n,
+ node->param.bv_stripe_unit, &pos);
+ /* Repeatedly copy subdev to params */
+ tmp = table->params + pos;
+ len = DM_PARAMS_LEN - pos;
+ for (i = 0; i < node->bv_vol_n; i++) {
+ if (!TYPE_HAS_DEV(node->bv_vols[i]->bv_type)) {
+ free(table);
+ goto out;
+ }
+ dev = node->bv_vols[i]->param.bv_dev;
+ if (!dm_format_dev(tmp, len, MAJOR(dev),
+ MINOR(dev))) {
+ free(table);
+ goto out;
+ }
+ pos = strlen(tmp);
+ tmp += pos;
+ len -= pos;
+ sprintf(tmp, " %d ", 0);
+ tmp += 3;
+ len -= 3;
+ }
+ add_to_bl_dm_table(&bl_table_head, table);
+ break;
+ case BLOCK_VOLUME_CONCAT:
+ size = 0;
+ for (i = 0; i < node->bv_vol_n; i++) {
+ table = bl_dm_table_alloc();
+ if (!table)
+ goto out;
+ table->offset = size;
+ table->size = node->bv_vols[i]->bv_size;
+ if (!TYPE_HAS_DEV(node->bv_vols[i]->bv_type)) {
+ free(table);
+ goto out;
+ }
+ strcpy(table->target_type, "linear");
+ tmp = table->params;
+ dev = node->bv_vols[i]->param.bv_dev;
+ if (!dm_format_dev(tmp, DM_PARAMS_LEN,
+ MAJOR(dev), MINOR(dev))) {
+ free(table);
+ goto out;
+ }
+ tmp += strlen(tmp);
+ sprintf(tmp, " %d", 0);
+ size += table->size;
+ add_to_bl_dm_table(&bl_table_head, table);
+ }
+ break;
+ default:
+ /* Delete previous temporary devices */
+ dm_devicelist_remove(count, dev_count);
+ goto out;
+ } /* end of swtich */
+ /* Create dev_name here. Name of device is pnfs_vol_XXX */
+ if (dev_name)
+ free(dev_name);
+ dev_name = (char *)calloc(DM_DEV_NAME_LEN, sizeof(char));
+ if (!dev_name) {
+ BL_LOG_ERR("%s: Out of memory\n", __func__);
+ goto out;
+ }
+ sprintf(dev_name, "pnfs_vol_%lu", dev_count++);
+
+ dev = dm_single_device_create(dev_name, bl_table_head);
+ if (!dev) {
+ /* Delete previous temporary devices */
+ dm_devicelist_remove(count, dev_count);
+ goto out;
+ }
+ node->param.bv_dev = dev;
+ /* TODO: extend use with PSEUDO later */
+ node->bv_type = BLOCK_VOLUME_PSEUDO;
+ continued:
+ number++;
+ if (bl_table_head)
+ bl_dm_table_free(bl_table_head);
+ bl_table_head = NULL;
+ }
+ out:
+ if (bl_table_head)
+ bl_dm_table_free(bl_table_head);
+ bl_table_head = NULL;
+ if (dev)
+ bl_dm_create_tree(dev);
+ if (dev_name)
+ free(dev_name);
+ return dev;
+}
diff -up nfs-utils-1.2.3/utils/blkmapd/etc/blkmapd.conf.orig nfs-utils-1.2.3/utils/blkmapd/etc/blkmapd.conf
--- nfs-utils-1.2.3/utils/blkmapd/etc/blkmapd.conf.orig 2010-10-04 15:48:00.076394449 -0400
+++ nfs-utils-1.2.3/utils/blkmapd/etc/blkmapd.conf 2010-10-04 15:48:00.076394449 -0400
@@ -0,0 +1,10 @@
+# This is an example config file
+
+# Look at all /dev/sd* devices
+# /dev/sd or /dev/sd*
+/dev/sd*
+
+# Look at all /dev/mapper/* devices
+# /dev/mapper/* or
+# /dev/mapper/
+/dev/mapper/*
diff -up nfs-utils-1.2.3/utils/blkmapd/etc/initd/initd.redhat.orig nfs-utils-1.2.3/utils/blkmapd/etc/initd/initd.redhat
--- nfs-utils-1.2.3/utils/blkmapd/etc/initd/initd.redhat.orig 2010-10-04 15:48:00.076394449 -0400
+++ nfs-utils-1.2.3/utils/blkmapd/etc/initd/initd.redhat 2010-10-04 15:48:00.077339793 -0400
@@ -0,0 +1,76 @@
+#!/bin/sh
+#
+# description: Starts and stops the iSCSI initiator
+#
+# processname: blkmapd
+# pidfile: /var/run/blkmapd.pid
+# config: /etc/blkmapd.conf
+
+# Source function library.
+if [ -f /etc/init.d/functions ] ; then
+ . /etc/init.d/functions
+elif [ -f /etc/rc.d/init.d/functions ] ; then
+ . /etc/rc.d/init.d/functions
+else
+ exit 0
+fi
+
+PATH=/sbin:/bin:/usr/sbin:/usr/bin
+
+RETVAL=0
+
+start()
+{
+ echo -n $"Starting pNFS block-layout device discovery service: "
+ modprobe -q blocklayoutdriver
+ daemon /usr/sbin/blkmapd
+ RETVAL=$?
+ if [ $RETVAL -eq 0 ]; then
+ touch /var/lock/subsys/blkmapd
+ fi
+ echo
+ return $RETVAL
+}
+
+stop()
+{
+ echo -n $"Stopping pNFS block-layout device discovery service: "
+ killproc blkmapd 2> /dev/null
+ rm -f /var/run/blkmapd.pid
+ RETVAL=$?
+ [ $RETVAL -eq 0 ] && rm -f /var/lock/subsys/blkmapd
+ if [ $RETVAL -eq 0 ]; then
+ echo_success
+ else
+ echo_failure
+ fi
+ echo
+ return $RETVAL
+}
+
+restart()
+{
+ stop
+ start
+}
+
+case "$1" in
+ start)
+ start
+ ;;
+ stop)
+ stop
+ ;;
+ restart)
+ stop
+ start
+ ;;
+ status)
+ status blkmapd
+ ;;
+ *)
+ echo $"Usage: $0 {start|stop|restart|status}"
+ exit 1
+esac
+
+exit $RETVAL
diff -up nfs-utils-1.2.3/utils/blkmapd/Makefile.am.orig nfs-utils-1.2.3/utils/blkmapd/Makefile.am
--- nfs-utils-1.2.3/utils/blkmapd/Makefile.am.orig 2010-10-04 15:48:00.071418550 -0400
+++ nfs-utils-1.2.3/utils/blkmapd/Makefile.am 2010-10-04 15:48:00.071418550 -0400
@@ -0,0 +1,22 @@
+## Process this file with automake to produce Makefile.in
+
+#man8_MANS = blkmapd.man
+
+AM_CFLAGS += -D_LARGEFILE64_SOURCE
+sbin_PROGRAMS = blkmapd
+
+blkmapd_SOURCES = \
+ atomicio.c \
+ cfg.c \
+ device-discovery.c \
+ device-inq.c \
+ device-process.c \
+ dm-device.c \
+ \
+ cfg.h \
+ device-discovery.h
+
+blkmapd_LDADD = -ldevmapper ../../support/nfs/libnfs.a
+
+MAINTAINERCLEANFILES = Makefile.in
+
diff -up nfs-utils-1.2.3/utils/exportfs/exportfs.c.orig nfs-utils-1.2.3/utils/exportfs/exportfs.c
--- nfs-utils-1.2.3/utils/exportfs/exportfs.c.orig 2010-09-28 08:24:16.000000000 -0400
+++ nfs-utils-1.2.3/utils/exportfs/exportfs.c 2010-10-04 15:48:00.077339793 -0400
@@ -577,6 +577,8 @@ dump(int verbose)
#endif
}
secinfo_show(stdout, ep);
+ if (ep->e_pnfs)
+ c = dumpopt(c, ",pnfs");
printf("%c\n", (c != '(')? ')' : ' ');
}
}
diff -up nfs-utils-1.2.3/utils/Makefile.am.orig nfs-utils-1.2.3/utils/Makefile.am
--- nfs-utils-1.2.3/utils/Makefile.am.orig 2010-09-28 08:24:16.000000000 -0400
+++ nfs-utils-1.2.3/utils/Makefile.am 2010-10-04 15:48:00.070350101 -0400
@@ -4,6 +4,8 @@ OPTDIRS =
if CONFIG_NFSV4
OPTDIRS += idmapd
+OPTDIRS += spnfsd
+OPTDIRS += blkmapd
endif
if CONFIG_GSS
diff -up nfs-utils-1.2.3/utils/mountd/cache.c.orig nfs-utils-1.2.3/utils/mountd/cache.c
--- nfs-utils-1.2.3/utils/mountd/cache.c.orig 2010-09-28 08:24:16.000000000 -0400
+++ nfs-utils-1.2.3/utils/mountd/cache.c 2010-10-04 15:48:00.078357497 -0400
@@ -653,6 +653,8 @@ static int dump_to_cache(FILE *f, char *
qword_printint(f, exp->e_anonuid);
qword_printint(f, exp->e_anongid);
qword_printint(f, exp->e_fsid);
+ if (exp->e_pnfs == 1)
+ qword_print(f, "pnfs");
write_fsloc(f, exp);
write_secinfo(f, exp, flag_mask);
if (exp->e_uuid == NULL || different_fs) {
diff -up nfs-utils-1.2.3/utils/spnfsd/atomicio.c.orig nfs-utils-1.2.3/utils/spnfsd/atomicio.c
--- nfs-utils-1.2.3/utils/spnfsd/atomicio.c.orig 2010-10-04 15:48:00.079379348 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/atomicio.c 2010-10-04 15:48:00.079379348 -0400
@@ -0,0 +1,63 @@
+/*
+ * Copyright (c) 2002 Marius Aamodt Eriksen <marius@monkey.org>
+ * Copyright (c) 1995,1999 Theo de Raadt. All rights reserved.
+ * All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include <sys/types.h>
+#include <unistd.h>
+#include <errno.h>
+
+#ifdef HAVE_CONFIG_H
+#include "config.h"
+#endif /* HAVE_CONFIG_H */
+
+/*
+ * ensure all of data on socket comes through. f==read || f==write
+ */
+ssize_t
+atomicio(f, fd, _s, n)
+ ssize_t (*f) ();
+ int fd;
+ void *_s;
+ size_t n;
+{
+ char *s = _s;
+ ssize_t res, pos = 0;
+
+ while (n > pos) {
+ res = (f) (fd, s + pos, n - pos);
+ switch (res) {
+ case -1:
+ if (errno == EINTR || errno == EAGAIN)
+ continue;
+ case 0:
+ if (pos != 0)
+ return (pos);
+ return (res);
+ default:
+ pos += res;
+ }
+ }
+ return (pos);
+}
diff -up nfs-utils-1.2.3/utils/spnfsd/cfg.c.orig nfs-utils-1.2.3/utils/spnfsd/cfg.c
--- nfs-utils-1.2.3/utils/spnfsd/cfg.c.orig 2010-10-04 15:48:00.080414616 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/cfg.c 2010-10-04 15:48:00.080414616 -0400
@@ -0,0 +1,893 @@
+/* $OpenBSD: conf.c,v 1.55 2003/06/03 14:28:16 ho Exp $ */
+/* $EOM: conf.c,v 1.48 2000/12/04 02:04:29 angelos Exp $ */
+
+/*
+ * Copyright (c) 1998, 1999, 2000, 2001 Niklas Hallqvist. All rights reserved.
+ * Copyright (c) 2000, 2001, 2002 HÃ¥kan Olsson. All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+/*
+ * This code was written under funding by Ericsson Radio Systems.
+ */
+
+#include <sys/param.h>
+#include <sys/mman.h>
+#include <sys/socket.h>
+#include <sys/stat.h>
+#include <netinet/in.h>
+#include <arpa/inet.h>
+#include <ctype.h>
+#include <fcntl.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <unistd.h>
+#include <errno.h>
+#include <err.h>
+
+#include "cfg.h"
+
+static void conf_load_defaults (int);
+#if 0
+static int conf_find_trans_xf (int, char *);
+#endif
+
+size_t strlcpy(char *, const char *, size_t);
+
+struct conf_trans {
+ TAILQ_ENTRY (conf_trans) link;
+ int trans;
+ enum conf_op { CONF_SET, CONF_REMOVE, CONF_REMOVE_SECTION } op;
+ char *section;
+ char *tag;
+ char *value;
+ int override;
+ int is_default;
+};
+
+TAILQ_HEAD (conf_trans_head, conf_trans) conf_trans_queue;
+
+/*
+ * Radix-64 Encoding.
+ */
+const u_int8_t bin2asc[]
+ = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
+
+const u_int8_t asc2bin[] =
+{
+ 255, 255, 255, 255, 255, 255, 255, 255,
+ 255, 255, 255, 255, 255, 255, 255, 255,
+ 255, 255, 255, 255, 255, 255, 255, 255,
+ 255, 255, 255, 255, 255, 255, 255, 255,
+ 255, 255, 255, 255, 255, 255, 255, 255,
+ 255, 255, 255, 62, 255, 255, 255, 63,
+ 52, 53, 54, 55, 56, 57, 58, 59,
+ 60, 61, 255, 255, 255, 255, 255, 255,
+ 255, 0, 1, 2, 3, 4, 5, 6,
+ 7, 8, 9, 10, 11, 12, 13, 14,
+ 15, 16, 17, 18, 19, 20, 21, 22,
+ 23, 24, 25, 255, 255, 255, 255, 255,
+ 255, 26, 27, 28, 29, 30, 31, 32,
+ 33, 34, 35, 36, 37, 38, 39, 40,
+ 41, 42, 43, 44, 45, 46, 47, 48,
+ 49, 50, 51, 255, 255, 255, 255, 255
+};
+
+struct conf_binding {
+ LIST_ENTRY (conf_binding) link;
+ char *section;
+ char *tag;
+ char *value;
+ int is_default;
+};
+
+char *conf_path;
+LIST_HEAD (conf_bindings, conf_binding) conf_bindings[256];
+
+static char *conf_addr;
+
+static __inline__ u_int8_t
+conf_hash (char *s)
+{
+ u_int8_t hash = 0;
+
+ while (*s)
+ {
+ hash = ((hash << 1) | (hash >> 7)) ^ tolower (*s);
+ s++;
+ }
+ return hash;
+}
+
+/*
+ * Insert a tag-value combination from LINE (the equal sign is at POS)
+ */
+static int
+conf_remove_now (char *section, char *tag)
+{
+ struct conf_binding *cb, *next;
+
+ for (cb = LIST_FIRST (&conf_bindings[conf_hash (section)]); cb; cb = next)
+ {
+ next = LIST_NEXT (cb, link);
+ if (strcasecmp (cb->section, section) == 0
+ && strcasecmp (cb->tag, tag) == 0)
+ {
+ LIST_REMOVE (cb, link);
+ warnx("[%s]:%s->%s removed", section, tag, cb->value);
+ free (cb->section);
+ free (cb->tag);
+ free (cb->value);
+ free (cb);
+ return 0;
+ }
+ }
+ return 1;
+}
+
+static int
+conf_remove_section_now (char *section)
+{
+ struct conf_binding *cb, *next;
+ int unseen = 1;
+
+ for (cb = LIST_FIRST (&conf_bindings[conf_hash (section)]); cb; cb = next)
+ {
+ next = LIST_NEXT (cb, link);
+ if (strcasecmp (cb->section, section) == 0)
+ {
+ unseen = 0;
+ LIST_REMOVE (cb, link);
+ warnx("[%s]:%s->%s removed", section, cb->tag, cb->value);
+ free (cb->section);
+ free (cb->tag);
+ free (cb->value);
+ free (cb);
+ }
+ }
+ return unseen;
+}
+
+/*
+ * Insert a tag-value combination from LINE (the equal sign is at POS)
+ * into SECTION of our configuration database.
+ */
+static int
+conf_set_now (char *section, char *tag, char *value, int override,
+ int is_default)
+{
+ struct conf_binding *node = 0;
+
+ if (override)
+ conf_remove_now (section, tag);
+ else if (conf_get_str (section, tag))
+ {
+ if (!is_default)
+ warnx("conf_set: duplicate tag [%s]:%s, ignoring...\n", section, tag);
+ return 1;
+ }
+
+ node = calloc (1, sizeof *node);
+ if (!node)
+ {
+ warnx("conf_set: calloc (1, %lu) failed", (unsigned long)sizeof *node);
+ return 1;
+ }
+ node->section = strdup (section);
+ node->tag = strdup (tag);
+ node->value = strdup (value);
+ node->is_default = is_default;
+
+ LIST_INSERT_HEAD (&conf_bindings[conf_hash (section)], node, link);
+ return 0;
+}
+
+/*
+ * Parse the line LINE of SZ bytes. Skip Comments, recognize section
+ * headers and feed tag-value pairs into our configuration database.
+ */
+static void
+conf_parse_line (int trans, char *line, size_t sz)
+{
+ char *val;
+ size_t i;
+ int j;
+ static char *section = 0;
+ static int ln = 0;
+
+ ln++;
+
+ /* Lines starting with '#' or ';' are comments. */
+ if (*line == '#' || *line == ';')
+ return;
+
+ /* '[section]' parsing... */
+ if (*line == '[')
+ {
+ for (i = 1; i < sz; i++)
+ if (line[i] == ']')
+ break;
+ if (section)
+ free (section);
+ if (i == sz)
+ {
+ warnx("conf_parse_line: %d:"
+ "non-matched ']', ignoring until next section", ln);
+ section = 0;
+ return;
+ }
+ section = malloc (i);
+ if (!section)
+ {
+ warnx("conf_parse_line: %d: malloc (%lu) failed", ln,
+ (unsigned long)i);
+ return;
+ }
+ strlcpy (section, line + 1, i);
+ return;
+ }
+
+ /* Deal with assignments. */
+ for (i = 0; i < sz; i++)
+ if (line[i] == '=')
+ {
+ /* If no section, we are ignoring the lines. */
+ if (!section)
+ {
+ warnx("conf_parse_line: %d: ignoring line due to no section", ln);
+ return;
+ }
+ line[strcspn (line, " \t=")] = '\0';
+ val = line + i + 1 + strspn (line + i + 1, " \t");
+ /* Skip trailing whitespace, if any */
+ for (j = sz - (val - line) - 1; j > 0 && isspace (val[j]); j--)
+ val[j] = '\0';
+ /* XXX Perhaps should we not ignore errors? */
+ conf_set (trans, section, line, val, 0, 0);
+ return;
+ }
+
+ /* Other non-empty lines are weird. */
+ i = strspn (line, " \t");
+ if (line[i])
+ warnx("conf_parse_line: %d: syntax error", ln);
+
+ return;
+}
+
+/* Parse the mapped configuration file. */
+static void
+conf_parse (int trans, char *buf, size_t sz)
+{
+ char *cp = buf;
+ char *bufend = buf + sz;
+ char *line;
+
+ line = cp;
+ while (cp < bufend)
+ {
+ if (*cp == '\n')
+ {
+ /* Check for escaped newlines. */
+ if (cp > buf && *(cp - 1) == '\\')
+ *(cp - 1) = *cp = ' ';
+ else
+ {
+ *cp = '\0';
+ conf_parse_line (trans, line, cp - line);
+ line = cp + 1;
+ }
+ }
+ cp++;
+ }
+ if (cp != line)
+ warnx("conf_parse: last line non-terminated, ignored.");
+}
+
+static void
+conf_load_defaults (int tr)
+{
+ /* No defaults */
+ return;
+}
+
+void
+conf_init (void)
+{
+ unsigned int i;
+
+ for (i = 0; i < sizeof conf_bindings / sizeof conf_bindings[0]; i++)
+ LIST_INIT (&conf_bindings[i]);
+ TAILQ_INIT (&conf_trans_queue);
+ conf_reinit ();
+}
+
+/* Open the config file and map it into our address space, then parse it. */
+void
+conf_reinit (void)
+{
+ struct conf_binding *cb = 0;
+ int fd, trans;
+ unsigned int i;
+ size_t sz;
+ char *new_conf_addr = 0;
+ struct stat sb;
+
+ if ((stat (conf_path, &sb) == 0) || (errno != ENOENT))
+ {
+ sz = sb.st_size;
+ fd = open (conf_path, O_RDONLY, 0);
+ if (fd == -1)
+ {
+ warnx("conf_reinit: open (\"%s\", O_RDONLY) failed", conf_path);
+ return;
+ }
+
+ new_conf_addr = malloc (sz);
+ if (!new_conf_addr)
+ {
+ warnx("conf_reinit: malloc (%lu) failed", (unsigned long)sz);
+ goto fail;
+ }
+
+ /* XXX I assume short reads won't happen here. */
+ if (read (fd, new_conf_addr, sz) != (int)sz)
+ {
+ warnx("conf_reinit: read (%d, %p, %lu) failed",
+ fd, new_conf_addr, (unsigned long)sz);
+ goto fail;
+ }
+ close (fd);
+
+ trans = conf_begin ();
+
+ /* XXX Should we not care about errors and rollback? */
+ conf_parse (trans, new_conf_addr, sz);
+ }
+ else
+ trans = conf_begin ();
+
+ /* Load default configuration values. */
+ conf_load_defaults (trans);
+
+ /* Free potential existing configuration. */
+ if (conf_addr)
+ {
+ for (i = 0; i < sizeof conf_bindings / sizeof conf_bindings[0]; i++)
+ for (cb = LIST_FIRST (&conf_bindings[i]); cb;
+ cb = LIST_FIRST (&conf_bindings[i]))
+ conf_remove_now (cb->section, cb->tag);
+ free (conf_addr);
+ }
+
+ conf_end (trans, 1);
+ conf_addr = new_conf_addr;
+ return;
+
+ fail:
+ if (new_conf_addr)
+ free (new_conf_addr);
+ close (fd);
+}
+
+/*
+ * Return the numeric value denoted by TAG in section SECTION or DEF
+ * if that tag does not exist.
+ */
+int
+conf_get_num (char *section, char *tag, int def)
+{
+ char *value = conf_get_str (section, tag);
+
+ if (value)
+ return atoi (value);
+ return def;
+}
+
+/* Validate X according to the range denoted by TAG in section SECTION. */
+int
+conf_match_num (char *section, char *tag, int x)
+{
+ char *value = conf_get_str (section, tag);
+ int val, min, max, n;
+
+ if (!value)
+ return 0;
+ n = sscanf (value, "%d,%d:%d", &val, &min, &max);
+ switch (n)
+ {
+ case 1:
+ warnx("conf_match_num: %s:%s %d==%d?", section, tag, val, x);
+ return x == val;
+ case 3:
+ warnx("conf_match_num: %s:%s %d<=%d<=%d?", section, tag, min, x, max);
+ return min <= x && max >= x;
+ default:
+ warnx("conf_match_num: section %s tag %s: invalid number spec %s",
+ section, tag, value);
+ }
+ return 0;
+}
+
+/* Return the string value denoted by TAG in section SECTION. */
+char *
+conf_get_str (char *section, char *tag)
+{
+ struct conf_binding *cb;
+
+ for (cb = LIST_FIRST (&conf_bindings[conf_hash (section)]); cb;
+ cb = LIST_NEXT (cb, link))
+ if (strcasecmp (section, cb->section) == 0
+ && strcasecmp (tag, cb->tag) == 0)
+ {
+ return cb->value;
+ }
+ return 0;
+}
+
+/*
+ * Build a list of string values out of the comma separated value denoted by
+ * TAG in SECTION.
+ */
+struct conf_list *
+conf_get_list (char *section, char *tag)
+{
+ char *liststr = 0, *p, *field, *t;
+ struct conf_list *list = 0;
+ struct conf_list_node *node;
+
+ list = malloc (sizeof *list);
+ if (!list)
+ goto cleanup;
+ TAILQ_INIT (&list->fields);
+ list->cnt = 0;
+ liststr = conf_get_str (section, tag);
+ if (!liststr)
+ goto cleanup;
+ liststr = strdup (liststr);
+ if (!liststr)
+ goto cleanup;
+ p = liststr;
+ while ((field = strsep (&p, ",")) != NULL)
+ {
+ /* Skip leading whitespace */
+ while (isspace (*field))
+ field++;
+ /* Skip trailing whitespace */
+ if (p)
+ for (t = p - 1; t > field && isspace (*t); t--)
+ *t = '\0';
+ if (*field == '\0')
+ {
+ warnx("conf_get_list: empty field, ignoring...");
+ continue;
+ }
+ list->cnt++;
+ node = calloc (1, sizeof *node);
+ if (!node)
+ goto cleanup;
+ node->field = strdup (field);
+ if (!node->field) {
+ free(node);
+ goto cleanup;
+ }
+ TAILQ_INSERT_TAIL (&list->fields, node, link);
+ }
+ free (liststr);
+ return list;
+
+ cleanup:
+ if (list)
+ conf_free_list (list);
+ if (liststr)
+ free (liststr);
+ return 0;
+}
+
+struct conf_list *
+conf_get_tag_list (char *section)
+{
+ struct conf_list *list = 0;
+ struct conf_list_node *node;
+ struct conf_binding *cb;
+
+ list = malloc (sizeof *list);
+ if (!list)
+ goto cleanup;
+ TAILQ_INIT (&list->fields);
+ list->cnt = 0;
+ for (cb = LIST_FIRST (&conf_bindings[conf_hash (section)]); cb;
+ cb = LIST_NEXT (cb, link))
+ if (strcasecmp (section, cb->section) == 0)
+ {
+ list->cnt++;
+ node = calloc (1, sizeof *node);
+ if (!node)
+ goto cleanup;
+ node->field = strdup (cb->tag);
+ if (!node->field) {
+ free(node);
+ goto cleanup;
+ }
+ TAILQ_INSERT_TAIL (&list->fields, node, link);
+ }
+ return list;
+
+ cleanup:
+ if (list)
+ conf_free_list (list);
+ return 0;
+}
+
+/* Decode a PEM encoded buffer. */
+int
+conf_decode_base64 (u_int8_t *out, u_int32_t *len, u_char *buf)
+{
+ u_int32_t c = 0;
+ u_int8_t c1, c2, c3, c4;
+
+ while (*buf)
+ {
+ if (*buf > 127 || (c1 = asc2bin[*buf]) == 255)
+ return 0;
+ buf++;
+
+ if (*buf > 127 || (c2 = asc2bin[*buf]) == 255)
+ return 0;
+ buf++;
+
+ if (*buf == '=')
+ {
+ c3 = c4 = 0;
+ c++;
+
+ /* Check last four bit */
+ if (c2 & 0xF)
+ return 0;
+
+ if (strcmp ((char *)buf, "==") == 0)
+ buf++;
+ else
+ return 0;
+ }
+ else if (*buf > 127 || (c3 = asc2bin[*buf]) == 255)
+ return 0;
+ else
+ {
+ if (*++buf == '=')
+ {
+ c4 = 0;
+ c += 2;
+
+ /* Check last two bit */
+ if (c3 & 3)
+ return 0;
+
+ if (strcmp ((char *)buf, "="))
+ return 0;
+
+ }
+ else if (*buf > 127 || (c4 = asc2bin[*buf]) == 255)
+ return 0;
+ else
+ c += 3;
+ }
+
+ buf++;
+ *out++ = (c1 << 2) | (c2 >> 4);
+ *out++ = (c2 << 4) | (c3 >> 2);
+ *out++ = (c3 << 6) | c4;
+ }
+
+ *len = c;
+ return 1;
+
+}
+
+void
+conf_free_list (struct conf_list *list)
+{
+ struct conf_list_node *node = TAILQ_FIRST (&list->fields);
+
+ while (node)
+ {
+ TAILQ_REMOVE (&list->fields, node, link);
+ if (node->field)
+ free (node->field);
+ free (node);
+ node = TAILQ_FIRST (&list->fields);
+ }
+ free (list);
+}
+
+int
+conf_begin (void)
+{
+ static int seq = 0;
+
+ return ++seq;
+}
+
+static struct conf_trans *
+conf_trans_node (int transaction, enum conf_op op)
+{
+ struct conf_trans *node;
+
+ node = calloc (1, sizeof *node);
+ if (!node)
+ {
+ warnx("conf_trans_node: calloc (1, %lu) failed",
+ (unsigned long)sizeof *node);
+ return 0;
+ }
+ node->trans = transaction;
+ node->op = op;
+ TAILQ_INSERT_TAIL (&conf_trans_queue, node, link);
+ return node;
+}
+
+/* Queue a set operation. */
+int
+conf_set (int transaction, char *section, char *tag, char *value, int override,
+ int is_default)
+{
+ struct conf_trans *node;
+
+ node = conf_trans_node (transaction, CONF_SET);
+ if (!node)
+ return 1;
+ node->section = strdup (section);
+ if (!node->section)
+ {
+ warnx("conf_set: strdup (\"%s\") failed", section);
+ goto fail;
+ }
+ node->tag = strdup (tag);
+ if (!node->tag)
+ {
+ warnx("conf_set: strdup (\"%s\") failed", tag);
+ goto fail;
+ }
+ node->value = strdup (value);
+ if (!node->value)
+ {
+ warnx("conf_set: strdup (\"%s\") failed", value);
+ goto fail;
+ }
+ node->override = override;
+ node->is_default = is_default;
+ return 0;
+
+ fail:
+ if (node->tag)
+ free (node->tag);
+ if (node->section)
+ free (node->section);
+ if (node)
+ free (node);
+ return 1;
+}
+
+/* Queue a remove operation. */
+int
+conf_remove (int transaction, char *section, char *tag)
+{
+ struct conf_trans *node;
+
+ node = conf_trans_node (transaction, CONF_REMOVE);
+ if (!node)
+ goto fail;
+ node->section = strdup (section);
+ if (!node->section)
+ {
+ warnx("conf_remove: strdup (\"%s\") failed", section);
+ goto fail;
+ }
+ node->tag = strdup (tag);
+ if (!node->tag)
+ {
+ warnx("conf_remove: strdup (\"%s\") failed", tag);
+ goto fail;
+ }
+ return 0;
+
+ fail:
+ if (node && node->section)
+ free (node->section);
+ if (node)
+ free (node);
+ return 1;
+}
+
+/* Queue a remove section operation. */
+int
+conf_remove_section (int transaction, char *section)
+{
+ struct conf_trans *node;
+
+ node = conf_trans_node (transaction, CONF_REMOVE_SECTION);
+ if (!node)
+ goto fail;
+ node->section = strdup (section);
+ if (!node->section)
+ {
+ warnx("conf_remove_section: strdup (\"%s\") failed", section);
+ goto fail;
+ }
+ return 0;
+
+ fail:
+ if (node)
+ free (node);
+ return 1;
+}
+
+/* Execute all queued operations for this transaction. Cleanup. */
+int
+conf_end (int transaction, int commit)
+{
+ struct conf_trans *node, *next;
+
+ for (node = TAILQ_FIRST (&conf_trans_queue); node; node = next)
+ {
+ next = TAILQ_NEXT (node, link);
+ if (node->trans == transaction)
+ {
+ if (commit)
+ switch (node->op)
+ {
+ case CONF_SET:
+ conf_set_now (node->section, node->tag, node->value,
+ node->override, node->is_default);
+ break;
+ case CONF_REMOVE:
+ conf_remove_now (node->section, node->tag);
+ break;
+ case CONF_REMOVE_SECTION:
+ conf_remove_section_now (node->section);
+ break;
+ default:
+ warnx("conf_end: unknown operation: %d", node->op);
+ }
+ TAILQ_REMOVE (&conf_trans_queue, node, link);
+ if (node->section)
+ free (node->section);
+ if (node->tag)
+ free (node->tag);
+ if (node->value)
+ free (node->value);
+ free (node);
+ }
+ }
+ return 0;
+}
+
+/*
+ * Dump running configuration upon SIGUSR1.
+ * Configuration is "stored in reverse order", so reverse it again.
+ */
+struct dumper {
+ char *s, *v;
+ struct dumper *next;
+};
+
+static void
+conf_report_dump (struct dumper *node)
+{
+ /* Recursive, cleanup when we're done. */
+
+ if (node->next)
+ conf_report_dump (node->next);
+
+ if (node->v)
+ warnx("%s=\t%s", node->s, node->v);
+ else if (node->s)
+ {
+ warnx("%s", node->s);
+ if (strlen (node->s) > 0)
+ free (node->s);
+ }
+
+ free (node);
+}
+
+void
+conf_report (void)
+{
+ struct conf_binding *cb, *last = 0;
+ unsigned int i, len;
+ char *current_section = (char *)0;
+ struct dumper *dumper, *dnode;
+
+ dumper = dnode = (struct dumper *)calloc (1, sizeof *dumper);
+ if (!dumper)
+ goto mem_fail;
+
+ warnx("conf_report: dumping running configuration");
+
+ for (i = 0; i < sizeof conf_bindings / sizeof conf_bindings[0]; i++)
+ for (cb = LIST_FIRST (&conf_bindings[i]); cb;
+ cb = LIST_NEXT (cb, link))
+ {
+ if (!cb->is_default)
+ {
+ /* Dump this entry. */
+ if (!current_section || strcmp (cb->section, current_section))
+ {
+ if (current_section)
+ {
+ len = strlen (current_section) + 3;
+ dnode->s = malloc (len);
+ if (!dnode->s)
+ goto mem_fail;
+
+ snprintf (dnode->s, len, "[%s]", current_section);
+ dnode->next
+ = (struct dumper *)calloc (1, sizeof (struct dumper));
+ dnode = dnode->next;
+ if (!dnode)
+ goto mem_fail;
+
+ dnode->s = "";
+ dnode->next
+ = (struct dumper *)calloc (1, sizeof (struct dumper));
+ dnode = dnode->next;
+ if (!dnode)
+ goto mem_fail;
+ }
+ current_section = cb->section;
+ }
+ dnode->s = cb->tag;
+ dnode->v = cb->value;
+ dnode->next = (struct dumper *)calloc (1, sizeof (struct dumper));
+ dnode = dnode->next;
+ if (!dnode)
+ goto mem_fail;
+ last = cb;
+ }
+ }
+
+ if (last)
+ {
+ len = strlen (last->section) + 3;
+ dnode->s = malloc (len);
+ if (!dnode->s)
+ goto mem_fail;
+ snprintf (dnode->s, len, "[%s]", last->section);
+ }
+
+ conf_report_dump (dumper);
+
+ return;
+
+ mem_fail:
+ warnx("conf_report: malloc/calloc failed");
+ while ((dnode = dumper) != 0)
+ {
+ dumper = dumper->next;
+ if (dnode->s)
+ free (dnode->s);
+ free (dnode);
+ }
+ return;
+}
diff -up nfs-utils-1.2.3/utils/spnfsd/cfg.h.orig nfs-utils-1.2.3/utils/spnfsd/cfg.h
--- nfs-utils-1.2.3/utils/spnfsd/cfg.h.orig 2010-10-04 15:48:00.080414616 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/cfg.h 2010-10-04 15:48:00.080414616 -0400
@@ -0,0 +1,67 @@
+/* $OpenBSD: conf.h,v 1.30 2004/06/25 20:25:34 hshoexer Exp $ */
+/* $EOM: conf.h,v 1.13 2000/09/18 00:01:47 ho Exp $ */
+
+/*
+ * Copyright (c) 1998, 1999, 2001 Niklas Hallqvist. All rights reserved.
+ * Copyright (c) 2000, 2003 HÃ¥kan Olsson. All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+/*
+ * This code was written under funding by Ericsson Radio Systems.
+ */
+
+#ifndef _CONF_H_
+#define _CONF_H_
+
+#include "queue.h"
+
+struct conf_list_node {
+ TAILQ_ENTRY(conf_list_node) link;
+ char *field;
+};
+
+struct conf_list {
+ size_t cnt;
+ TAILQ_HEAD(conf_list_fields_head, conf_list_node) fields;
+};
+
+extern char *conf_path;
+
+extern int conf_begin(void);
+extern int conf_decode_base64(u_int8_t *, u_int32_t *, u_char *);
+extern int conf_end(int, int);
+extern void conf_free_list(struct conf_list *);
+extern struct sockaddr *conf_get_address(char *, char *);
+extern struct conf_list *conf_get_list(char *, char *);
+extern struct conf_list *conf_get_tag_list(char *);
+extern int conf_get_num(char *, char *, int);
+extern char *conf_get_str(char *, char *);
+extern void conf_init(void);
+extern int conf_match_num(char *, char *, int);
+extern void conf_reinit(void);
+extern int conf_remove(int, char *, char *);
+extern int conf_remove_section(int, char *);
+extern int conf_set(int, char *, char *, char *, int, int);
+extern void conf_report(void);
+
+#endif /* _CONF_H_ */
diff -up nfs-utils-1.2.3/utils/spnfsd/Makefile.am.orig nfs-utils-1.2.3/utils/spnfsd/Makefile.am
--- nfs-utils-1.2.3/utils/spnfsd/Makefile.am.orig 2010-10-04 15:48:00.078357497 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/Makefile.am 2010-10-04 15:48:00.078357497 -0400
@@ -0,0 +1,30 @@
+## Process this file with automake to produce Makefile.in
+
+man5_MANS =
+man8_MANS =
+
+RPCPREFIX =
+KPREFIX = @kprefix@
+sbin_PROGRAMS = spnfsd
+
+EXTRA_DIST = \
+ $(man5_MANS) \
+ $(man8_MANS) \
+ spnfsd.conf
+
+spnfsd_SOURCES = \
+ atomicio.c \
+ spnfsd_ops.c \
+ cfg.c \
+ spnfsd.c \
+ strlcat.c \
+ strlcpy.c \
+ \
+ cfg.h \
+ spnfsd.h \
+ spnfsd_queue.h \
+ queue.h
+
+spnfsd_LDADD = -levent ../../support/nfs/libnfs.a
+
+MAINTAINERCLEANFILES = Makefile.in
diff -up nfs-utils-1.2.3/utils/spnfsd/makestatic.orig nfs-utils-1.2.3/utils/spnfsd/makestatic
--- nfs-utils-1.2.3/utils/spnfsd/makestatic.orig 2010-10-04 15:48:00.081429548 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/makestatic 2010-10-04 15:48:00.081429548 -0400
@@ -0,0 +1,23 @@
+/******************************************************************************
+
+(c) 2007 Network Appliance, Inc. All Rights Reserved.
+
+Network Appliance provides this source code under the GPL v2 License.
+The GPL v2 license is available at
+http://opensource.org/licenses/gpl-license.php.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
+CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
+EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
+PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
+LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
+NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+******************************************************************************/
+
+gcc -static -Wall -pipe -g -O2 -o spnfsd atomicio.o spnfsd_ops.o cfg.o spnfsd.o strlcat.o strlcpy.o /usr/lib/libevent.a ../../support/nfs/libnfs.a
diff -up nfs-utils-1.2.3/utils/spnfsd/nfsd4_spnfs.h.orig nfs-utils-1.2.3/utils/spnfsd/nfsd4_spnfs.h
--- nfs-utils-1.2.3/utils/spnfsd/nfsd4_spnfs.h.orig 2010-10-04 15:48:00.081429548 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/nfsd4_spnfs.h 2010-10-04 15:48:00.081429548 -0400
@@ -0,0 +1,334 @@
+/*
+ * include/linux/nfsd4_spnfs.h
+ *
+ * spNFS - simple pNFS implementation with userspace daemon
+ *
+ */
+
+/******************************************************************************
+
+(c) 2007 Network Appliance, Inc. All Rights Reserved.
+
+Network Appliance provides this source code under the GPL v2 License.
+The GPL v2 license is available at
+http://opensource.org/licenses/gpl-license.php.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
+CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
+EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
+PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
+LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
+NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+******************************************************************************/
+
+#ifndef NFS_SPNFS_H
+#define NFS_SPNFS_H
+
+
+#ifdef __KERNEL__
+#include "exportfs.h"
+#include "sunrpc/svc.h"
+#include "nfsd/nfsfh.h"
+#else
+#include <sys/types.h>
+#endif /* __KERNEL__ */
+
+#define SPNFS_STATUS_INVALIDMSG 0x01
+#define SPNFS_STATUS_AGAIN 0x02
+#define SPNFS_STATUS_FAIL 0x04
+#define SPNFS_STATUS_SUCCESS 0x08
+
+#define SPNFS_TYPE_LAYOUTGET 0x01
+#define SPNFS_TYPE_LAYOUTCOMMIT 0x02
+#define SPNFS_TYPE_LAYOUTRETURN 0x03
+#define SPNFS_TYPE_GETDEVICEITER 0x04
+#define SPNFS_TYPE_GETDEVICEINFO 0x05
+#define SPNFS_TYPE_SETATTR 0x06
+#define SPNFS_TYPE_OPEN 0x07
+#define SPNFS_TYPE_CLOSE 0x08
+#define SPNFS_TYPE_CREATE 0x09
+#define SPNFS_TYPE_REMOVE 0x0a
+#define SPNFS_TYPE_COMMIT 0x0b
+#define SPNFS_TYPE_READ 0x0c
+#define SPNFS_TYPE_WRITE 0x0d
+
+#define SPNFS_MAX_DEVICES 1
+#define SPNFS_MAX_DATA_SERVERS 16
+#define SPNFS_MAX_IO 512
+
+/* layout */
+struct spnfs_msg_layoutget_args {
+ unsigned long inode;
+ unsigned long generation;
+};
+
+struct spnfs_filelayout_list {
+ u_int32_t fh_len;
+ unsigned char fh_val[128]; /* DMXXX fix this const */
+};
+
+struct spnfs_msg_layoutget_res {
+ int status;
+ u_int64_t devid;
+ u_int64_t stripe_size;
+ u_int32_t stripe_type;
+ u_int32_t stripe_count;
+ struct spnfs_filelayout_list flist[SPNFS_MAX_DATA_SERVERS];
+};
+
+/* layoutcommit */
+struct spnfs_msg_layoutcommit_args {
+ unsigned long inode;
+ unsigned long generation;
+ u_int64_t file_size;
+};
+
+struct spnfs_msg_layoutcommit_res {
+ int status;
+};
+
+/* layoutreturn */
+/* No op for the daemon */
+/*
+struct spnfs_msg_layoutreturn_args {
+};
+
+struct spnfs_msg_layoutreturn_res {
+};
+*/
+
+/* getdeviceiter */
+struct spnfs_msg_getdeviceiter_args {
+ unsigned long inode;
+ u_int64_t cookie;
+ u_int64_t verf;
+};
+
+struct spnfs_msg_getdeviceiter_res {
+ int status;
+ u_int64_t devid;
+ u_int64_t cookie;
+ u_int64_t verf;
+ u_int32_t eof;
+};
+
+/* getdeviceinfo */
+struct spnfs_data_server {
+ u_int32_t dsid;
+ char netid[5];
+ char addr[29];
+};
+
+struct spnfs_device {
+ u_int64_t devid;
+ int dscount;
+ struct spnfs_data_server dslist[SPNFS_MAX_DATA_SERVERS];
+};
+
+struct spnfs_msg_getdeviceinfo_args {
+ u_int64_t devid;
+};
+
+struct spnfs_msg_getdeviceinfo_res {
+ int status;
+ struct spnfs_device devinfo;
+};
+
+/* setattr */
+struct spnfs_msg_setattr_args {
+ unsigned long inode;
+ unsigned long generation;
+ int file_size;
+};
+
+struct spnfs_msg_setattr_res {
+ int status;
+};
+
+/* open */
+struct spnfs_msg_open_args {
+ unsigned long inode;
+ unsigned long generation;
+ int create;
+ int createmode;
+ int truncate;
+};
+
+struct spnfs_msg_open_res {
+ int status;
+};
+
+/* close */
+/* No op for daemon */
+struct spnfs_msg_close_args {
+ int x;
+};
+
+struct spnfs_msg_close_res {
+ int y;
+};
+
+/* create */
+/*
+struct spnfs_msg_create_args {
+ int x;
+};
+
+struct spnfs_msg_create_res {
+ int y;
+};
+*/
+
+/* remove */
+struct spnfs_msg_remove_args {
+ unsigned long inode;
+ unsigned long generation;
+};
+
+struct spnfs_msg_remove_res {
+ int status;
+};
+
+/* commit */
+/*
+struct spnfs_msg_commit_args {
+ int x;
+};
+
+struct spnfs_msg_commit_res {
+ int y;
+};
+*/
+
+/* read */
+struct spnfs_msg_read_args {
+ unsigned long inode;
+ unsigned long generation;
+ loff_t offset;
+ unsigned long len;
+};
+
+struct spnfs_msg_read_res {
+ int status;
+ char data[SPNFS_MAX_IO];
+};
+
+/* write */
+struct spnfs_msg_write_args {
+ unsigned long inode;
+ unsigned long generation;
+ loff_t offset;
+ unsigned long len;
+ char data[SPNFS_MAX_IO];
+};
+
+struct spnfs_msg_write_res {
+ int status;
+};
+
+/* bundle args and responses */
+union spnfs_msg_args {
+ struct spnfs_msg_layoutget_args layoutget_args;
+ struct spnfs_msg_layoutcommit_args layoutcommit_args;
+/*
+ struct spnfs_msg_layoutreturn_args layoutreturn_args;
+*/
+ struct spnfs_msg_getdeviceiter_args getdeviceiter_args;
+ struct spnfs_msg_getdeviceinfo_args getdeviceinfo_args;
+ struct spnfs_msg_setattr_args setattr_args;
+ struct spnfs_msg_open_args open_args;
+ struct spnfs_msg_close_args close_args;
+/*
+ struct spnfs_msg_create_args create_args;
+*/
+ struct spnfs_msg_remove_args remove_args;
+/*
+ struct spnfs_msg_commit_args commit_args;
+*/
+ struct spnfs_msg_read_args read_args;
+ struct spnfs_msg_write_args write_args;
+};
+
+union spnfs_msg_res {
+ struct spnfs_msg_layoutget_res layoutget_res;
+ struct spnfs_msg_layoutcommit_res layoutcommit_res;
+/*
+ struct spnfs_msg_layoutreturn_res layoutreturn_res;
+*/
+ struct spnfs_msg_getdeviceiter_res getdeviceiter_res;
+ struct spnfs_msg_getdeviceinfo_res getdeviceinfo_res;
+ struct spnfs_msg_setattr_res setattr_res;
+ struct spnfs_msg_open_res open_res;
+ struct spnfs_msg_close_res close_res;
+/*
+ struct spnfs_msg_create_res create_res;
+*/
+ struct spnfs_msg_remove_res remove_res;
+/*
+ struct spnfs_msg_commit_res commit_res;
+*/
+ struct spnfs_msg_read_res read_res;
+ struct spnfs_msg_write_res write_res;
+};
+
+/* a spnfs message, args and response */
+struct spnfs_msg {
+ unsigned char im_type;
+ unsigned char im_status;
+ union spnfs_msg_args im_args;
+ union spnfs_msg_res im_res;
+};
+
+/* spnfs configuration info */
+struct spnfs_config {
+ unsigned char dense_striping;
+ int stripe_size;
+ int num_ds;
+ char ds_dir[SPNFS_MAX_DATA_SERVERS][80]; /* XXX */
+};
+
+#ifdef __KERNEL__
+
+/* pipe mgmt structure. messages flow through here */
+struct spnfs {
+ char spnfs_path[48]; /* path to pipe */
+ struct dentry *spnfs_dentry; /* dentry for pipe */
+ wait_queue_head_t spnfs_wq;
+ struct spnfs_msg spnfs_im; /* spnfs message */
+ struct mutex spnfs_lock; /* Serializes upcalls */
+ struct mutex spnfs_plock;
+};
+
+int spnfs_layout_type(void);
+int spnfs_layoutget(struct inode *, struct pnfs_layoutget_arg *);
+int spnfs_layoutcommit(void);
+int spnfs_layoutreturn(struct inode *, void *);
+int spnfs_getdeviceiter(struct super_block *, struct pnfs_deviter_arg *);
+int spnfs_getdeviceinfo(struct super_block *, struct pnfs_devinfo_arg *);
+int spnfs_setattr(void);
+int spnfs_open(struct inode *, void *);
+int spnfs_close(struct inode *);
+int spnfs_get_state(struct inode *, void *, void *);
+int spnfs_remove(unsigned long, unsigned long);
+int spnfs_read(struct inode *, loff_t, unsigned long *, int, struct svc_rqst *);
+int spnfs_write(struct inode *, loff_t, size_t, int, struct svc_rqst *);
+int spnfs_getfh(int, struct nfs_fh *);
+int spnfs_test_layoutrecall(char *);
+int spnfs_layoutrecall(struct inode *, int);
+
+int nfsd_spnfs_new(void);
+void nfsd_spnfs_delete(void);
+int spnfs_upcall(struct spnfs *, struct spnfs_msg *, union spnfs_msg_res *);
+int spnfs_enabled(void);
+int nfs4_spnfs_propagate_open(struct super_block *, struct svc_fh *, void *);
+int spnfs_init_proc(void);
+
+#endif /* __KERNEL__ */
+
+#endif /* NFS_SPNFS_H */
diff -up nfs-utils-1.2.3/utils/spnfsd/queue.h.orig nfs-utils-1.2.3/utils/spnfsd/queue.h
--- nfs-utils-1.2.3/utils/spnfsd/queue.h.orig 2010-10-04 15:48:00.082454595 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/queue.h 2010-10-04 15:48:00.082454595 -0400
@@ -0,0 +1,499 @@
+/* $OpenBSD: queue.h,v 1.22 2001/06/23 04:39:35 angelos Exp $ */
+/* $NetBSD: queue.h,v 1.11 1996/05/16 05:17:14 mycroft Exp $ */
+
+/*
+ * Copyright (c) 1991, 1993
+ * The Regents of the University of California. All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ * 3. Neither the name of the University nor the names of its contributors
+ * may be used to endorse or promote products derived from this software
+ * without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ *
+ * @(#)queue.h 8.5 (Berkeley) 8/20/94
+ */
+
+#ifndef _SYS_QUEUE_H_
+#define _SYS_QUEUE_H_
+
+/*
+ * This file defines five types of data structures: singly-linked lists,
+ * lists, simple queues, tail queues, and circular queues.
+ *
+ *
+ * A singly-linked list is headed by a single forward pointer. The elements
+ * are singly linked for minimum space and pointer manipulation overhead at
+ * the expense of O(n) removal for arbitrary elements. New elements can be
+ * added to the list after an existing element or at the head of the list.
+ * Elements being removed from the head of the list should use the explicit
+ * macro for this purpose for optimum efficiency. A singly-linked list may
+ * only be traversed in the forward direction. Singly-linked lists are ideal
+ * for applications with large datasets and few or no removals or for
+ * implementing a LIFO queue.
+ *
+ * A list is headed by a single forward pointer (or an array of forward
+ * pointers for a hash table header). The elements are doubly linked
+ * so that an arbitrary element can be removed without a need to
+ * traverse the list. New elements can be added to the list before
+ * or after an existing element or at the head of the list. A list
+ * may only be traversed in the forward direction.
+ *
+ * A simple queue is headed by a pair of pointers, one the head of the
+ * list and the other to the tail of the list. The elements are singly
+ * linked to save space, so elements can only be removed from the
+ * head of the list. New elements can be added to the list before or after
+ * an existing element, at the head of the list, or at the end of the
+ * list. A simple queue may only be traversed in the forward direction.
+ *
+ * A tail queue is headed by a pair of pointers, one to the head of the
+ * list and the other to the tail of the list. The elements are doubly
+ * linked so that an arbitrary element can be removed without a need to
+ * traverse the list. New elements can be added to the list before or
+ * after an existing element, at the head of the list, or at the end of
+ * the list. A tail queue may be traversed in either direction.
+ *
+ * A circle queue is headed by a pair of pointers, one to the head of the
+ * list and the other to the tail of the list. The elements are doubly
+ * linked so that an arbitrary element can be removed without a need to
+ * traverse the list. New elements can be added to the list before or after
+ * an existing element, at the head of the list, or at the end of the list.
+ * A circle queue may be traversed in either direction, but has a more
+ * complex end of list detection.
+ *
+ * For details on the use of these macros, see the queue(3) manual page.
+ */
+
+/*
+ * Singly-linked List definitions.
+ */
+#define SLIST_HEAD(name, type) \
+struct name { \
+ struct type *slh_first; /* first element */ \
+}
+
+#define SLIST_HEAD_INITIALIZER(head) \
+ { NULL }
+
+#define SLIST_ENTRY(type) \
+struct { \
+ struct type *sle_next; /* next element */ \
+}
+
+/*
+ * Singly-linked List access methods.
+ */
+#define SLIST_FIRST(head) ((head)->slh_first)
+#define SLIST_END(head) NULL
+#define SLIST_EMPTY(head) (SLIST_FIRST(head) == SLIST_END(head))
+#define SLIST_NEXT(elm, field) ((elm)->field.sle_next)
+
+#define SLIST_FOREACH(var, head, field) \
+ for((var) = SLIST_FIRST(head); \
+ (var) != SLIST_END(head); \
+ (var) = SLIST_NEXT(var, field))
+
+/*
+ * Singly-linked List functions.
+ */
+#define SLIST_INIT(head) { \
+ SLIST_FIRST(head) = SLIST_END(head); \
+}
+
+#define SLIST_INSERT_AFTER(slistelm, elm, field) do { \
+ (elm)->field.sle_next = (slistelm)->field.sle_next; \
+ (slistelm)->field.sle_next = (elm); \
+} while (0)
+
+#define SLIST_INSERT_HEAD(head, elm, field) do { \
+ (elm)->field.sle_next = (head)->slh_first; \
+ (head)->slh_first = (elm); \
+} while (0)
+
+#define SLIST_REMOVE_HEAD(head, field) do { \
+ (head)->slh_first = (head)->slh_first->field.sle_next; \
+} while (0)
+
+#define SLIST_REMOVE(head, elm, type, field) do { \
+ if ((head)->slh_first == (elm)) { \
+ SLIST_REMOVE_HEAD((head), field); \
+ } \
+ else { \
+ struct type *curelm = (head)->slh_first; \
+ while( curelm->field.sle_next != (elm) ) \
+ curelm = curelm->field.sle_next; \
+ curelm->field.sle_next = \
+ curelm->field.sle_next->field.sle_next; \
+ } \
+} while (0)
+
+/*
+ * List definitions.
+ */
+#define LIST_HEAD(name, type) \
+struct name { \
+ struct type *lh_first; /* first element */ \
+}
+
+#define LIST_HEAD_INITIALIZER(head) \
+ { NULL }
+
+#define LIST_ENTRY(type) \
+struct { \
+ struct type *le_next; /* next element */ \
+ struct type **le_prev; /* address of previous next element */ \
+}
+
+/*
+ * List access methods
+ */
+#define LIST_FIRST(head) ((head)->lh_first)
+#define LIST_END(head) NULL
+#define LIST_EMPTY(head) (LIST_FIRST(head) == LIST_END(head))
+#define LIST_NEXT(elm, field) ((elm)->field.le_next)
+
+#define LIST_FOREACH(var, head, field) \
+ for((var) = LIST_FIRST(head); \
+ (var)!= LIST_END(head); \
+ (var) = LIST_NEXT(var, field))
+
+/*
+ * List functions.
+ */
+#define LIST_INIT(head) do { \
+ LIST_FIRST(head) = LIST_END(head); \
+} while (0)
+
+#define LIST_INSERT_AFTER(listelm, elm, field) do { \
+ if (((elm)->field.le_next = (listelm)->field.le_next) != NULL) \
+ (listelm)->field.le_next->field.le_prev = \
+ &(elm)->field.le_next; \
+ (listelm)->field.le_next = (elm); \
+ (elm)->field.le_prev = &(listelm)->field.le_next; \
+} while (0)
+
+#define LIST_INSERT_BEFORE(listelm, elm, field) do { \
+ (elm)->field.le_prev = (listelm)->field.le_prev; \
+ (elm)->field.le_next = (listelm); \
+ *(listelm)->field.le_prev = (elm); \
+ (listelm)->field.le_prev = &(elm)->field.le_next; \
+} while (0)
+
+#define LIST_INSERT_HEAD(head, elm, field) do { \
+ if (((elm)->field.le_next = (head)->lh_first) != NULL) \
+ (head)->lh_first->field.le_prev = &(elm)->field.le_next;\
+ (head)->lh_first = (elm); \
+ (elm)->field.le_prev = &(head)->lh_first; \
+} while (0)
+
+#define LIST_REMOVE(elm, field) do { \
+ if ((elm)->field.le_next != NULL) \
+ (elm)->field.le_next->field.le_prev = \
+ (elm)->field.le_prev; \
+ *(elm)->field.le_prev = (elm)->field.le_next; \
+} while (0)
+
+#define LIST_REPLACE(elm, elm2, field) do { \
+ if (((elm2)->field.le_next = (elm)->field.le_next) != NULL) \
+ (elm2)->field.le_next->field.le_prev = \
+ &(elm2)->field.le_next; \
+ (elm2)->field.le_prev = (elm)->field.le_prev; \
+ *(elm2)->field.le_prev = (elm2); \
+} while (0)
+
+/*
+ * Simple queue definitions.
+ */
+#define SIMPLEQ_HEAD(name, type) \
+struct name { \
+ struct type *sqh_first; /* first element */ \
+ struct type **sqh_last; /* addr of last next element */ \
+}
+
+#define SIMPLEQ_HEAD_INITIALIZER(head) \
+ { NULL, &(head).sqh_first }
+
+#define SIMPLEQ_ENTRY(type) \
+struct { \
+ struct type *sqe_next; /* next element */ \
+}
+
+/*
+ * Simple queue access methods.
+ */
+#define SIMPLEQ_FIRST(head) ((head)->sqh_first)
+#define SIMPLEQ_END(head) NULL
+#define SIMPLEQ_EMPTY(head) (SIMPLEQ_FIRST(head) == SIMPLEQ_END(head))
+#define SIMPLEQ_NEXT(elm, field) ((elm)->field.sqe_next)
+
+#define SIMPLEQ_FOREACH(var, head, field) \
+ for((var) = SIMPLEQ_FIRST(head); \
+ (var) != SIMPLEQ_END(head); \
+ (var) = SIMPLEQ_NEXT(var, field))
+
+/*
+ * Simple queue functions.
+ */
+#define SIMPLEQ_INIT(head) do { \
+ (head)->sqh_first = NULL; \
+ (head)->sqh_last = &(head)->sqh_first; \
+} while (0)
+
+#define SIMPLEQ_INSERT_HEAD(head, elm, field) do { \
+ if (((elm)->field.sqe_next = (head)->sqh_first) == NULL) \
+ (head)->sqh_last = &(elm)->field.sqe_next; \
+ (head)->sqh_first = (elm); \
+} while (0)
+
+#define SIMPLEQ_INSERT_TAIL(head, elm, field) do { \
+ (elm)->field.sqe_next = NULL; \
+ *(head)->sqh_last = (elm); \
+ (head)->sqh_last = &(elm)->field.sqe_next; \
+} while (0)
+
+#define SIMPLEQ_INSERT_AFTER(head, listelm, elm, field) do { \
+ if (((elm)->field.sqe_next = (listelm)->field.sqe_next) == NULL)\
+ (head)->sqh_last = &(elm)->field.sqe_next; \
+ (listelm)->field.sqe_next = (elm); \
+} while (0)
+
+#define SIMPLEQ_REMOVE_HEAD(head, elm, field) do { \
+ if (((head)->sqh_first = (elm)->field.sqe_next) == NULL) \
+ (head)->sqh_last = &(head)->sqh_first; \
+} while (0)
+
+/*
+ * Tail queue definitions.
+ */
+#define TAILQ_HEAD(name, type) \
+struct name { \
+ struct type *tqh_first; /* first element */ \
+ struct type **tqh_last; /* addr of last next element */ \
+}
+
+#define TAILQ_HEAD_INITIALIZER(head) \
+ { NULL, &(head).tqh_first }
+
+#define TAILQ_ENTRY(type) \
+struct { \
+ struct type *tqe_next; /* next element */ \
+ struct type **tqe_prev; /* address of previous next element */ \
+}
+
+/*
+ * tail queue access methods
+ */
+#define TAILQ_FIRST(head) ((head)->tqh_first)
+#define TAILQ_END(head) NULL
+#define TAILQ_NEXT(elm, field) ((elm)->field.tqe_next)
+#define TAILQ_LAST(head, headname) \
+ (*(((struct headname *)((head)->tqh_last))->tqh_last))
+/* XXX */
+#define TAILQ_PREV(elm, headname, field) \
+ (*(((struct headname *)((elm)->field.tqe_prev))->tqh_last))
+#define TAILQ_EMPTY(head) \
+ (TAILQ_FIRST(head) == TAILQ_END(head))
+
+#define TAILQ_FOREACH(var, head, field) \
+ for((var) = TAILQ_FIRST(head); \
+ (var) != TAILQ_END(head); \
+ (var) = TAILQ_NEXT(var, field))
+
+#define TAILQ_FOREACH_REVERSE(var, head, field, headname) \
+ for((var) = TAILQ_LAST(head, headname); \
+ (var) != TAILQ_END(head); \
+ (var) = TAILQ_PREV(var, headname, field))
+
+/*
+ * Tail queue functions.
+ */
+#define TAILQ_INIT(head) do { \
+ (head)->tqh_first = NULL; \
+ (head)->tqh_last = &(head)->tqh_first; \
+} while (0)
+
+#define TAILQ_INSERT_HEAD(head, elm, field) do { \
+ if (((elm)->field.tqe_next = (head)->tqh_first) != NULL) \
+ (head)->tqh_first->field.tqe_prev = \
+ &(elm)->field.tqe_next; \
+ else \
+ (head)->tqh_last = &(elm)->field.tqe_next; \
+ (head)->tqh_first = (elm); \
+ (elm)->field.tqe_prev = &(head)->tqh_first; \
+} while (0)
+
+#define TAILQ_INSERT_TAIL(head, elm, field) do { \
+ (elm)->field.tqe_next = NULL; \
+ (elm)->field.tqe_prev = (head)->tqh_last; \
+ *(head)->tqh_last = (elm); \
+ (head)->tqh_last = &(elm)->field.tqe_next; \
+} while (0)
+
+#define TAILQ_INSERT_AFTER(head, listelm, elm, field) do { \
+ if (((elm)->field.tqe_next = (listelm)->field.tqe_next) != NULL)\
+ (elm)->field.tqe_next->field.tqe_prev = \
+ &(elm)->field.tqe_next; \
+ else \
+ (head)->tqh_last = &(elm)->field.tqe_next; \
+ (listelm)->field.tqe_next = (elm); \
+ (elm)->field.tqe_prev = &(listelm)->field.tqe_next; \
+} while (0)
+
+#define TAILQ_INSERT_BEFORE(listelm, elm, field) do { \
+ (elm)->field.tqe_prev = (listelm)->field.tqe_prev; \
+ (elm)->field.tqe_next = (listelm); \
+ *(listelm)->field.tqe_prev = (elm); \
+ (listelm)->field.tqe_prev = &(elm)->field.tqe_next; \
+} while (0)
+
+#define TAILQ_REMOVE(head, elm, field) do { \
+ if (((elm)->field.tqe_next) != NULL) \
+ (elm)->field.tqe_next->field.tqe_prev = \
+ (elm)->field.tqe_prev; \
+ else \
+ (head)->tqh_last = (elm)->field.tqe_prev; \
+ *(elm)->field.tqe_prev = (elm)->field.tqe_next; \
+} while (0)
+
+#define TAILQ_REPLACE(head, elm, elm2, field) do { \
+ if (((elm2)->field.tqe_next = (elm)->field.tqe_next) != NULL) \
+ (elm2)->field.tqe_next->field.tqe_prev = \
+ &(elm2)->field.tqe_next; \
+ else \
+ (head)->tqh_last = &(elm2)->field.tqe_next; \
+ (elm2)->field.tqe_prev = (elm)->field.tqe_prev; \
+ *(elm2)->field.tqe_prev = (elm2); \
+} while (0)
+
+/*
+ * Circular queue definitions.
+ */
+#define CIRCLEQ_HEAD(name, type) \
+struct name { \
+ struct type *cqh_first; /* first element */ \
+ struct type *cqh_last; /* last element */ \
+}
+
+#define CIRCLEQ_HEAD_INITIALIZER(head) \
+ { CIRCLEQ_END(&head), CIRCLEQ_END(&head) }
+
+#define CIRCLEQ_ENTRY(type) \
+struct { \
+ struct type *cqe_next; /* next element */ \
+ struct type *cqe_prev; /* previous element */ \
+}
+
+/*
+ * Circular queue access methods
+ */
+#define CIRCLEQ_FIRST(head) ((head)->cqh_first)
+#define CIRCLEQ_LAST(head) ((head)->cqh_last)
+#define CIRCLEQ_END(head) ((void *)(head))
+#define CIRCLEQ_NEXT(elm, field) ((elm)->field.cqe_next)
+#define CIRCLEQ_PREV(elm, field) ((elm)->field.cqe_prev)
+#define CIRCLEQ_EMPTY(head) \
+ (CIRCLEQ_FIRST(head) == CIRCLEQ_END(head))
+
+#define CIRCLEQ_FOREACH(var, head, field) \
+ for((var) = CIRCLEQ_FIRST(head); \
+ (var) != CIRCLEQ_END(head); \
+ (var) = CIRCLEQ_NEXT(var, field))
+
+#define CIRCLEQ_FOREACH_REVERSE(var, head, field) \
+ for((var) = CIRCLEQ_LAST(head); \
+ (var) != CIRCLEQ_END(head); \
+ (var) = CIRCLEQ_PREV(var, field))
+
+/*
+ * Circular queue functions.
+ */
+#define CIRCLEQ_INIT(head) do { \
+ (head)->cqh_first = CIRCLEQ_END(head); \
+ (head)->cqh_last = CIRCLEQ_END(head); \
+} while (0)
+
+#define CIRCLEQ_INSERT_AFTER(head, listelm, elm, field) do { \
+ (elm)->field.cqe_next = (listelm)->field.cqe_next; \
+ (elm)->field.cqe_prev = (listelm); \
+ if ((listelm)->field.cqe_next == CIRCLEQ_END(head)) \
+ (head)->cqh_last = (elm); \
+ else \
+ (listelm)->field.cqe_next->field.cqe_prev = (elm); \
+ (listelm)->field.cqe_next = (elm); \
+} while (0)
+
+#define CIRCLEQ_INSERT_BEFORE(head, listelm, elm, field) do { \
+ (elm)->field.cqe_next = (listelm); \
+ (elm)->field.cqe_prev = (listelm)->field.cqe_prev; \
+ if ((listelm)->field.cqe_prev == CIRCLEQ_END(head)) \
+ (head)->cqh_first = (elm); \
+ else \
+ (listelm)->field.cqe_prev->field.cqe_next = (elm); \
+ (listelm)->field.cqe_prev = (elm); \
+} while (0)
+
+#define CIRCLEQ_INSERT_HEAD(head, elm, field) do { \
+ (elm)->field.cqe_next = (head)->cqh_first; \
+ (elm)->field.cqe_prev = CIRCLEQ_END(head); \
+ if ((head)->cqh_last == CIRCLEQ_END(head)) \
+ (head)->cqh_last = (elm); \
+ else \
+ (head)->cqh_first->field.cqe_prev = (elm); \
+ (head)->cqh_first = (elm); \
+} while (0)
+
+#define CIRCLEQ_INSERT_TAIL(head, elm, field) do { \
+ (elm)->field.cqe_next = CIRCLEQ_END(head); \
+ (elm)->field.cqe_prev = (head)->cqh_last; \
+ if ((head)->cqh_first == CIRCLEQ_END(head)) \
+ (head)->cqh_first = (elm); \
+ else \
+ (head)->cqh_last->field.cqe_next = (elm); \
+ (head)->cqh_last = (elm); \
+} while (0)
+
+#define CIRCLEQ_REMOVE(head, elm, field) do { \
+ if ((elm)->field.cqe_next == CIRCLEQ_END(head)) \
+ (head)->cqh_last = (elm)->field.cqe_prev; \
+ else \
+ (elm)->field.cqe_next->field.cqe_prev = \
+ (elm)->field.cqe_prev; \
+ if ((elm)->field.cqe_prev == CIRCLEQ_END(head)) \
+ (head)->cqh_first = (elm)->field.cqe_next; \
+ else \
+ (elm)->field.cqe_prev->field.cqe_next = \
+ (elm)->field.cqe_next; \
+} while (0)
+
+#define CIRCLEQ_REPLACE(head, elm, elm2, field) do { \
+ if (((elm2)->field.cqe_next = (elm)->field.cqe_next) == \
+ CIRCLEQ_END(head)) \
+ (head).cqh_last = (elm2); \
+ else \
+ (elm2)->field.cqe_next->field.cqe_prev = (elm2); \
+ if (((elm2)->field.cqe_prev = (elm)->field.cqe_prev) == \
+ CIRCLEQ_END(head)) \
+ (head).cqh_first = (elm2); \
+ else \
+ (elm2)->field.cqe_prev->field.cqe_next = (elm2); \
+} while (0)
+
+#endif /* !_SYS_QUEUE_H_ */
diff -up nfs-utils-1.2.3/utils/spnfsd/spnfsd.conf.orig nfs-utils-1.2.3/utils/spnfsd/spnfsd.conf
--- nfs-utils-1.2.3/utils/spnfsd/spnfsd.conf.orig 2010-10-04 15:48:00.083419957 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/spnfsd.conf 2010-10-04 15:48:00.083419957 -0400
@@ -0,0 +1,21 @@
+[General]
+
+Verbosity = 1
+Stripe-size = 8192
+Dense-striping = 0
+Pipefs-Directory = /var/lib/nfs/rpc_pipefs
+DS-Mount-Directory = /spnfs
+
+[DataServers]
+
+NumDS = 2
+
+DS1_IP = 172.16.28.134
+DS1_PORT = 2049
+DS1_ROOT = /pnfs
+DS1_ID = 1
+
+DS2_IP = 172.16.28.141
+DS2_PORT = 2049
+DS2_ROOT = /pnfs
+DS2_ID = 2
diff -up nfs-utils-1.2.3/utils/spnfsd/spnfsd.c.orig nfs-utils-1.2.3/utils/spnfsd/spnfsd.c
--- nfs-utils-1.2.3/utils/spnfsd/spnfsd.c.orig 2010-10-04 15:48:00.083419957 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/spnfsd.c 2010-10-04 15:48:00.083419957 -0400
@@ -0,0 +1,578 @@
+/*
+ * spnfsd.c
+ * Userland daemon for spNFS.
+ * Based heavily on idmapd.c
+ *
+ */
+/*
+ * idmapd.c
+ *
+ * Userland daemon for idmap.
+ *
+ * Copyright (c) 2002 The Regents of the University of Michigan.
+ * All rights reserved.
+ *
+ * Marius Aamodt Eriksen <marius@umich.edu>
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ *
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ * 3. Neither the name of the University nor the names of its
+ * contributors may be used to endorse or promote products derived
+ * from this software without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
+ * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+ * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+ * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+ * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+ * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
+ * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
+ * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+ * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#define _LARGEFILE64_SOURCE
+#define _FILE_OFFSET_BITS 64
+#include <sys/types.h>
+#include <sys/time.h>
+#include <sys/poll.h>
+#include <sys/socket.h>
+#include <sys/stat.h>
+#include <time.h>
+
+#include <err.h>
+#include <errno.h>
+#include <event.h>
+#include <fcntl.h>
+#include <dirent.h>
+#include <unistd.h>
+#include <netdb.h>
+#include <signal.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <stdarg.h>
+#include <syslog.h>
+#include <pwd.h>
+#include <grp.h>
+#include <limits.h>
+#include <ctype.h>
+
+#ifdef HAVE_CONFIG_H
+#include "config.h"
+#endif /* HAVE_CONFIG_H */
+
+#include "cfg.h"
+#include "queue.h"
+#include "nfslib.h"
+
+#include "nfsd4_spnfs.h"
+#include "spnfsd.h"
+
+#ifndef PIPEFS_DIR
+#define PIPEFS_DIR "/var/lib/nfs/rpc_pipefs/"
+#endif
+
+#ifndef DSMOUNT_DIR
+#define DSMOUNT_DIR "/spnfs"
+#endif
+
+/* From Niels */
+#define CONF_SAVE(w, f) do { \
+ char *p = f; \
+ if (p != NULL) \
+ (w) = p; \
+} while (0)
+
+struct spnfs_client {
+ int sc_fd;
+ char sc_path[PATH_MAX]; /* DM: full path to spnfs pipe */
+ struct event sc_event;
+};
+
+static void spnfscb(int, short, void *);
+static int do_mounts(void);
+
+static void spnfs_msg_handler(struct spnfs_client *, struct spnfs_msg *);
+static void send_invalid_msg(int);
+
+size_t strlcat(char *, const char *, size_t);
+size_t strlcpy(char *, const char *, size_t);
+ssize_t atomicio(ssize_t (*)(), int, void *, size_t);
+void mydaemon(int, int);
+void release_parent();
+static int read_config();
+static void dump_config();
+
+int verbose = 0;
+int stripesize = DEFAULT_STRIPE_SIZE;
+int densestriping = 0;
+int num_dev = 1; /* XXX no multiple device support yet */
+int num_ds;
+struct dserver dataservers[SPNFS_MAX_DATA_SERVERS];
+char dsmountdir[PATH_MAX];
+struct spnfs_config spnfs_config;
+
+static int cache_entry_expiration = 0;
+static char pipefsdir[PATH_MAX];
+static char pipefspath[PATH_MAX];
+
+/* SPNFS */
+struct spnfs_client sc;
+
+/* Used by cfg.c */
+char *conf_path;
+
+static void
+msg_format(char *rtnbuff, int rtnbuffsize, int errval,
+ const char *fmt, va_list args)
+{
+ char buff[1024];
+ int n;
+
+ vsnprintf(buff, sizeof(buff), fmt, args);
+
+ if ((n = strlen(buff)) > 0 && buff[n-1] == '\n')
+ buff[--n] = '\0';
+
+ snprintf(rtnbuff, rtnbuffsize, "%s: %s", buff, strerror(errval));
+}
+
+void
+spnfsd_warn(const char *fmt, ...)
+{
+ int errval = errno; /* save this! */
+ char buff[1024];
+ va_list args;
+
+ va_start(args, fmt);
+ msg_format(buff, sizeof(buff), errval, fmt, args);
+ va_end(args);
+
+ syslog(LOG_WARNING, "%s", buff);
+}
+
+void
+spnfsd_warnx(const char *fmt, ...)
+{
+ va_list args;
+
+ va_start(args, fmt);
+ vsyslog(LOG_WARNING, fmt, args);
+ va_end(args);
+}
+
+void
+spnfsd_err(int eval, const char *fmt, ...)
+{
+ int errval = errno; /* save this! */
+ char buff[1024];
+ va_list args;
+
+ va_start(args, fmt);
+ msg_format(buff, sizeof(buff), errval, fmt, args);
+ va_end(args);
+
+ syslog(LOG_ERR, "%s", buff);
+ exit(eval);
+}
+
+void
+spnfsd_errx(int eval, const char *fmt, ...)
+{
+ va_list args;
+
+ va_start(args, fmt);
+ vsyslog(LOG_ERR, fmt, args);
+ va_end(args);
+ exit(eval);
+}
+
+int
+main(int argc, char **argv)
+{
+ int opt, fg = 0;
+ char *progname;
+ struct stat sb;
+ int rc, fd, cmd = 1;
+ int i;
+
+ fd = open("/proc/fs/spnfs/ctl", O_WRONLY);
+ if (fd < 0)
+ spnfsd_errx(1, "kernel init failed (%s)", strerror(errno));
+ rc = write(fd, &cmd, sizeof(int));
+ if (rc < 0 && errno != EEXIST)
+ spnfsd_errx(1, "kernel init failed (%s)", strerror(errno));
+ close(fd);
+
+ conf_path = _PATH_SPNFSDCONF;
+ strlcpy(pipefsdir, PIPEFS_DIR, sizeof(pipefsdir));
+ strlcpy(dsmountdir, DSMOUNT_DIR, sizeof(dsmountdir));
+ strlcpy(sc.sc_path, PIPEFS_DIR, sizeof(sc.sc_path));
+
+ if ((progname = strrchr(argv[0], '/')))
+ progname++;
+ else
+ progname = argv[0];
+
+ openlog(progname, LOG_PID, LOG_DAEMON);
+
+#define GETOPTSTR "vfd:p:U:G:c:CS"
+ opterr=0; /* Turn off error messages */
+ while ((opt = getopt(argc, argv, GETOPTSTR)) != -1) {
+ if (opt == 'c')
+ conf_path = optarg;
+ if (opt == '?') {
+ if (strchr(GETOPTSTR, optopt))
+ errx(1, "'-%c' option requires an argument.", optopt);
+ else
+ errx(1, "'-%c' is an invalid argument.", optopt);
+ }
+ }
+ optind = 1;
+
+ if (stat(conf_path, &sb) == -1 &&(errno == ENOENT || errno == EACCES)) {
+ warn("Skipping configuration file \"%s\"", conf_path);
+ conf_path = NULL;
+ } else {
+ conf_init();
+ if (read_config() != 0)
+ spnfsd_err(1, "Invalid config file\n");
+ if (verbose)
+ dump_config();
+ }
+
+ while ((opt = getopt(argc, argv, GETOPTSTR)) != -1)
+ switch (opt) {
+ case 'v':
+ verbose++;
+ break;
+ case 'f':
+ fg = 1;
+ break;
+ case 'p':
+ strlcpy(pipefsdir, optarg, sizeof(pipefsdir));
+ strlcpy(sc.sc_path, optarg, sizeof(sc.sc_path));
+ break;
+ default:
+ break;
+ }
+
+ strncat(pipefsdir, "/nfs", sizeof(pipefsdir));
+ strncat(sc.sc_path, "/nfs/spnfs", sizeof(sc.sc_path));
+ memcpy(pipefspath, sc.sc_path, sizeof(pipefspath));
+
+ spnfs_config.stripe_size = stripesize;
+ spnfs_config.dense_striping = densestriping;
+ spnfs_config.num_ds = num_ds;
+
+ for (i = 0; i < num_ds; i++)
+ sprintf(spnfs_config.ds_dir[i], "%s/%s",
+ dsmountdir, dataservers[i].ds_ip);
+
+ fd = open("/proc/fs/spnfs/config", O_WRONLY);
+ if (fd < 0)
+ spnfsd_errx(1, "error creating config (%s)", strerror(errno));
+ rc = write(fd, &spnfs_config, sizeof(struct spnfs_config));
+ if (rc < 0 && errno != EEXIST)
+ spnfsd_errx(1, "error writing config (%s)", strerror(errno));
+ close(fd);
+
+ signal(SIGHUP, send_invalid_msg);
+
+ if (do_mounts() != 0)
+ spnfsd_err(1, "Mounting DSs failed\n");
+
+
+/* DMXXX in case I forget -f while testing... */
+fg = 1;
+ if (!fg)
+ mydaemon(0, 0);
+
+ event_init();
+
+ if (verbose > 0)
+ spnfsd_warnx("Expiration time is %d seconds.",
+ cache_entry_expiration);
+
+ if ((sc.sc_fd = open(sc.sc_path, O_RDWR, 0)) == -1) {
+ perror("spnfsd open file");
+ } else {
+ event_set(&sc.sc_event, sc.sc_fd, EV_READ, spnfscb, &sc);
+ event_add(&sc.sc_event, NULL);
+ }
+
+ release_parent();
+
+ if (event_dispatch() < 0)
+ spnfsd_errx(1, "main: event_dispatch returns errno %d (%s)",
+ errno, strerror(errno));
+ /* NOTREACHED */
+ return 1;
+}
+
+static void
+spnfs_msg_handler(struct spnfs_client *scp, struct spnfs_msg *im)
+{
+ int err;
+
+ switch (im->im_type) {
+ case SPNFS_TYPE_LAYOUTGET:
+ err = spnfsd_layoutget(im);
+ break;
+ case SPNFS_TYPE_LAYOUTCOMMIT:
+ err = spnfsd_layoutcommit(im);
+ break;
+ case SPNFS_TYPE_LAYOUTRETURN:
+ err = spnfsd_layoutreturn(im);
+ break;
+ case SPNFS_TYPE_GETDEVICEITER:
+ err = spnfsd_getdeviceiter(im);
+ break;
+ case SPNFS_TYPE_GETDEVICEINFO:
+ err = spnfsd_getdeviceinfo(im);
+ break;
+ case SPNFS_TYPE_SETATTR:
+ err = spnfsd_setattr(im);
+ break;
+ case SPNFS_TYPE_OPEN:
+ err = spnfsd_open(im);
+ break;
+ case SPNFS_TYPE_CLOSE:
+ err = spnfsd_close(im);
+ break;
+ case SPNFS_TYPE_CREATE:
+ err = spnfsd_create(im);
+ break;
+ case SPNFS_TYPE_REMOVE:
+ err = spnfsd_remove(im);
+ break;
+ case SPNFS_TYPE_COMMIT:
+ err = spnfsd_commit(im);
+ break;
+ case SPNFS_TYPE_READ:
+ err = spnfsd_read(im);
+ break;
+ case SPNFS_TYPE_WRITE:
+ err = spnfsd_write(im);
+ break;
+ default:
+ spnfsd_warnx("spnfs_msg_handler: Invalid msg type (%d) in message",
+ im->im_type);
+ im->im_status |= SPNFS_STATUS_INVALIDMSG;
+ err = -EINVAL;
+ break;
+ }
+}
+
+static void
+spnfscb(int fd, short which, void *data)
+{
+ struct spnfs_client *scp = data;
+ struct spnfs_msg im;
+ int rval;
+
+ if (which != EV_READ)
+ goto out;
+
+ if (atomicio(read, scp->sc_fd, &im, sizeof(im)) != sizeof(im)) {
+ if (verbose > 0)
+ spnfsd_warn("spnfscb: read(%s)", scp->sc_path);
+ if (errno == EPIPE)
+ return;
+ goto out;
+ }
+
+ spnfs_msg_handler(scp, &im);
+
+ /* XXX: I don't like ignoring this error in the id->name case,
+ * but we've never returned it, and I need to check that the client
+ * can handle it gracefully before starting to return it now. */
+
+ if (im.im_status == SPNFS_STATUS_FAIL)
+ im.im_status = SPNFS_STATUS_SUCCESS;
+
+ if ((rval=atomicio(write, scp->sc_fd, &im, sizeof(im))) != sizeof(im)) {
+ spnfsd_warn("spnfscb: write(%s)", scp->sc_path);
+ }
+
+out:
+ event_add(&scp->sc_event, NULL);
+}
+
+/*
+ * mydaemon creates a pipe between the partent and child
+ * process. The parent process will wait until the
+ * child dies or writes a '1' on the pipe signaling
+ * that it started successfully.
+ */
+int pipefds[2] = { -1, -1};
+
+void
+mydaemon(int nochdir, int noclose)
+{
+ int pid, status, tempfd;
+
+ if (pipe(pipefds) < 0)
+ err(1, "mydaemon: pipe() failed: errno %d", errno);
+
+ if ((pid = fork ()) < 0)
+ err(1, "mydaemon: fork() failed: errno %d", errno);
+
+ if (pid != 0) {
+ /*
+ * Parent. Wait for status from child.
+ */
+ close(pipefds[1]);
+ if (read(pipefds[0], &status, 1) != 1)
+ exit(1);
+ exit (0);
+ }
+ /* Child. */
+ close(pipefds[0]);
+ setsid ();
+ if (nochdir == 0) {
+ if (chdir ("/") == -1)
+ err(1, "mydaemon: chdir() failed: errno %d", errno);
+ }
+
+ while (pipefds[1] <= 2) {
+ pipefds[1] = dup(pipefds[1]);
+ if (pipefds[1] < 0)
+ err(1, "mydaemon: dup() failed: errno %d", errno);
+ }
+
+ if (noclose == 0) {
+ tempfd = open("/dev/null", O_RDWR);
+ if (tempfd < 0)
+ tempfd = open("/", O_RDONLY);
+ if (tempfd >= 0) {
+ dup2(tempfd, 0);
+ dup2(tempfd, 1);
+ dup2(tempfd, 2);
+ closeall(3);
+ } else
+ closeall(0);
+ }
+
+ return;
+}
+
+void
+release_parent()
+{
+ int status;
+
+ if (pipefds[1] > 0) {
+ write(pipefds[1], &status, 1);
+ close(pipefds[1]);
+ pipefds[1] = -1;
+ }
+}
+
+static int
+read_config()
+{
+ char *xpipefsdir = NULL;
+ char *xdsmountdir = NULL;
+ int ds;
+ char ipstr[20], portstr[20], rootstr[20], dsidstr[20];
+
+ verbose = conf_get_num("General", "Verbosity", 0);
+ stripesize = conf_get_num("General", "Stripe-size",DEFAULT_STRIPE_SIZE);
+ densestriping = conf_get_num("General", "Dense-striping", 0);
+ CONF_SAVE(xpipefsdir, conf_get_str("General", "Pipefs-Directory"));
+ if (xpipefsdir != NULL)
+ strlcpy(pipefsdir, xpipefsdir, sizeof(pipefsdir));
+ CONF_SAVE(xdsmountdir, conf_get_str("General", "DS-Mount-Directory"));
+ if (xdsmountdir != NULL)
+ strlcpy(dsmountdir, xdsmountdir, sizeof(dsmountdir));
+ num_ds = conf_get_num("DataServers", "NumDS", 0);
+ if (num_ds < 1 || num_ds > SPNFS_MAX_DATA_SERVERS)
+ spnfsd_err(1, "Invalid number of data servers in config: %d\n",
+ num_ds);
+ for (ds = 1; ds <= num_ds ; ds++) {
+ sprintf(ipstr, "DS%d_IP", ds);
+ sprintf(portstr, "DS%d_PORT", ds);
+ sprintf(rootstr, "DS%d_ROOT", ds);
+ sprintf(dsidstr, "DS%d_ID", ds);
+ CONF_SAVE(dataservers[ds-1].ds_ip,
+ conf_get_str("DataServers", ipstr));
+ if (dataservers[ds-1].ds_ip == NULL)
+ spnfsd_err(1, "Missing IP for DS%d\n", ds);
+ dataservers[ds-1].ds_port =
+ conf_get_num("DataServers", portstr, DEFAULT_DS_PORT);
+ CONF_SAVE(dataservers[ds-1].ds_path,
+ conf_get_str("DataServers", rootstr));
+ if (dataservers[ds-1].ds_ip == NULL)
+ spnfsd_err(1, "Missing IP for DS%d\n", ds);
+ dataservers[ds-1].ds_id =
+ conf_get_num("DataServers", dsidstr, -1);
+ if (dataservers[ds-1].ds_id < 0)
+ spnfsd_err(1, "Missing or invalid ID for DS%d\n", ds);
+ }
+
+ return 0;
+}
+
+static void
+dump_config()
+{
+ int ds;
+
+ printf("Verbosity: %d\n", verbose);
+ printf("Stripe size: %d\n", stripesize);
+ printf("Dense striping: %d\n", densestriping);
+ printf("Number of data servers: %d\n", num_ds);
+
+ for (ds = 0 ; ds < num_ds ; ds++) {
+ printf("DS%d IP: %s\n", ds+1, dataservers[ds].ds_ip);
+ printf("DS%d PORT: %d\n", ds+1, dataservers[ds].ds_port);
+ printf("DS%d ROOT: %s\n", ds+1, dataservers[ds].ds_path);
+ printf("DS%d DSID: %d\n", ds+1, dataservers[ds].ds_id);
+ }
+}
+
+static int
+do_mounts()
+{
+ int ds;
+ char cmd[1024];
+
+ return 0;
+ for (ds = 0 ; ds < num_ds ; ds++) {
+ sprintf(cmd, "mkdir -p %s/%s", dsmountdir,
+ dataservers[ds].ds_ip);
+ system(cmd);
+ sprintf(cmd, "mount -t nfs4 %s:%s %s/%s",
+ dataservers[ds].ds_ip, dataservers[ds].ds_path,
+ dsmountdir, dataservers[ds].ds_ip);
+ system(cmd);
+ }
+}
+
+static void
+send_invalid_msg(int signum)
+{
+ struct spnfs_msg im;
+ int fd, rval;
+
+ im.im_status = SPNFS_STATUS_FAIL;
+
+ if ((fd = open(pipefspath, O_RDWR, 0)) == -1) {
+ perror("spnfsd open pipe");
+ } else {
+ if ((rval=atomicio(write, fd, &im, sizeof(im))) != sizeof(im)) {
+ spnfsd_warn("send_invalid_msg: write(%s)", pipefspath);
+ }
+ }
+}
diff -up nfs-utils-1.2.3/utils/spnfsd/spnfsd.h.orig nfs-utils-1.2.3/utils/spnfsd/spnfsd.h
--- nfs-utils-1.2.3/utils/spnfsd/spnfsd.h.orig 2010-10-04 15:48:00.084495938 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/spnfsd.h 2010-10-04 15:48:00.084495938 -0400
@@ -0,0 +1,70 @@
+/*
+ * spnfsd.h
+ *
+ * spNFS - simple pNFS implementation with userspace daemon
+ *
+ */
+/******************************************************************************
+
+(c) 2007 Network Appliance, Inc. All Rights Reserved.
+
+Network Appliance provides this source code under the GPL v2 License.
+The GPL v2 license is available at
+http://opensource.org/licenses/gpl-license.php.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
+CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
+EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
+PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
+LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
+NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+******************************************************************************/
+
+#ifndef _PATH_SPNFSDCONF
+#define _PATH_SPNFSDCONF "/etc/spnfsd.conf"
+#endif
+
+#ifndef DEFAULT_STRIPE_SIZE
+#define DEFAULT_STRIPE_SIZE 4096
+#endif
+
+#ifndef DEFAULT_DS_PORT
+#define DEFAULT_DS_PORT 2049
+#endif
+
+struct dserver {
+ char *ds_ip;
+ int ds_port;
+ char *ds_path;
+ int ds_id;
+};
+
+/* DMXXX future struct for whole config */
+struct spnfsd_config {
+ int verbose;
+ int stripesize;
+ int densestriping;
+ int num_ds;
+ struct dserver dataservers[SPNFS_MAX_DATA_SERVERS];
+};
+
+int spnfsd_layoutget(struct spnfs_msg *);
+int spnfsd_layoutcommit(struct spnfs_msg *);
+int spnfsd_layoutreturn(struct spnfs_msg *);
+int spnfsd_getdeviceiter(struct spnfs_msg *);
+int spnfsd_getdeviceinfo(struct spnfs_msg *);
+int spnfsd_setattr(struct spnfs_msg *);
+int spnfsd_open(struct spnfs_msg *);
+int spnfsd_close(struct spnfs_msg *);
+int spnfsd_create(struct spnfs_msg *);
+int spnfsd_remove(struct spnfs_msg *);
+int spnfsd_commit(struct spnfs_msg *);
+int spnfsd_read(struct spnfs_msg *);
+int spnfsd_write(struct spnfs_msg *);
+int spnfsd_getfh(char *, unsigned char *, unsigned int *);
diff -up nfs-utils-1.2.3/utils/spnfsd/spnfsd_ops.c.orig nfs-utils-1.2.3/utils/spnfsd/spnfsd_ops.c
--- nfs-utils-1.2.3/utils/spnfsd/spnfsd_ops.c.orig 2010-10-04 15:48:00.084495938 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/spnfsd_ops.c 2010-10-04 15:48:00.085512992 -0400
@@ -0,0 +1,439 @@
+/******************************************************************************
+
+(c) 2007 Network Appliance, Inc. All Rights Reserved.
+
+Network Appliance provides this source code under the GPL v2 License.
+The GPL v2 license is available at
+http://opensource.org/licenses/gpl-license.php.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
+CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
+EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
+PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
+LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
+NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+******************************************************************************/
+
+#define _LARGEFILE64_SOURCE
+#define _FILE_OFFSET_BITS 64
+#include "nfsd4_spnfs.h"
+#include "spnfsd.h"
+#include "nfs/nfs.h"
+#include <string.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <sys/types.h>
+#include <sys/stat.h>
+#include <fcntl.h>
+#include <unistd.h>
+#include <errno.h>
+
+
+extern int stripesize;
+extern int densestriping;
+extern int num_ds;
+extern int num_dev;
+extern char dsmountdir[];
+extern struct dserver dataservers[SPNFS_MAX_DATA_SERVERS];
+size_t strlcat(char *, const char *, size_t);
+size_t strlcpy(char *, const char *, size_t);
+
+int
+spnfsd_layoutget(struct spnfs_msg *im)
+{
+ int ds;
+ int rc;
+ char fullpath[1024]; /* MSXXX */
+
+ im->im_status = SPNFS_STATUS_SUCCESS;
+ im->im_res.layoutget_res.status = 0;
+ im->im_res.layoutget_res.devid = 1; /* XXX */
+ im->im_res.layoutget_res.stripe_size = stripesize;
+ if (densestriping)
+ im->im_res.layoutget_res.stripe_type = 1; /* DMXXX enum */
+ else
+ im->im_res.layoutget_res.stripe_type = 0; /* DMXXX ^^^^ */
+ im->im_res.layoutget_res.stripe_count = num_ds;
+
+ for (ds = 0 ; ds < num_ds ; ds++) {
+ memset(im->im_res.layoutget_res.flist[ds].fh_val, 0, 128); /*DMXXX*/
+ sprintf(fullpath, "%s/%s/%lu.%lu",
+ dsmountdir, dataservers[ds].ds_ip,
+ im->im_args.layoutget_args.inode,
+ im->im_args.layoutget_args.generation);
+ rc = spnfsd_getfh(fullpath,
+ im->im_res.layoutget_res.flist[ds].fh_val,
+ &im->im_res.layoutget_res.flist[ds].fh_len);
+ if (rc < 0) {
+ /* MSXXX needs error msg/handling */
+ im->im_res.layoutget_res.status = ENOENT;
+ return -1;
+ }
+
+ /*
+ * MSXXX another hack...fix the hardcoding.
+ * The fh's fsid_type is incremented by 8 to get
+ * around stateid checking.
+ */
+ im->im_res.layoutget_res.flist[ds].fh_val[2] += 8;
+ }
+
+ return 0;
+}
+
+int
+spnfsd_layoutcommit(struct spnfs_msg *im)
+{
+ char basename[1024]; /* DMXXX */
+ char fullpath[1024]; /* DMXXX */
+ int ds;
+
+ im->im_status = SPNFS_STATUS_SUCCESS;
+ im->im_res.layoutcommit_res.status = 0;
+ sprintf(basename, "%lu.%lu", im->im_args.layoutcommit_args.inode,
+ im->im_args.layoutcommit_args.generation);
+
+ for (ds = 0 ; ds < num_ds ; ds++) {
+ sprintf(fullpath, "%s/%s/%s", dsmountdir,
+ dataservers[ds].ds_ip, basename);
+ truncate(fullpath, im->im_args.layoutcommit_args.file_size);
+ }
+
+ return 0;
+}
+
+int
+spnfsd_layoutreturn(struct spnfs_msg *im)
+{
+ return 0;
+}
+
+int
+spnfsd_getdeviceiter(struct spnfs_msg *im)
+{
+ im->im_status = SPNFS_STATUS_SUCCESS;
+ im->im_res.getdeviceiter_res.status = 0;
+
+ /* verifier ignored for now */
+ if (im->im_args.getdeviceiter_args.cookie >= num_dev)
+ im->im_res.getdeviceiter_res.eof = 1;
+ else {
+ /* XXX just hardcoded for now...fix this */
+ im->im_res.getdeviceiter_res.devid = 1;
+ im->im_res.getdeviceiter_res.cookie = im->im_args.getdeviceiter_args.cookie + 1;
+ im->im_res.getdeviceiter_res.verf = 0;
+ im->im_res.getdeviceiter_res.eof = 0;
+ }
+
+ return 0;
+}
+
+int
+spnfsd_getdeviceinfo(struct spnfs_msg *im)
+{
+ struct spnfs_device *devp;
+ struct spnfs_data_server *dsp;
+ u_int32_t devid;
+ int ds;
+
+ im->im_status = SPNFS_STATUS_SUCCESS;
+ im->im_res.getdeviceinfo_res.status = 0;
+
+ devid = im->im_args.getdeviceinfo_args.devid;
+
+ /* XXX fix this if/when we support multiple devices */
+ if (devid != 1) {
+ im->im_res.getdeviceinfo_res.status = -ENOENT;
+ return -1;
+ }
+
+ devp = &im->im_res.getdeviceinfo_res.devinfo;
+ devp->dscount = num_ds;
+
+ for (ds = 0 ; ds < num_ds ; ds++) {
+ dsp = &devp->dslist[ds];
+ dsp->dsid = dataservers[ds].ds_id;
+ memset(dsp->netid, 0, 5);
+ strlcpy(dsp->netid, "tcp", 4);
+ sprintf(dsp->addr, "%s.%d.%d",
+ dataservers[ds].ds_ip,
+ dataservers[ds].ds_port >> 8,
+ dataservers[ds].ds_port & 0xff);
+ }
+
+ return 0;
+}
+
+int
+spnfsd_setattr(struct spnfs_msg *im)
+{
+ char basename[1024]; /* DMXXX */
+ char fullpath[1024]; /* DMXXX */
+ int ds;
+
+ im->im_status = SPNFS_STATUS_SUCCESS;
+ im->im_res.setattr_res.status = 0;
+ sprintf(basename, "%lu.%lu", im->im_args.setattr_args.inode,
+ im->im_args.setattr_args.generation);
+
+ for (ds = 0 ; ds < num_ds ; ds++) {
+ sprintf(fullpath, "%s/%s/%s", dsmountdir,
+ dataservers[ds].ds_ip, basename);
+ truncate(fullpath, im->im_args.setattr_args.file_size);
+ }
+
+ return 0;
+}
+
+int
+spnfsd_open(struct spnfs_msg *im)
+{
+ char basename[1024]; /* DMXXX */
+ char fullpath[1024]; /* DMXXX */
+ char dirpath[1024]; /* DMXXX */
+ int ds;
+ int fd, status;
+ struct stat buf;
+
+ im->im_status = SPNFS_STATUS_SUCCESS;
+ im->im_res.open_res.status = 0;
+ sprintf(basename, "%lu.%lu", im->im_args.open_args.inode,
+ im->im_args.open_args.generation);
+
+ for (ds = 0 ; ds < num_ds ; ds++) {
+ sprintf(dirpath, "%s/%s", dsmountdir,
+ dataservers[ds].ds_ip);
+ sprintf(fullpath, "%s/%s", dirpath, basename);
+ status = stat(dirpath, &buf);
+ im->im_res.open_res.status = errno;
+ if (status != 0) {
+ perror(dirpath);
+ break;
+ }
+ if ((fd = open(fullpath, O_WRONLY|O_CREAT, 0777)) < 0) {
+ perror(fullpath);
+ im->im_res.open_res.status = errno;
+ break;
+ } else {
+ if (fchmod(fd, 0777) != 0) {
+ /* DM: we'll consider this non-fatal for now */
+ perror("chmod stripe");
+ }
+ im->im_res.open_res.status = 0;
+ close(fd);
+ }
+ }
+
+ return im->im_res.open_res.status;
+}
+
+int
+spnfsd_close(struct spnfs_msg *im)
+{
+ im->im_status = SPNFS_STATUS_SUCCESS;
+ printf("spnfsd_close received: %d\n", im->im_args.close_args.x);
+ im->im_res.close_res.y = 7331;
+ return 0;
+}
+
+int
+spnfsd_create(struct spnfs_msg *im)
+{
+ return 0;
+}
+
+int
+spnfsd_remove(struct spnfs_msg *im)
+{
+ char basename[1024]; /* DMXXX */
+ char fullpath[1024]; /* DMXXX */
+ int ds;
+
+ im->im_status = SPNFS_STATUS_SUCCESS;
+ im->im_res.remove_res.status = 0;
+ sprintf(basename, "%lu.%lu", im->im_args.remove_args.inode,
+ im->im_args.remove_args.generation);
+
+ for (ds = 0 ; ds < num_ds ; ds++) {
+ sprintf(fullpath, "%s/%s/%s", dsmountdir,
+ dataservers[ds].ds_ip, basename);
+ unlink(fullpath);
+ }
+
+ return 0;
+}
+
+int
+spnfsd_commit(struct spnfs_msg *im)
+{
+ im->im_status = SPNFS_STATUS_SUCCESS;
+ return 0;
+}
+
+int
+min (unsigned int x, unsigned int y)
+{
+ if (x<y) return x; else return y;
+}
+
+/* DMXXX: for read and write, there's an issue with partially completed i/o */
+int
+spnfsd_read(struct spnfs_msg *im)
+{
+ unsigned long inode = im->im_args.read_args.inode;
+ unsigned long generation = im->im_args.read_args.generation;
+ loff_t offset = im->im_args.read_args.offset;
+ unsigned long len = im->im_args.read_args.len;
+ int ds, iolen;
+ loff_t soffset;
+ int bufoffset = 0;
+ char fullpath[1024]; /* DMXXX */
+ int fd, err;
+ int completed = 0;
+
+ im->im_status = SPNFS_STATUS_SUCCESS;
+ im->im_res.read_res.status = 0;
+ if (len > SPNFS_MAX_IO) {
+ im->im_res.read_res.status = -1;
+ return 0;
+ }
+ while (len > 0) {
+ ds = (offset / stripesize) % num_ds;
+ if (densestriping == 0)
+ soffset = offset;
+ else
+ soffset = (offset / num_ds) + (offset % stripesize);
+ iolen = min(len, stripesize - (offset % stripesize));
+
+ sprintf(fullpath, "%s/%s/%lu.%lu", dsmountdir,
+ dataservers[ds].ds_ip, inode, generation);
+ fd = open(fullpath, O_RDONLY);
+ if (fd < 0) {
+ perror(fullpath);
+ im->im_res.read_res.status = -errno;
+ return 0; /* DMXXX */
+ }
+ /* DM: add some error checking */
+ lseek64(fd, offset, SEEK_SET);
+ err = read(fd,
+ (void *)(im->im_res.read_res.data+bufoffset), iolen);
+ close(fd);
+ if (err < 0) {
+ perror("read");
+ im->im_res.read_res.status = -errno;
+ return 0; /* DMXXX */
+ }
+
+ if (err == 0)
+ break;
+ iolen = err; /* number of bytes read */
+ completed += iolen;
+ len -= iolen;
+ offset += iolen;
+ bufoffset += iolen;
+ }
+ im->im_res.read_res.status = completed;
+
+ return 0;
+}
+
+int
+spnfsd_write(struct spnfs_msg *im)
+{
+ unsigned long inode = im->im_args.write_args.inode;
+ unsigned long generation = im->im_args.write_args.generation;
+ loff_t offset = im->im_args.write_args.offset;
+ size_t len = im->im_args.write_args.len;
+ char *wbuf = im->im_args.write_args.data;
+ int ds, iolen;
+ loff_t soffset;
+ int bufoffset = 0;
+ char fullpath[1024]; /* DMXXX */
+ int fd, err;
+ int completed = 0;
+
+ im->im_status = SPNFS_STATUS_SUCCESS;
+ im->im_res.write_res.status = 0;
+ if (len > SPNFS_MAX_IO) {
+ printf("write length > SPNFS_MAX_IO\n");
+ im->im_res.write_res.status = -1;
+ return 0;
+ }
+ while (len > 0) {
+ ds = (offset / stripesize) % num_ds;
+ if (densestriping == 0)
+ soffset = offset;
+ else
+ soffset = (offset / num_ds) + (offset % stripesize);
+ iolen = min(len, stripesize - (offset % stripesize));
+
+ sprintf(fullpath, "%s/%s/%lu.%lu", dsmountdir,
+ dataservers[ds].ds_ip, inode, generation);
+ fd = open(fullpath, O_WRONLY);
+ if (fd < 0) {
+ perror(fullpath);
+ im->im_res.write_res.status = -errno;
+ return 0; /* DMXXX */
+ }
+ /* DM: add some error checking */
+ lseek64(fd, offset, SEEK_SET);
+ err = write(fd, (void *)(wbuf+bufoffset), iolen);
+ close(fd);
+ if (err < 0) {
+ perror("write");
+ im->im_res.write_res.status = -errno;
+ return 0; /* DMXXX */
+ }
+
+ iolen = err; /* number of bytes read */
+ completed += iolen;
+ len -= iolen;
+ offset += iolen;
+ bufoffset += iolen;
+ }
+ im->im_res.write_res.status = completed;
+ return 0;
+}
+
+int
+spnfsd_getfh(char *path, unsigned char *fh_val, unsigned int *fh_len)
+{
+ int fd, proc_fd;
+ unsigned char res[130]; /* XXX align this to proper structure */
+ extern void spnfsd_errx(int, const char *, ...);
+
+ /*
+ * hack to make sure there's an active data structure for this
+ * inode in the nfs client kernel space
+ */
+ if ((fd = open(path, O_RDONLY)) < 0) {
+ perror(path);
+ return -1;
+ }
+
+ /* fd to fh conversion */
+ proc_fd = open("/proc/fs/spnfs/getfh", O_RDWR);
+ if (proc_fd < 0) {
+ spnfsd_errx(1, "open getfh failed (%s)", strerror(errno));
+ }
+ if (write(proc_fd, &fd, sizeof(int)) < 0) {
+ spnfsd_errx(1, "write getfh failed (%s)", strerror(errno));
+ }
+ if (read(proc_fd, res, 130) <= 0) {
+ spnfsd_errx(1, "read getfh failed (%s)", strerror(errno));
+ }
+ close(proc_fd);
+
+ /* XXX use proper structure */
+ *fh_len = (short)res[0];
+ memcpy(fh_val, &res[2], *fh_len);
+
+ close(fd);
+ return 0;
+}
diff -up nfs-utils-1.2.3/utils/spnfsd/strlcat.c.orig nfs-utils-1.2.3/utils/spnfsd/strlcat.c
--- nfs-utils-1.2.3/utils/spnfsd/strlcat.c.orig 2010-10-04 15:48:00.085512992 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/strlcat.c 2010-10-04 15:48:00.085512992 -0400
@@ -0,0 +1,77 @@
+/* $OpenBSD: strlcat.c,v 1.8 2001/05/13 15:40:15 deraadt Exp $ */
+
+/*
+ * Copyright (c) 1998 Todd C. Miller <Todd.Miller@courtesan.com>
+ * All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ * 3. The name of the author may not be used to endorse or promote products
+ * derived from this software without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES,
+ * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY
+ * AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL
+ * THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
+ * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+ * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
+ * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+ * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
+ * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
+ * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#if defined(LIBC_SCCS) && !defined(lint)
+static char *rcsid = "$OpenBSD: strlcat.c,v 1.8 2001/05/13 15:40:15 deraadt Exp $";
+#endif /* LIBC_SCCS and not lint */
+
+#include <sys/types.h>
+#include <string.h>
+
+#ifdef HAVE_CONFIG_H
+#include "config.h"
+#endif /* HAVE_CONFIG_H */
+
+/*
+ * Appends src to string dst of size siz (unlike strncat, siz is the
+ * full size of dst, not space left). At most siz-1 characters
+ * will be copied. Always NUL terminates (unless siz <= strlen(dst)).
+ * Returns strlen(src) + MIN(siz, strlen(initial dst)).
+ * If retval >= siz, truncation occurred.
+ */
+size_t
+strlcat(dst, src, siz)
+ char *dst;
+ const char *src;
+ size_t siz;
+{
+ register char *d = dst;
+ register const char *s = src;
+ register size_t n = siz;
+ size_t dlen;
+
+ /* Find the end of dst and adjust bytes left but don't go past end */
+ while (n-- != 0 && *d != '\0')
+ d++;
+ dlen = d - dst;
+ n = siz - dlen;
+
+ if (n == 0)
+ return(dlen + strlen(s));
+ while (*s != '\0') {
+ if (n != 1) {
+ *d++ = *s;
+ n--;
+ }
+ s++;
+ }
+ *d = '\0';
+
+ return(dlen + (s - src)); /* count does not include NUL */
+}
diff -up nfs-utils-1.2.3/utils/spnfsd/strlcpy.c.orig nfs-utils-1.2.3/utils/spnfsd/strlcpy.c
--- nfs-utils-1.2.3/utils/spnfsd/strlcpy.c.orig 2010-10-04 15:48:00.086338923 -0400
+++ nfs-utils-1.2.3/utils/spnfsd/strlcpy.c 2010-10-04 15:48:00.086338923 -0400
@@ -0,0 +1,73 @@
+/* $OpenBSD: strlcpy.c,v 1.5 2001/05/13 15:40:16 deraadt Exp $ */
+
+/*
+ * Copyright (c) 1998 Todd C. Miller <Todd.Miller@courtesan.com>
+ * All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ * 3. The name of the author may not be used to endorse or promote products
+ * derived from this software without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES,
+ * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY
+ * AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL
+ * THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
+ * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+ * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
+ * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+ * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
+ * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
+ * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#if defined(LIBC_SCCS) && !defined(lint)
+static char *rcsid = "$OpenBSD: strlcpy.c,v 1.5 2001/05/13 15:40:16 deraadt Exp $";
+#endif /* LIBC_SCCS and not lint */
+
+#include <sys/types.h>
+#include <string.h>
+
+#ifdef HAVE_CONFIG_H
+#include "config.h"
+#endif /* HAVE_CONFIG_H */
+
+/*
+ * Copy src to string dst of size siz. At most siz-1 characters
+ * will be copied. Always NUL terminates (unless siz == 0).
+ * Returns strlen(src); if retval >= siz, truncation occurred.
+ */
+size_t
+strlcpy(dst, src, siz)
+ char *dst;
+ const char *src;
+ size_t siz;
+{
+ register char *d = dst;
+ register const char *s = src;
+ register size_t n = siz;
+
+ /* Copy as many bytes as will fit */
+ if (n != 0 && --n != 0) {
+ do {
+ if ((*d++ = *s++) == 0)
+ break;
+ } while (--n != 0);
+ }
+
+ /* Not enough room in dst, add NUL and traverse rest of src */
+ if (n == 0) {
+ if (siz != 0)
+ *d = '\0'; /* NUL-terminate dst */
+ while (*s++)
+ ;
+ }
+
+ return(s - src - 1); /* count does not include NUL */
+}