[dm-devel] [PATCH RFC 1/2] dm-mp dm_evt hardware handler

Mike Anderson andmike at us.ibm.com
Wed Nov 9 07:55:48 UTC 2005


This patch adds a dm-mp hardware handler that sends events over netlink
when its error function is called.

Signed-off-by: Mike Anderson <andmike at us.ibm.com>

---
 drivers/md/Kconfig      |    5 
 drivers/md/Makefile     |    1 
 drivers/md/dm-evt.c     |  330 ++++++++++++++++++++++++++++++++++++++++++++++++
 drivers/md/dm-mpath.c   |   18 --
 drivers/md/dm-mpath.h   |   19 ++
 include/linux/dm-evt.h  |   46 ++++++
 include/linux/netlink.h |    1 
 7 files changed, 402 insertions(+), 18 deletions(-)

Index: sas-2.6-patched/drivers/md/dm-evt.c
===================================================================
--- /dev/null	1970-01-01 00:00:00.000000000 +0000
+++ sas-2.6-patched/drivers/md/dm-evt.c	2005-11-08 23:14:36.000000000 -0800
@@ -0,0 +1,330 @@
+/*
+ * Device Mapper Event Handler (dm-evt)
+ *
+ * Copyright (C) 2005 IBM Corporation
+ * Copyright (C) 2005 Mike Anderson <andmike at us.ibm.com>
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
+ *
+ * skb mempool derived from drivers/scsi/scsi_transport_iscsi.c
+ *
+ */
+#include <linux/module.h>
+#include <linux/mempool.h>
+#include <net/tcp.h>
+#include <linux/dm-evt.h>
+#include <linux/time.h>
+#include "dm.h"
+#include "dm-hw-handler.h"
+
+#define MIN_NR_EVT_SKBS	16	/* min_nr given to the skb mempool */
+#define HIWAT_EVT_SKBS 32	/* stored as the zone's hiwat */
+
+struct mempool_zone {	/* skb mempool plus a list of skbs handed out from it */
+	mempool_t *pool;	/* backing mempool; elements are sk_buffs */
+	int allocated;	/* number of skbs currently on freequeue */
+	int size;	/* data size passed to alloc_skb() per element */
+	int hiwat;	/* set by mempool_zone_init(); not read in this patch */
+	struct list_head freequeue;	/* skbs handed out, not yet reclaimed */
+	spinlock_t freelock;	/* held around freequeue/allocated updates */
+};
+
+static struct mempool_zone z_dm_evt;	/* skbs for outgoing event messages */
+
+static struct sock *dm_evt_sock;	/* created in dm_evt_init() */
+static int dm_evt_daemon_pid;	/* netlink pid of the listener; 0 = none */
+
+static inline struct list_head *skb_to_lh(struct sk_buff *skb)
+{	/* Return the list node that is overlaid on the start of skb->cb. */
+	return (struct list_head *)&skb->cb;
+}
+
+static void* mempool_zone_alloc_skb(unsigned int gfp_mask,
+				    void *pool_data)
+{	/* mempool alloc callback; pool_data is the owning mempool_zone. */
+	struct mempool_zone *zone = pool_data;
+
+	return alloc_skb(zone->size, gfp_mask);	/* NULL on failure */
+}
+
+static void mempool_zone_free_skb(void *element, void *pool_data)
+{	/* mempool free callback: element is an sk_buff; pool_data is unused. */
+	kfree_skb(element);
+}
+
+static void
+mempool_zone_complete(struct mempool_zone *zone, int release_all)
+{	/* Return tracked skbs to the pool; release_all also takes shared ones. */
+	unsigned long flags;
+	struct list_head *lh, *n;
+
+	spin_lock_irqsave(&zone->freelock, flags);
+	if (zone->allocated) {
+		list_for_each_safe(lh, n, &zone->freequeue) {
+			struct sk_buff *skb =	/* inverse of skb_to_lh() */
+				(struct sk_buff *)((char *)lh -
+				 offsetof(struct sk_buff, cb));
+			if (skb_shared(skb)) {	/* another reference exists */
+				if (release_all)
+					kfree_skb(skb);	/* drop one ref first */
+				else
+					continue;	/* leave it queued */
+			}
+
+			list_del(skb_to_lh(skb));
+			mempool_free(skb, zone->pool);
+			--zone->allocated;
+
+		}
+	}
+	spin_unlock_irqrestore(&zone->freelock, flags);
+}
+
+/* Set up @zp with @min_nr reserved skbs of @size bytes; 0 or -ENOMEM. */
+static int mempool_zone_init(struct mempool_zone *zp, unsigned size,
+			     int min_nr, unsigned hiwat)
+{
+	zp->size = size;
+	zp->hiwat = hiwat;
+	zp->allocated = 0;
+	INIT_LIST_HEAD(&zp->freequeue);
+	spin_lock_init(&zp->freelock);
+	/* Created last: preallocation calls the alloc hook, which reads size. */
+	zp->pool = mempool_create(min_nr, mempool_zone_alloc_skb,
+				  mempool_zone_free_skb, zp);
+	if (!zp->pool)
+		return -ENOMEM;
+	return 0;
+}
+
+/* Get an skb from @zone and track it on its freequeue; NULL on failure. */
+static struct sk_buff* mempool_zone_get_skb(struct mempool_zone *zone)
+{
+	struct sk_buff *skb;
+	unsigned long flags;
+
+	/* Reclaim tracked skbs that are no longer shared before allocating. */
+	mempool_zone_complete(zone, 0);
+	skb = mempool_alloc(zone->pool, GFP_ATOMIC);
+	if (!skb)
+		return NULL;
+	skb_get(skb);	/* extra ref keeps the skb "shared" while in flight */
+	spin_lock_irqsave(&zone->freelock, flags);
+	list_add(skb_to_lh(skb), &zone->freequeue);
+	++zone->allocated;
+	spin_unlock_irqrestore(&zone->freelock, flags);
+	return skb;
+}
+
+static int dm_evt_create(struct hw_handler *hwh, unsigned argc, char **argv)
+{	/* hw_handler .create hook: arguments are ignored, always succeeds. */
+	return 0;
+}
+
+static void dm_evt_destroy(struct hw_handler *hwh)
+{	/* hw_handler .destroy hook: nothing to tear down. */
+	return;
+}
+
+#ifndef BLKERR_IO	/* only used if no included header defines it */
+#define BLKERR_IO 0x5A5A5A5A	/* NOTE(review): looks like a placeholder */
+#endif
+
+static int dm_evt_send_nl_evt(struct path *path, struct bio *bio)
+{
+	struct sk_buff	*skb;
+	struct nlmsghdr	*nlh;
+	struct dm_evt_msg *dm_evt;
+	struct timeval tv;
+	int err = -ENOMEM;
+	unsigned int blk_err = BLKERR_IO;
+
+	if (!dm_evt_sock || !dm_evt_daemon_pid)
+		return 0;
+
+	skb = mempool_zone_get_skb(&z_dm_evt);
+	if (!skb)
+		goto out;
+
+	nlh = NLMSG_PUT(skb, dm_evt_daemon_pid, 0, DM_EVENT_PATH_ERR,
+			sizeof(*dm_evt));
+	dm_evt = NLMSG_DATA(nlh);
+	strncpy(dm_evt->dm_name, path->dev->name, sizeof(dm_evt->dm_name));
+	do_gettimeofday(&tv);
+	dm_evt->tv_sec = tv.tv_sec;
+	dm_evt->tv_usec = tv.tv_usec;
+	dm_evt->u.patherr.blk_err = blk_err;
+
+	nlh = (struct nlmsghdr *) skb->data;
+
+	err = netlink_unicast(dm_evt_sock, skb, dm_evt_daemon_pid,
+			      MSG_DONTWAIT);
+	if (err < 0)
+		goto unicast_failure;
+	return err;
+
+unicast_failure:
+nlmsg_failure:
+	kfree_skb(skb);
+	mempool_zone_complete(&z_dm_evt, 0);
+out:
+	DMERR("%s: failed %d", __FUNCTION__, err);
+	return err;
+
+}
+
+
+static unsigned dm_evt_error(struct hw_handler *hwh, struct bio *bio)
+{	/* hw_handler .error hook: emit an event, always return MP_FAIL_PATH. */
+	int err;
+	union map_info *info;
+	struct mpath_io *mpio;
+	struct path *path;
+
+	info = dm_get_mapinfo(bio);
+	mpio = info->ptr;	/* per-bio context, treated as struct mpath_io */
+	path = &mpio->pgpath->path;
+
+	if (path->is_active) {	/* no event if the path is not active */
+		err = dm_evt_send_nl_evt(path, bio);	/* result not acted on */
+	}
+
+	return MP_FAIL_PATH;
+}
+
+#define RCV_SKB_FAIL(err) do { netlink_ack(skb, nlh, (err)); return; } while (0)
+/* Handle one message from userspace: record its sender as the daemon. */
+static void dm_evt_rcv_msg(struct sk_buff *skb)
+{
+	int pid, flags;
+	struct nlmsghdr *nlh = (struct nlmsghdr *) skb->data;
+
+	if (skb->len >= NLMSG_SPACE(0)) {
+
+		if (nlh->nlmsg_len < sizeof(*nlh) ||
+			skb->len < nlh->nlmsg_len) {
+			return;	/* bad length: dropped without an ack */
+		}
+		pid = nlh->nlmsg_pid;
+		flags = nlh->nlmsg_flags;
+
+		if (security_netlink_recv(skb))
+			RCV_SKB_FAIL(-EPERM);
+
+		if (dm_evt_daemon_pid) {
+			if (dm_evt_daemon_pid != pid) {
+				RCV_SKB_FAIL(-EBUSY);	/* a different pid is set */
+			}
+		} else {
+			dm_evt_daemon_pid = pid;	/* first sender is kept */
+		}
+
+		if (flags & NLM_F_ACK)
+			netlink_ack(skb, nlh, 0);
+	}
+}
+
+static void dm_evt_rcv(struct sock *sk, int len)
+{	/* Input callback given to netlink_kernel_create(); len is unused. */
+	struct sk_buff *skb;
+	unsigned int qlen;
+
+	for (qlen = skb_queue_len(&sk->sk_receive_queue); qlen; qlen--) {
+		skb = skb_dequeue(&sk->sk_receive_queue);
+		dm_evt_rcv_msg(skb);
+		kfree_skb(skb);	/* message handled: release it */
+	}
+}
+
+static int dm_evt_rcv_nl_event(struct notifier_block *this, unsigned long event, void *ptr)
+{	/* Netlink notifier: react to release of a NETLINK_DM_EVENT socket. */
+	struct netlink_notify *n = ptr;
+
+	if (event == NETLINK_URELEASE &&
+	    n->protocol == NETLINK_DM_EVENT && n->pid) {
+		if ( n->pid == dm_evt_daemon_pid  ) {
+			dm_evt_daemon_pid = 0;	/* sends become no-ops again */
+		}
+		mempool_zone_complete(&z_dm_evt, 1);	/* reclaim shared skbs too */
+	}
+
+	return NOTIFY_DONE;
+}
+
+static struct hw_handler_type dm_evt_hwh = {	/* registered in dm_evt_init() */
+	.name = "dm-evt",
+	.module = THIS_MODULE,
+	.create = dm_evt_create,	/* returns 0, does nothing else */
+	.destroy = dm_evt_destroy,	/* does nothing */
+	.error = dm_evt_error,	/* sends the netlink event */
+};
+
+static struct notifier_block dm_evt_nl_notifier = {	/* netlink notifier */
+	.notifier_call  = dm_evt_rcv_nl_event,	/* acts on NETLINK_URELEASE */
+};
+
+static int __init dm_evt_init(void)
+{	/* Module init: notifier, netlink socket, skb zone, then hw handler. */
+	int err;
+
+	err = netlink_register_notifier(&dm_evt_nl_notifier);
+	if (err)
+		return err;
+
+	dm_evt_sock = netlink_kernel_create(NETLINK_DM_EVENT, 0,
+					    dm_evt_rcv, THIS_MODULE);
+	if (!dm_evt_sock) {
+		err = -ENOBUFS;
+		goto unregister_notifier;
+	}
+
+	err = mempool_zone_init(&z_dm_evt, NLMSG_SPACE(sizeof(struct
+							      dm_evt_msg)),
+				MIN_NR_EVT_SKBS, HIWAT_EVT_SKBS);
+	if (err)
+		goto release_socket;
+
+	err = dm_register_hw_handler(&dm_evt_hwh);
+	if (err)
+		goto release_zone;
+
+	DMINFO("dm-evt version 0.0.2 loaded");
+
+	return err;	/* 0 here: the last registration succeeded */
+
+release_zone:	/* error unwind: undo the completed steps in reverse order */
+	mempool_destroy(z_dm_evt.pool);
+release_socket:
+	sock_release(dm_evt_sock->sk_socket);
+unregister_notifier:
+	netlink_unregister_notifier(&dm_evt_nl_notifier);
+	DMERR("%s: failed %d", __FUNCTION__, err);
+	return err;
+}
+
+static void __exit dm_evt_exit(void)
+{	/* Module exit: release what dm_evt_init() set up. */
+	dm_unregister_hw_handler(&dm_evt_hwh);
+	/* NOTE(review): freequeue is not drained before this - confirm safe */ mempool_destroy(z_dm_evt.pool);
+	sock_release(dm_evt_sock->sk_socket);
+	netlink_unregister_notifier(&dm_evt_nl_notifier);
+}
+
+module_init(dm_evt_init);
+module_exit(dm_evt_exit);
+
+MODULE_DESCRIPTION(DM_NAME "dm-evt multipath hwh");
+MODULE_AUTHOR("Mike Anderson <andmike at us.ibm.com>");
+MODULE_LICENSE("GPL");
Index: sas-2.6-patched/drivers/md/Makefile
===================================================================
--- sas-2.6-patched.orig/drivers/md/Makefile	2005-11-02 13:59:04.000000000 -0800
+++ sas-2.6-patched/drivers/md/Makefile	2005-11-02 13:59:31.000000000 -0800
@@ -34,6 +34,7 @@ obj-$(CONFIG_BLK_DEV_DM)	+= dm-mod.o
 obj-$(CONFIG_DM_CRYPT)		+= dm-crypt.o
 obj-$(CONFIG_DM_MULTIPATH)	+= dm-multipath.o dm-round-robin.o
 obj-$(CONFIG_DM_MULTIPATH_EMC)	+= dm-emc.o
+obj-$(CONFIG_DM_MULTIPATH_EVT)	+= dm-evt.o
 obj-$(CONFIG_DM_SNAPSHOT)	+= dm-snapshot.o
 obj-$(CONFIG_DM_MIRROR)		+= dm-mirror.o
 obj-$(CONFIG_DM_ZERO)		+= dm-zero.o
Index: sas-2.6-patched/include/linux/netlink.h
===================================================================
--- sas-2.6-patched.orig/include/linux/netlink.h	2005-11-02 13:59:04.000000000 -0800
+++ sas-2.6-patched/include/linux/netlink.h	2005-11-02 13:59:31.000000000 -0800
@@ -21,6 +21,7 @@
 #define NETLINK_DNRTMSG		14	/* DECnet routing messages */
 #define NETLINK_KOBJECT_UEVENT	15	/* Kernel messages to userspace */
 #define NETLINK_GENERIC		16
+#define NETLINK_DM_EVENT	17	/* DM Event */
 
 #define MAX_LINKS 32		
 
Index: sas-2.6-patched/include/linux/dm-evt.h
===================================================================
--- /dev/null	1970-01-01 00:00:00.000000000 +0000
+++ sas-2.6-patched/include/linux/dm-evt.h	2005-11-07 11:28:35.000000000 -0800
@@ -0,0 +1,46 @@
+/*
+ * Device Mapper Event Handler
+ *
+ * Copyright (C) 2005 IBM Corporation
+ * Copyright (C) 2005 Mike Anderson <andmike at us.ibm.com>
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
+ *
+ */
+#ifndef DM_EVENT_H
+#define DM_EVENT_H
+#include <linux/types.h>
+
+#define EVT_DM_NAME_LEN 16
+
+#define DM_EVENT_BASE	10
+enum dm_evt_e {	/* event types; dm-evt.c passes these as the nlmsg type */
+	DM_EVENT_UNKOWN		= 0,
+	DM_EVENT_PATH_ERR	= DM_EVENT_BASE + 1,	/* sent on a path error */
+};
+
+struct dm_evt_msg {	/* payload of a dm event netlink message */
+	uint8_t dm_name[EVT_DM_NAME_LEN];	/* dm-evt.c copies path->dev->name */
+	uint64_t tv_sec;	/* event time: seconds */
+	uint64_t tv_usec;	/* event time: microseconds */
+
+	union {
+		struct msg_path_err {	/* used with DM_EVENT_PATH_ERR */
+			uint32_t blk_err; /* BLKERR Values */
+		} patherr;
+	} u;
+} __attribute__((aligned(sizeof(uint64_t))));
+
+#endif
Index: sas-2.6-patched/drivers/md/Kconfig
===================================================================
--- sas-2.6-patched.orig/drivers/md/Kconfig	2005-11-02 13:59:04.000000000 -0800
+++ sas-2.6-patched/drivers/md/Kconfig	2005-11-02 13:59:31.000000000 -0800
@@ -235,6 +235,11 @@ config DM_MULTIPATH_EMC
 	depends on DM_MULTIPATH && BLK_DEV_DM && EXPERIMENTAL
 	---help---
 	  Multipath support for EMC CX/AX series hardware.
+config DM_MULTIPATH_EVT
+	tristate "Generate netlink events for multipath failures"
+	depends on DM_MULTIPATH && BLK_DEV_DM && EXPERIMENTAL
+	---help---
+	  Sends a netlink event to userspace when a multipath path error occurs.
 
 endmenu
 
Index: sas-2.6-patched/drivers/md/dm-mpath.c
===================================================================
--- sas-2.6-patched.orig/drivers/md/dm-mpath.c	2005-11-02 13:59:04.000000000 -0800
+++ sas-2.6-patched/drivers/md/dm-mpath.c	2005-11-02 13:59:31.000000000 -0800
@@ -23,16 +23,6 @@
 
 #define MESG_STR(x) x, sizeof(x)
 
-/* Path properties */
-struct pgpath {
-	struct list_head list;
-
-	struct priority_group *pg;	/* Owning PG */
-	unsigned fail_count;		/* Cumulative failure count */
-
-	struct path path;
-};
-
 #define path_to_pgpath(__pgp) container_of((__pgp), struct pgpath, path)
 
 /*
@@ -88,14 +78,6 @@ struct multipath {
 	mempool_t *mpio_pool;
 };
 
-/*
- * Context information attached to each bio we process.
- */
-struct mpath_io {
-	struct pgpath *pgpath;
-	struct dm_bio_details details;
-};
-
 typedef int (*action_fn) (struct pgpath *pgpath);
 
 #define MIN_IOS 256	/* Mempool size */
Index: sas-2.6-patched/drivers/md/dm-mpath.h
===================================================================
--- sas-2.6-patched.orig/drivers/md/dm-mpath.h	2005-11-02 13:59:04.000000000 -0800
+++ sas-2.6-patched/drivers/md/dm-mpath.h	2005-11-02 13:59:31.000000000 -0800
@@ -8,6 +8,7 @@
 
 #ifndef	DM_MPATH_H
 #define	DM_MPATH_H
+#include "dm-bio-record.h"
 
 struct dm_dev;
 
@@ -19,6 +20,24 @@ struct path {
 	void *hwhcontext;	/* For hw-handler use */
 };
 
+/* Path properties */
+struct pgpath {
+	struct list_head list;
+
+	struct priority_group *pg;	/* Owning PG */
+	unsigned fail_count;		/* Cumulative failure count */
+
+	struct path path;	/* embedded; path_to_pgpath() maps back to pgpath */
+};
+
+/*
+ * Context information attached to each bio we process.
+ */
+struct mpath_io {
+	struct pgpath *pgpath;	/* dm_evt_error() follows this to the path */
+	struct dm_bio_details details;	/* type from dm-bio-record.h */
+};
+
 /* Callback for hwh_pg_init_fn to use when complete */
 void dm_pg_init_complete(struct path *path, unsigned err_flags);
 




More information about the dm-devel mailing list