xref: /openbmc/linux/drivers/md/dm-ps-queue-length.c (revision 8ec456629d0bf051e41ef2c87a60755f941dd11c)
/*
 * Copyright (C) 2004-2005 IBM Corp.  All Rights Reserved.
 * Copyright (C) 2006-2009 NEC Corporation.
 *
 * dm-queue-length.c
 *
 * Module Author: Stefan Bader, IBM
 * Modified by: Kiyoshi Ueda, NEC
 *
 * This file is released under the GPL.
 *
 * queue-length path selector - choose a path with the least number of
 * in-flight I/Os.
 */
15298fb372SMike Snitzer 
16298fb372SMike Snitzer #include "dm.h"
17298fb372SMike Snitzer #include "dm-path-selector.h"
18298fb372SMike Snitzer 
19298fb372SMike Snitzer #include <linux/slab.h>
20298fb372SMike Snitzer #include <linux/ctype.h>
21298fb372SMike Snitzer #include <linux/errno.h>
22298fb372SMike Snitzer #include <linux/module.h>
23298fb372SMike Snitzer #include <linux/atomic.h>
24298fb372SMike Snitzer 
25298fb372SMike Snitzer #define DM_MSG_PREFIX	"multipath queue-length"
26298fb372SMike Snitzer #define QL_MIN_IO	1
27298fb372SMike Snitzer #define QL_VERSION	"0.2.0"
28298fb372SMike Snitzer 
29298fb372SMike Snitzer struct selector {
30298fb372SMike Snitzer 	struct list_head	valid_paths;
31298fb372SMike Snitzer 	struct list_head	failed_paths;
32298fb372SMike Snitzer 	spinlock_t lock;
33298fb372SMike Snitzer };
34298fb372SMike Snitzer 
35298fb372SMike Snitzer struct path_info {
36298fb372SMike Snitzer 	struct list_head	list;
37298fb372SMike Snitzer 	struct dm_path		*path;
38298fb372SMike Snitzer 	unsigned		repeat_count;
39298fb372SMike Snitzer 	atomic_t		qlen;	/* the number of in-flight I/Os */
40298fb372SMike Snitzer };
41298fb372SMike Snitzer 
42298fb372SMike Snitzer static struct selector *alloc_selector(void)
43298fb372SMike Snitzer {
44298fb372SMike Snitzer 	struct selector *s = kmalloc(sizeof(*s), GFP_KERNEL);
45298fb372SMike Snitzer 
46298fb372SMike Snitzer 	if (s) {
47298fb372SMike Snitzer 		INIT_LIST_HEAD(&s->valid_paths);
48298fb372SMike Snitzer 		INIT_LIST_HEAD(&s->failed_paths);
49298fb372SMike Snitzer 		spin_lock_init(&s->lock);
50298fb372SMike Snitzer 	}
51298fb372SMike Snitzer 
52298fb372SMike Snitzer 	return s;
53298fb372SMike Snitzer }
54298fb372SMike Snitzer 
55298fb372SMike Snitzer static int ql_create(struct path_selector *ps, unsigned argc, char **argv)
56298fb372SMike Snitzer {
57298fb372SMike Snitzer 	struct selector *s = alloc_selector();
58298fb372SMike Snitzer 
59298fb372SMike Snitzer 	if (!s)
60298fb372SMike Snitzer 		return -ENOMEM;
61298fb372SMike Snitzer 
62298fb372SMike Snitzer 	ps->context = s;
63298fb372SMike Snitzer 	return 0;
64298fb372SMike Snitzer }
65298fb372SMike Snitzer 
66298fb372SMike Snitzer static void ql_free_paths(struct list_head *paths)
67298fb372SMike Snitzer {
68298fb372SMike Snitzer 	struct path_info *pi, *next;
69298fb372SMike Snitzer 
70298fb372SMike Snitzer 	list_for_each_entry_safe(pi, next, paths, list) {
71298fb372SMike Snitzer 		list_del(&pi->list);
72298fb372SMike Snitzer 		kfree(pi);
73298fb372SMike Snitzer 	}
74298fb372SMike Snitzer }
75298fb372SMike Snitzer 
76298fb372SMike Snitzer static void ql_destroy(struct path_selector *ps)
77298fb372SMike Snitzer {
78298fb372SMike Snitzer 	struct selector *s = ps->context;
79298fb372SMike Snitzer 
80298fb372SMike Snitzer 	ql_free_paths(&s->valid_paths);
81298fb372SMike Snitzer 	ql_free_paths(&s->failed_paths);
82298fb372SMike Snitzer 	kfree(s);
83298fb372SMike Snitzer 	ps->context = NULL;
84298fb372SMike Snitzer }
85298fb372SMike Snitzer 
86298fb372SMike Snitzer static int ql_status(struct path_selector *ps, struct dm_path *path,
87298fb372SMike Snitzer 		     status_type_t type, char *result, unsigned maxlen)
88298fb372SMike Snitzer {
89298fb372SMike Snitzer 	unsigned sz = 0;
90298fb372SMike Snitzer 	struct path_info *pi;
91298fb372SMike Snitzer 
92298fb372SMike Snitzer 	/* When called with NULL path, return selector status/args. */
93298fb372SMike Snitzer 	if (!path)
94298fb372SMike Snitzer 		DMEMIT("0 ");
95298fb372SMike Snitzer 	else {
96298fb372SMike Snitzer 		pi = path->pscontext;
97298fb372SMike Snitzer 
98298fb372SMike Snitzer 		switch (type) {
99298fb372SMike Snitzer 		case STATUSTYPE_INFO:
100298fb372SMike Snitzer 			DMEMIT("%d ", atomic_read(&pi->qlen));
101298fb372SMike Snitzer 			break;
102298fb372SMike Snitzer 		case STATUSTYPE_TABLE:
103298fb372SMike Snitzer 			DMEMIT("%u ", pi->repeat_count);
104298fb372SMike Snitzer 			break;
105*8ec45662STushar Sugandhi 		case STATUSTYPE_IMA:
106*8ec45662STushar Sugandhi 			*result = '\0';
107*8ec45662STushar Sugandhi 			break;
108298fb372SMike Snitzer 		}
109298fb372SMike Snitzer 	}
110298fb372SMike Snitzer 
111298fb372SMike Snitzer 	return sz;
112298fb372SMike Snitzer }
113298fb372SMike Snitzer 
114298fb372SMike Snitzer static int ql_add_path(struct path_selector *ps, struct dm_path *path,
115298fb372SMike Snitzer 		       int argc, char **argv, char **error)
116298fb372SMike Snitzer {
117298fb372SMike Snitzer 	struct selector *s = ps->context;
118298fb372SMike Snitzer 	struct path_info *pi;
119298fb372SMike Snitzer 	unsigned repeat_count = QL_MIN_IO;
120298fb372SMike Snitzer 	char dummy;
121298fb372SMike Snitzer 	unsigned long flags;
122298fb372SMike Snitzer 
123298fb372SMike Snitzer 	/*
124298fb372SMike Snitzer 	 * Arguments: [<repeat_count>]
125298fb372SMike Snitzer 	 * 	<repeat_count>: The number of I/Os before switching path.
126298fb372SMike Snitzer 	 * 			If not given, default (QL_MIN_IO) is used.
127298fb372SMike Snitzer 	 */
128298fb372SMike Snitzer 	if (argc > 1) {
129298fb372SMike Snitzer 		*error = "queue-length ps: incorrect number of arguments";
130298fb372SMike Snitzer 		return -EINVAL;
131298fb372SMike Snitzer 	}
132298fb372SMike Snitzer 
133298fb372SMike Snitzer 	if ((argc == 1) && (sscanf(argv[0], "%u%c", &repeat_count, &dummy) != 1)) {
134298fb372SMike Snitzer 		*error = "queue-length ps: invalid repeat count";
135298fb372SMike Snitzer 		return -EINVAL;
136298fb372SMike Snitzer 	}
137298fb372SMike Snitzer 
138298fb372SMike Snitzer 	if (repeat_count > 1) {
139298fb372SMike Snitzer 		DMWARN_LIMIT("repeat_count > 1 is deprecated, using 1 instead");
140298fb372SMike Snitzer 		repeat_count = 1;
141298fb372SMike Snitzer 	}
142298fb372SMike Snitzer 
143298fb372SMike Snitzer 	/* Allocate the path information structure */
144298fb372SMike Snitzer 	pi = kmalloc(sizeof(*pi), GFP_KERNEL);
145298fb372SMike Snitzer 	if (!pi) {
146298fb372SMike Snitzer 		*error = "queue-length ps: Error allocating path information";
147298fb372SMike Snitzer 		return -ENOMEM;
148298fb372SMike Snitzer 	}
149298fb372SMike Snitzer 
150298fb372SMike Snitzer 	pi->path = path;
151298fb372SMike Snitzer 	pi->repeat_count = repeat_count;
152298fb372SMike Snitzer 	atomic_set(&pi->qlen, 0);
153298fb372SMike Snitzer 
154298fb372SMike Snitzer 	path->pscontext = pi;
155298fb372SMike Snitzer 
156298fb372SMike Snitzer 	spin_lock_irqsave(&s->lock, flags);
157298fb372SMike Snitzer 	list_add_tail(&pi->list, &s->valid_paths);
158298fb372SMike Snitzer 	spin_unlock_irqrestore(&s->lock, flags);
159298fb372SMike Snitzer 
160298fb372SMike Snitzer 	return 0;
161298fb372SMike Snitzer }
162298fb372SMike Snitzer 
163298fb372SMike Snitzer static void ql_fail_path(struct path_selector *ps, struct dm_path *path)
164298fb372SMike Snitzer {
165298fb372SMike Snitzer 	struct selector *s = ps->context;
166298fb372SMike Snitzer 	struct path_info *pi = path->pscontext;
167298fb372SMike Snitzer 	unsigned long flags;
168298fb372SMike Snitzer 
169298fb372SMike Snitzer 	spin_lock_irqsave(&s->lock, flags);
170298fb372SMike Snitzer 	list_move(&pi->list, &s->failed_paths);
171298fb372SMike Snitzer 	spin_unlock_irqrestore(&s->lock, flags);
172298fb372SMike Snitzer }
173298fb372SMike Snitzer 
174298fb372SMike Snitzer static int ql_reinstate_path(struct path_selector *ps, struct dm_path *path)
175298fb372SMike Snitzer {
176298fb372SMike Snitzer 	struct selector *s = ps->context;
177298fb372SMike Snitzer 	struct path_info *pi = path->pscontext;
178298fb372SMike Snitzer 	unsigned long flags;
179298fb372SMike Snitzer 
180298fb372SMike Snitzer 	spin_lock_irqsave(&s->lock, flags);
181298fb372SMike Snitzer 	list_move_tail(&pi->list, &s->valid_paths);
182298fb372SMike Snitzer 	spin_unlock_irqrestore(&s->lock, flags);
183298fb372SMike Snitzer 
184298fb372SMike Snitzer 	return 0;
185298fb372SMike Snitzer }
186298fb372SMike Snitzer 
187298fb372SMike Snitzer /*
188298fb372SMike Snitzer  * Select a path having the minimum number of in-flight I/Os
189298fb372SMike Snitzer  */
190298fb372SMike Snitzer static struct dm_path *ql_select_path(struct path_selector *ps, size_t nr_bytes)
191298fb372SMike Snitzer {
192298fb372SMike Snitzer 	struct selector *s = ps->context;
193298fb372SMike Snitzer 	struct path_info *pi = NULL, *best = NULL;
194298fb372SMike Snitzer 	struct dm_path *ret = NULL;
195298fb372SMike Snitzer 	unsigned long flags;
196298fb372SMike Snitzer 
197298fb372SMike Snitzer 	spin_lock_irqsave(&s->lock, flags);
198298fb372SMike Snitzer 	if (list_empty(&s->valid_paths))
199298fb372SMike Snitzer 		goto out;
200298fb372SMike Snitzer 
201298fb372SMike Snitzer 	list_for_each_entry(pi, &s->valid_paths, list) {
202298fb372SMike Snitzer 		if (!best ||
203298fb372SMike Snitzer 		    (atomic_read(&pi->qlen) < atomic_read(&best->qlen)))
204298fb372SMike Snitzer 			best = pi;
205298fb372SMike Snitzer 
206298fb372SMike Snitzer 		if (!atomic_read(&best->qlen))
207298fb372SMike Snitzer 			break;
208298fb372SMike Snitzer 	}
209298fb372SMike Snitzer 
210298fb372SMike Snitzer 	if (!best)
211298fb372SMike Snitzer 		goto out;
212298fb372SMike Snitzer 
213298fb372SMike Snitzer 	/* Move most recently used to least preferred to evenly balance. */
214298fb372SMike Snitzer 	list_move_tail(&best->list, &s->valid_paths);
215298fb372SMike Snitzer 
216298fb372SMike Snitzer 	ret = best->path;
217298fb372SMike Snitzer out:
218298fb372SMike Snitzer 	spin_unlock_irqrestore(&s->lock, flags);
219298fb372SMike Snitzer 	return ret;
220298fb372SMike Snitzer }
221298fb372SMike Snitzer 
222298fb372SMike Snitzer static int ql_start_io(struct path_selector *ps, struct dm_path *path,
223298fb372SMike Snitzer 		       size_t nr_bytes)
224298fb372SMike Snitzer {
225298fb372SMike Snitzer 	struct path_info *pi = path->pscontext;
226298fb372SMike Snitzer 
227298fb372SMike Snitzer 	atomic_inc(&pi->qlen);
228298fb372SMike Snitzer 
229298fb372SMike Snitzer 	return 0;
230298fb372SMike Snitzer }
231298fb372SMike Snitzer 
232298fb372SMike Snitzer static int ql_end_io(struct path_selector *ps, struct dm_path *path,
233298fb372SMike Snitzer 		     size_t nr_bytes, u64 start_time)
234298fb372SMike Snitzer {
235298fb372SMike Snitzer 	struct path_info *pi = path->pscontext;
236298fb372SMike Snitzer 
237298fb372SMike Snitzer 	atomic_dec(&pi->qlen);
238298fb372SMike Snitzer 
239298fb372SMike Snitzer 	return 0;
240298fb372SMike Snitzer }
241298fb372SMike Snitzer 
242298fb372SMike Snitzer static struct path_selector_type ql_ps = {
243298fb372SMike Snitzer 	.name		= "queue-length",
244298fb372SMike Snitzer 	.module		= THIS_MODULE,
245298fb372SMike Snitzer 	.table_args	= 1,
246298fb372SMike Snitzer 	.info_args	= 1,
247298fb372SMike Snitzer 	.create		= ql_create,
248298fb372SMike Snitzer 	.destroy	= ql_destroy,
249298fb372SMike Snitzer 	.status		= ql_status,
250298fb372SMike Snitzer 	.add_path	= ql_add_path,
251298fb372SMike Snitzer 	.fail_path	= ql_fail_path,
252298fb372SMike Snitzer 	.reinstate_path	= ql_reinstate_path,
253298fb372SMike Snitzer 	.select_path	= ql_select_path,
254298fb372SMike Snitzer 	.start_io	= ql_start_io,
255298fb372SMike Snitzer 	.end_io		= ql_end_io,
256298fb372SMike Snitzer };
257298fb372SMike Snitzer 
258298fb372SMike Snitzer static int __init dm_ql_init(void)
259298fb372SMike Snitzer {
260298fb372SMike Snitzer 	int r = dm_register_path_selector(&ql_ps);
261298fb372SMike Snitzer 
262298fb372SMike Snitzer 	if (r < 0)
263298fb372SMike Snitzer 		DMERR("register failed %d", r);
264298fb372SMike Snitzer 
265298fb372SMike Snitzer 	DMINFO("version " QL_VERSION " loaded");
266298fb372SMike Snitzer 
267298fb372SMike Snitzer 	return r;
268298fb372SMike Snitzer }
269298fb372SMike Snitzer 
270298fb372SMike Snitzer static void __exit dm_ql_exit(void)
271298fb372SMike Snitzer {
272298fb372SMike Snitzer 	int r = dm_unregister_path_selector(&ql_ps);
273298fb372SMike Snitzer 
274298fb372SMike Snitzer 	if (r < 0)
275298fb372SMike Snitzer 		DMERR("unregister failed %d", r);
276298fb372SMike Snitzer }
277298fb372SMike Snitzer 
278298fb372SMike Snitzer module_init(dm_ql_init);
279298fb372SMike Snitzer module_exit(dm_ql_exit);
280298fb372SMike Snitzer 
281298fb372SMike Snitzer MODULE_AUTHOR("Stefan Bader <Stefan.Bader at de.ibm.com>");
282298fb372SMike Snitzer MODULE_DESCRIPTION(
283298fb372SMike Snitzer 	"(C) Copyright IBM Corp. 2004,2005   All Rights Reserved.\n"
284298fb372SMike Snitzer 	DM_NAME " path selector to balance the number of in-flight I/Os"
285298fb372SMike Snitzer );
286298fb372SMike Snitzer MODULE_LICENSE("GPL");
287