1298fb372SMike Snitzer /* 2298fb372SMike Snitzer * Copyright (C) 2004-2005 IBM Corp. All Rights Reserved. 3298fb372SMike Snitzer * Copyright (C) 2006-2009 NEC Corporation. 4298fb372SMike Snitzer * 5298fb372SMike Snitzer * dm-queue-length.c 6298fb372SMike Snitzer * 7298fb372SMike Snitzer * Module Author: Stefan Bader, IBM 8298fb372SMike Snitzer * Modified by: Kiyoshi Ueda, NEC 9298fb372SMike Snitzer * 10298fb372SMike Snitzer * This file is released under the GPL. 11298fb372SMike Snitzer * 12298fb372SMike Snitzer * queue-length path selector - choose a path with the least number of 13298fb372SMike Snitzer * in-flight I/Os. 14298fb372SMike Snitzer */ 15298fb372SMike Snitzer 16298fb372SMike Snitzer #include "dm.h" 17298fb372SMike Snitzer #include "dm-path-selector.h" 18298fb372SMike Snitzer 19298fb372SMike Snitzer #include <linux/slab.h> 20298fb372SMike Snitzer #include <linux/ctype.h> 21298fb372SMike Snitzer #include <linux/errno.h> 22298fb372SMike Snitzer #include <linux/module.h> 23298fb372SMike Snitzer #include <linux/atomic.h> 24298fb372SMike Snitzer 25298fb372SMike Snitzer #define DM_MSG_PREFIX "multipath queue-length" 26298fb372SMike Snitzer #define QL_MIN_IO 1 27298fb372SMike Snitzer #define QL_VERSION "0.2.0" 28298fb372SMike Snitzer 29298fb372SMike Snitzer struct selector { 30298fb372SMike Snitzer struct list_head valid_paths; 31298fb372SMike Snitzer struct list_head failed_paths; 32298fb372SMike Snitzer spinlock_t lock; 33298fb372SMike Snitzer }; 34298fb372SMike Snitzer 35298fb372SMike Snitzer struct path_info { 36298fb372SMike Snitzer struct list_head list; 37298fb372SMike Snitzer struct dm_path *path; 38298fb372SMike Snitzer unsigned repeat_count; 39298fb372SMike Snitzer atomic_t qlen; /* the number of in-flight I/Os */ 40298fb372SMike Snitzer }; 41298fb372SMike Snitzer 42298fb372SMike Snitzer static struct selector *alloc_selector(void) 43298fb372SMike Snitzer { 44298fb372SMike Snitzer struct selector *s = kmalloc(sizeof(*s), GFP_KERNEL); 45298fb372SMike Snitzer 46298fb372SMike Snitzer if (s) { 47298fb372SMike Snitzer INIT_LIST_HEAD(&s->valid_paths); 48298fb372SMike Snitzer INIT_LIST_HEAD(&s->failed_paths); 49298fb372SMike Snitzer spin_lock_init(&s->lock); 50298fb372SMike Snitzer } 51298fb372SMike Snitzer 52298fb372SMike Snitzer return s; 53298fb372SMike Snitzer } 54298fb372SMike Snitzer 55298fb372SMike Snitzer static int ql_create(struct path_selector *ps, unsigned argc, char **argv) 56298fb372SMike Snitzer { 57298fb372SMike Snitzer struct selector *s = alloc_selector(); 58298fb372SMike Snitzer 59298fb372SMike Snitzer if (!s) 60298fb372SMike Snitzer return -ENOMEM; 61298fb372SMike Snitzer 62298fb372SMike Snitzer ps->context = s; 63298fb372SMike Snitzer return 0; 64298fb372SMike Snitzer } 65298fb372SMike Snitzer 66298fb372SMike Snitzer static void ql_free_paths(struct list_head *paths) 67298fb372SMike Snitzer { 68298fb372SMike Snitzer struct path_info *pi, *next; 69298fb372SMike Snitzer 70298fb372SMike Snitzer list_for_each_entry_safe(pi, next, paths, list) { 71298fb372SMike Snitzer list_del(&pi->list); 72298fb372SMike Snitzer kfree(pi); 73298fb372SMike Snitzer } 74298fb372SMike Snitzer } 75298fb372SMike Snitzer 76298fb372SMike Snitzer static void ql_destroy(struct path_selector *ps) 77298fb372SMike Snitzer { 78298fb372SMike Snitzer struct selector *s = ps->context; 79298fb372SMike Snitzer 80298fb372SMike Snitzer ql_free_paths(&s->valid_paths); 81298fb372SMike Snitzer ql_free_paths(&s->failed_paths); 82298fb372SMike Snitzer kfree(s); 83298fb372SMike Snitzer ps->context = NULL; 84298fb372SMike Snitzer } 85298fb372SMike Snitzer 86298fb372SMike Snitzer static int ql_status(struct path_selector *ps, struct dm_path *path, 87298fb372SMike Snitzer status_type_t type, char *result, unsigned maxlen) 88298fb372SMike Snitzer { 89298fb372SMike Snitzer unsigned sz = 0; 90298fb372SMike Snitzer struct path_info *pi; 91298fb372SMike Snitzer 92298fb372SMike Snitzer /* When called with NULL path, return selector status/args. */ 93298fb372SMike Snitzer if (!path) 94298fb372SMike Snitzer DMEMIT("0 "); 95298fb372SMike Snitzer else { 96298fb372SMike Snitzer pi = path->pscontext; 97298fb372SMike Snitzer 98298fb372SMike Snitzer switch (type) { 99298fb372SMike Snitzer case STATUSTYPE_INFO: 100298fb372SMike Snitzer DMEMIT("%d ", atomic_read(&pi->qlen)); 101298fb372SMike Snitzer break; 102298fb372SMike Snitzer case STATUSTYPE_TABLE: 103298fb372SMike Snitzer DMEMIT("%u ", pi->repeat_count); 104298fb372SMike Snitzer break; 105*8ec45662STushar Sugandhi case STATUSTYPE_IMA: 106*8ec45662STushar Sugandhi *result = '\0'; 107*8ec45662STushar Sugandhi break; 108298fb372SMike Snitzer } 109298fb372SMike Snitzer } 110298fb372SMike Snitzer 111298fb372SMike Snitzer return sz; 112298fb372SMike Snitzer } 113298fb372SMike Snitzer 114298fb372SMike Snitzer static int ql_add_path(struct path_selector *ps, struct dm_path *path, 115298fb372SMike Snitzer int argc, char **argv, char **error) 116298fb372SMike Snitzer { 117298fb372SMike Snitzer struct selector *s = ps->context; 118298fb372SMike Snitzer struct path_info *pi; 119298fb372SMike Snitzer unsigned repeat_count = QL_MIN_IO; 120298fb372SMike Snitzer char dummy; 121298fb372SMike Snitzer unsigned long flags; 122298fb372SMike Snitzer 123298fb372SMike Snitzer /* 124298fb372SMike Snitzer * Arguments: [<repeat_count>] 125298fb372SMike Snitzer * <repeat_count>: The number of I/Os before switching path. 126298fb372SMike Snitzer * If not given, default (QL_MIN_IO) is used. 127298fb372SMike Snitzer */ 128298fb372SMike Snitzer if (argc > 1) { 129298fb372SMike Snitzer *error = "queue-length ps: incorrect number of arguments"; 130298fb372SMike Snitzer return -EINVAL; 131298fb372SMike Snitzer } 132298fb372SMike Snitzer 133298fb372SMike Snitzer if ((argc == 1) && (sscanf(argv[0], "%u%c", &repeat_count, &dummy) != 1)) { 134298fb372SMike Snitzer *error = "queue-length ps: invalid repeat count"; 135298fb372SMike Snitzer return -EINVAL; 136298fb372SMike Snitzer } 137298fb372SMike Snitzer 138298fb372SMike Snitzer if (repeat_count > 1) { 139298fb372SMike Snitzer DMWARN_LIMIT("repeat_count > 1 is deprecated, using 1 instead"); 140298fb372SMike Snitzer repeat_count = 1; 141298fb372SMike Snitzer } 142298fb372SMike Snitzer 143298fb372SMike Snitzer /* Allocate the path information structure */ 144298fb372SMike Snitzer pi = kmalloc(sizeof(*pi), GFP_KERNEL); 145298fb372SMike Snitzer if (!pi) { 146298fb372SMike Snitzer *error = "queue-length ps: Error allocating path information"; 147298fb372SMike Snitzer return -ENOMEM; 148298fb372SMike Snitzer } 149298fb372SMike Snitzer 150298fb372SMike Snitzer pi->path = path; 151298fb372SMike Snitzer pi->repeat_count = repeat_count; 152298fb372SMike Snitzer atomic_set(&pi->qlen, 0); 153298fb372SMike Snitzer 154298fb372SMike Snitzer path->pscontext = pi; 155298fb372SMike Snitzer 156298fb372SMike Snitzer spin_lock_irqsave(&s->lock, flags); 157298fb372SMike Snitzer list_add_tail(&pi->list, &s->valid_paths); 158298fb372SMike Snitzer spin_unlock_irqrestore(&s->lock, flags); 159298fb372SMike Snitzer 160298fb372SMike Snitzer return 0; 161298fb372SMike Snitzer } 162298fb372SMike Snitzer 163298fb372SMike Snitzer static void ql_fail_path(struct path_selector *ps, struct dm_path *path) 164298fb372SMike Snitzer { 165298fb372SMike Snitzer struct selector *s = ps->context; 166298fb372SMike Snitzer struct path_info *pi = path->pscontext; 167298fb372SMike Snitzer unsigned long flags; 168298fb372SMike Snitzer 169298fb372SMike Snitzer spin_lock_irqsave(&s->lock, flags); 170298fb372SMike Snitzer list_move(&pi->list, &s->failed_paths); 171298fb372SMike Snitzer spin_unlock_irqrestore(&s->lock, flags); 172298fb372SMike Snitzer } 173298fb372SMike Snitzer 174298fb372SMike Snitzer static int ql_reinstate_path(struct path_selector *ps, struct dm_path *path) 175298fb372SMike Snitzer { 176298fb372SMike Snitzer struct selector *s = ps->context; 177298fb372SMike Snitzer struct path_info *pi = path->pscontext; 178298fb372SMike Snitzer unsigned long flags; 179298fb372SMike Snitzer 180298fb372SMike Snitzer spin_lock_irqsave(&s->lock, flags); 181298fb372SMike Snitzer list_move_tail(&pi->list, &s->valid_paths); 182298fb372SMike Snitzer spin_unlock_irqrestore(&s->lock, flags); 183298fb372SMike Snitzer 184298fb372SMike Snitzer return 0; 185298fb372SMike Snitzer } 186298fb372SMike Snitzer 187298fb372SMike Snitzer /* 188298fb372SMike Snitzer * Select a path having the minimum number of in-flight I/Os 189298fb372SMike Snitzer */ 190298fb372SMike Snitzer static struct dm_path *ql_select_path(struct path_selector *ps, size_t nr_bytes) 191298fb372SMike Snitzer { 192298fb372SMike Snitzer struct selector *s = ps->context; 193298fb372SMike Snitzer struct path_info *pi = NULL, *best = NULL; 194298fb372SMike Snitzer struct dm_path *ret = NULL; 195298fb372SMike Snitzer unsigned long flags; 196298fb372SMike Snitzer 197298fb372SMike Snitzer spin_lock_irqsave(&s->lock, flags); 198298fb372SMike Snitzer if (list_empty(&s->valid_paths)) 199298fb372SMike Snitzer goto out; 200298fb372SMike Snitzer 201298fb372SMike Snitzer list_for_each_entry(pi, &s->valid_paths, list) { 202298fb372SMike Snitzer if (!best || 203298fb372SMike Snitzer (atomic_read(&pi->qlen) < atomic_read(&best->qlen))) 204298fb372SMike Snitzer best = pi; 205298fb372SMike Snitzer 206298fb372SMike Snitzer if (!atomic_read(&best->qlen)) 207298fb372SMike Snitzer break; 208298fb372SMike Snitzer } 209298fb372SMike Snitzer 210298fb372SMike Snitzer if (!best) 211298fb372SMike Snitzer goto out; 212298fb372SMike Snitzer 213298fb372SMike Snitzer /* Move most recently used to least preferred to evenly balance. */ 214298fb372SMike Snitzer list_move_tail(&best->list, &s->valid_paths); 215298fb372SMike Snitzer 216298fb372SMike Snitzer ret = best->path; 217298fb372SMike Snitzer out: 218298fb372SMike Snitzer spin_unlock_irqrestore(&s->lock, flags); 219298fb372SMike Snitzer return ret; 220298fb372SMike Snitzer } 221298fb372SMike Snitzer 222298fb372SMike Snitzer static int ql_start_io(struct path_selector *ps, struct dm_path *path, 223298fb372SMike Snitzer size_t nr_bytes) 224298fb372SMike Snitzer { 225298fb372SMike Snitzer struct path_info *pi = path->pscontext; 226298fb372SMike Snitzer 227298fb372SMike Snitzer atomic_inc(&pi->qlen); 228298fb372SMike Snitzer 229298fb372SMike Snitzer return 0; 230298fb372SMike Snitzer } 231298fb372SMike Snitzer 232298fb372SMike Snitzer static int ql_end_io(struct path_selector *ps, struct dm_path *path, 233298fb372SMike Snitzer size_t nr_bytes, u64 start_time) 234298fb372SMike Snitzer { 235298fb372SMike Snitzer struct path_info *pi = path->pscontext; 236298fb372SMike Snitzer 237298fb372SMike Snitzer atomic_dec(&pi->qlen); 238298fb372SMike Snitzer 239298fb372SMike Snitzer return 0; 240298fb372SMike Snitzer } 241298fb372SMike Snitzer 242298fb372SMike Snitzer static struct path_selector_type ql_ps = { 243298fb372SMike Snitzer .name = "queue-length", 244298fb372SMike Snitzer .module = THIS_MODULE, 245298fb372SMike Snitzer .table_args = 1, 246298fb372SMike Snitzer .info_args = 1, 247298fb372SMike Snitzer .create = ql_create, 248298fb372SMike Snitzer .destroy = ql_destroy, 249298fb372SMike Snitzer .status = ql_status, 250298fb372SMike Snitzer .add_path = ql_add_path, 251298fb372SMike Snitzer .fail_path = ql_fail_path, 252298fb372SMike Snitzer .reinstate_path = ql_reinstate_path, 253298fb372SMike Snitzer .select_path = ql_select_path, 254298fb372SMike Snitzer .start_io = ql_start_io, 255298fb372SMike Snitzer .end_io = ql_end_io, 256298fb372SMike Snitzer }; 257298fb372SMike Snitzer 258298fb372SMike Snitzer static int __init dm_ql_init(void) 259298fb372SMike Snitzer { 260298fb372SMike Snitzer int r = dm_register_path_selector(&ql_ps); 261298fb372SMike Snitzer 262298fb372SMike Snitzer if (r < 0) 263298fb372SMike Snitzer DMERR("register failed %d", r); 264298fb372SMike Snitzer 265298fb372SMike Snitzer DMINFO("version " QL_VERSION " loaded"); 266298fb372SMike Snitzer 267298fb372SMike Snitzer return r; 268298fb372SMike Snitzer } 269298fb372SMike Snitzer 270298fb372SMike Snitzer static void __exit dm_ql_exit(void) 271298fb372SMike Snitzer { 272298fb372SMike Snitzer int r = dm_unregister_path_selector(&ql_ps); 273298fb372SMike Snitzer 274298fb372SMike Snitzer if (r < 0) 275298fb372SMike Snitzer DMERR("unregister failed %d", r); 276298fb372SMike Snitzer } 277298fb372SMike Snitzer 278298fb372SMike Snitzer module_init(dm_ql_init); 279298fb372SMike Snitzer module_exit(dm_ql_exit); 280298fb372SMike Snitzer 281298fb372SMike Snitzer MODULE_AUTHOR("Stefan Bader <Stefan.Bader at de.ibm.com>"); 282298fb372SMike Snitzer MODULE_DESCRIPTION( 283298fb372SMike Snitzer "(C) Copyright IBM Corp. 2004,2005 All Rights Reserved.\n" 284298fb372SMike Snitzer DM_NAME " path selector to balance the number of in-flight I/Os" 285298fb372SMike Snitzer ); 286298fb372SMike Snitzer MODULE_LICENSE("GPL"); 287