1ccd979bdSMark Fasheh /* -*- mode: c; c-basic-offset: 8; -*- 2ccd979bdSMark Fasheh * vim: noexpandtab sw=8 ts=8 sts=0: 3ccd979bdSMark Fasheh * 4ccd979bdSMark Fasheh * slot_map.c 5ccd979bdSMark Fasheh * 6ccd979bdSMark Fasheh * 7ccd979bdSMark Fasheh * 8ccd979bdSMark Fasheh * Copyright (C) 2002, 2004 Oracle. All rights reserved. 9ccd979bdSMark Fasheh * 10ccd979bdSMark Fasheh * This program is free software; you can redistribute it and/or 11ccd979bdSMark Fasheh * modify it under the terms of the GNU General Public 12ccd979bdSMark Fasheh * License as published by the Free Software Foundation; either 13ccd979bdSMark Fasheh * version 2 of the License, or (at your option) any later version. 14ccd979bdSMark Fasheh * 15ccd979bdSMark Fasheh * This program is distributed in the hope that it will be useful, 16ccd979bdSMark Fasheh * but WITHOUT ANY WARRANTY; without even the implied warranty of 17ccd979bdSMark Fasheh * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 18ccd979bdSMark Fasheh * General Public License for more details. 19ccd979bdSMark Fasheh * 20ccd979bdSMark Fasheh * You should have received a copy of the GNU General Public 21ccd979bdSMark Fasheh * License along with this program; if not, write to the 22ccd979bdSMark Fasheh * Free Software Foundation, Inc., 59 Temple Place - Suite 330, 23ccd979bdSMark Fasheh * Boston, MA 021110-1307, USA. 24ccd979bdSMark Fasheh */ 25ccd979bdSMark Fasheh 26ccd979bdSMark Fasheh #include <linux/types.h> 27ccd979bdSMark Fasheh #include <linux/slab.h> 28ccd979bdSMark Fasheh #include <linux/highmem.h> 29ccd979bdSMark Fasheh 30ccd979bdSMark Fasheh #define MLOG_MASK_PREFIX ML_SUPER 31ccd979bdSMark Fasheh #include <cluster/masklog.h> 32ccd979bdSMark Fasheh 33ccd979bdSMark Fasheh #include "ocfs2.h" 34ccd979bdSMark Fasheh 35ccd979bdSMark Fasheh #include "dlmglue.h" 36ccd979bdSMark Fasheh #include "extent_map.h" 37ccd979bdSMark Fasheh #include "heartbeat.h" 38ccd979bdSMark Fasheh #include "inode.h" 39ccd979bdSMark Fasheh #include "slot_map.h" 40ccd979bdSMark Fasheh #include "super.h" 41ccd979bdSMark Fasheh #include "sysfile.h" 42ccd979bdSMark Fasheh 43ccd979bdSMark Fasheh #include "buffer_head_io.h" 44ccd979bdSMark Fasheh 45ccd979bdSMark Fasheh static s16 __ocfs2_node_num_to_slot(struct ocfs2_slot_info *si, 46ccd979bdSMark Fasheh s16 global); 47ccd979bdSMark Fasheh static void __ocfs2_fill_slot(struct ocfs2_slot_info *si, 48ccd979bdSMark Fasheh s16 slot_num, 49ccd979bdSMark Fasheh s16 node_num); 50ccd979bdSMark Fasheh 51ccd979bdSMark Fasheh /* Use the slot information we've collected to create a map of mounted 52ccd979bdSMark Fasheh * nodes. Should be holding an EX on super block. assumes slot info is 53ccd979bdSMark Fasheh * up to date. Note that we call this *after* we find a slot, so our 54ccd979bdSMark Fasheh * own node should be set in the map too... */ 55ccd979bdSMark Fasheh void ocfs2_populate_mounted_map(struct ocfs2_super *osb) 56ccd979bdSMark Fasheh { 57ccd979bdSMark Fasheh int i; 58ccd979bdSMark Fasheh struct ocfs2_slot_info *si = osb->slot_info; 59ccd979bdSMark Fasheh 60ccd979bdSMark Fasheh spin_lock(&si->si_lock); 61ccd979bdSMark Fasheh 62ccd979bdSMark Fasheh for (i = 0; i < si->si_size; i++) 63ccd979bdSMark Fasheh if (si->si_global_node_nums[i] != OCFS2_INVALID_SLOT) 64ccd979bdSMark Fasheh ocfs2_node_map_set_bit(osb, &osb->mounted_map, 65ccd979bdSMark Fasheh si->si_global_node_nums[i]); 66ccd979bdSMark Fasheh 67ccd979bdSMark Fasheh spin_unlock(&si->si_lock); 68ccd979bdSMark Fasheh } 69ccd979bdSMark Fasheh 70ccd979bdSMark Fasheh /* post the slot information on disk into our slot_info struct. */ 71ccd979bdSMark Fasheh void ocfs2_update_slot_info(struct ocfs2_slot_info *si) 72ccd979bdSMark Fasheh { 73ccd979bdSMark Fasheh int i; 74ccd979bdSMark Fasheh __le16 *disk_info; 75ccd979bdSMark Fasheh 76ccd979bdSMark Fasheh /* we don't read the slot block here as ocfs2_super_lock 77ccd979bdSMark Fasheh * should've made sure we have the most recent copy. */ 78ccd979bdSMark Fasheh spin_lock(&si->si_lock); 79ccd979bdSMark Fasheh disk_info = (__le16 *) si->si_bh->b_data; 80ccd979bdSMark Fasheh 81ccd979bdSMark Fasheh for (i = 0; i < si->si_size; i++) 82ccd979bdSMark Fasheh si->si_global_node_nums[i] = le16_to_cpu(disk_info[i]); 83ccd979bdSMark Fasheh 84ccd979bdSMark Fasheh spin_unlock(&si->si_lock); 85ccd979bdSMark Fasheh } 86ccd979bdSMark Fasheh 87ccd979bdSMark Fasheh /* post the our slot info stuff into it's destination bh and write it 88ccd979bdSMark Fasheh * out. */ 89ccd979bdSMark Fasheh int ocfs2_update_disk_slots(struct ocfs2_super *osb, 90ccd979bdSMark Fasheh struct ocfs2_slot_info *si) 91ccd979bdSMark Fasheh { 92ccd979bdSMark Fasheh int status, i; 93ccd979bdSMark Fasheh __le16 *disk_info = (__le16 *) si->si_bh->b_data; 94ccd979bdSMark Fasheh 95ccd979bdSMark Fasheh spin_lock(&si->si_lock); 96ccd979bdSMark Fasheh for (i = 0; i < si->si_size; i++) 97ccd979bdSMark Fasheh disk_info[i] = cpu_to_le16(si->si_global_node_nums[i]); 98ccd979bdSMark Fasheh spin_unlock(&si->si_lock); 99ccd979bdSMark Fasheh 100ccd979bdSMark Fasheh status = ocfs2_write_block(osb, si->si_bh, si->si_inode); 101ccd979bdSMark Fasheh if (status < 0) 102ccd979bdSMark Fasheh mlog_errno(status); 103ccd979bdSMark Fasheh 104ccd979bdSMark Fasheh return status; 105ccd979bdSMark Fasheh } 106ccd979bdSMark Fasheh 107ccd979bdSMark Fasheh /* try to find global node in the slot info. Returns 108ccd979bdSMark Fasheh * OCFS2_INVALID_SLOT if nothing is found. */ 109ccd979bdSMark Fasheh static s16 __ocfs2_node_num_to_slot(struct ocfs2_slot_info *si, 110ccd979bdSMark Fasheh s16 global) 111ccd979bdSMark Fasheh { 112ccd979bdSMark Fasheh int i; 113ccd979bdSMark Fasheh s16 ret = OCFS2_INVALID_SLOT; 114ccd979bdSMark Fasheh 115ccd979bdSMark Fasheh for(i = 0; i < si->si_num_slots; i++) { 116ccd979bdSMark Fasheh if (global == si->si_global_node_nums[i]) { 117ccd979bdSMark Fasheh ret = (s16) i; 118ccd979bdSMark Fasheh break; 119ccd979bdSMark Fasheh } 120ccd979bdSMark Fasheh } 121ccd979bdSMark Fasheh return ret; 122ccd979bdSMark Fasheh } 123ccd979bdSMark Fasheh 124*baf4661aSSunil Mushran static s16 __ocfs2_find_empty_slot(struct ocfs2_slot_info *si, s16 preferred) 125ccd979bdSMark Fasheh { 126ccd979bdSMark Fasheh int i; 127ccd979bdSMark Fasheh s16 ret = OCFS2_INVALID_SLOT; 128ccd979bdSMark Fasheh 129*baf4661aSSunil Mushran if (preferred >= 0 && preferred < si->si_num_slots) { 130*baf4661aSSunil Mushran if (OCFS2_INVALID_SLOT == si->si_global_node_nums[preferred]) { 131*baf4661aSSunil Mushran ret = preferred; 132*baf4661aSSunil Mushran goto out; 133*baf4661aSSunil Mushran } 134*baf4661aSSunil Mushran } 135*baf4661aSSunil Mushran 136ccd979bdSMark Fasheh for(i = 0; i < si->si_num_slots; i++) { 137ccd979bdSMark Fasheh if (OCFS2_INVALID_SLOT == si->si_global_node_nums[i]) { 138ccd979bdSMark Fasheh ret = (s16) i; 139ccd979bdSMark Fasheh break; 140ccd979bdSMark Fasheh } 141ccd979bdSMark Fasheh } 142*baf4661aSSunil Mushran out: 143ccd979bdSMark Fasheh return ret; 144ccd979bdSMark Fasheh } 145ccd979bdSMark Fasheh 146ccd979bdSMark Fasheh s16 ocfs2_node_num_to_slot(struct ocfs2_slot_info *si, 147ccd979bdSMark Fasheh s16 global) 148ccd979bdSMark Fasheh { 149ccd979bdSMark Fasheh s16 ret; 150ccd979bdSMark Fasheh 151ccd979bdSMark Fasheh spin_lock(&si->si_lock); 152ccd979bdSMark Fasheh ret = __ocfs2_node_num_to_slot(si, global); 153ccd979bdSMark Fasheh spin_unlock(&si->si_lock); 154ccd979bdSMark Fasheh return ret; 155ccd979bdSMark Fasheh } 156ccd979bdSMark Fasheh 157ccd979bdSMark Fasheh static void __ocfs2_fill_slot(struct ocfs2_slot_info *si, 158ccd979bdSMark Fasheh s16 slot_num, 159ccd979bdSMark Fasheh s16 node_num) 160ccd979bdSMark Fasheh { 161ccd979bdSMark Fasheh BUG_ON(slot_num == OCFS2_INVALID_SLOT); 162ccd979bdSMark Fasheh BUG_ON(slot_num >= si->si_num_slots); 163ccd979bdSMark Fasheh BUG_ON((node_num != O2NM_INVALID_NODE_NUM) && 164ccd979bdSMark Fasheh (node_num >= O2NM_MAX_NODES)); 165ccd979bdSMark Fasheh 166ccd979bdSMark Fasheh si->si_global_node_nums[slot_num] = node_num; 167ccd979bdSMark Fasheh } 168ccd979bdSMark Fasheh 169ccd979bdSMark Fasheh void ocfs2_clear_slot(struct ocfs2_slot_info *si, 170ccd979bdSMark Fasheh s16 slot_num) 171ccd979bdSMark Fasheh { 172ccd979bdSMark Fasheh spin_lock(&si->si_lock); 173ccd979bdSMark Fasheh __ocfs2_fill_slot(si, slot_num, OCFS2_INVALID_SLOT); 174ccd979bdSMark Fasheh spin_unlock(&si->si_lock); 175ccd979bdSMark Fasheh } 176ccd979bdSMark Fasheh 177ccd979bdSMark Fasheh int ocfs2_init_slot_info(struct ocfs2_super *osb) 178ccd979bdSMark Fasheh { 179ccd979bdSMark Fasheh int status, i; 180ccd979bdSMark Fasheh u64 blkno; 181ccd979bdSMark Fasheh struct inode *inode = NULL; 182ccd979bdSMark Fasheh struct buffer_head *bh = NULL; 183ccd979bdSMark Fasheh struct ocfs2_slot_info *si; 184ccd979bdSMark Fasheh 185cd861280SRobert P. J. Day si = kzalloc(sizeof(struct ocfs2_slot_info), GFP_KERNEL); 186ccd979bdSMark Fasheh if (!si) { 187ccd979bdSMark Fasheh status = -ENOMEM; 188ccd979bdSMark Fasheh mlog_errno(status); 189ccd979bdSMark Fasheh goto bail; 190ccd979bdSMark Fasheh } 191ccd979bdSMark Fasheh 192ccd979bdSMark Fasheh spin_lock_init(&si->si_lock); 193ccd979bdSMark Fasheh si->si_num_slots = osb->max_slots; 194ccd979bdSMark Fasheh si->si_size = OCFS2_MAX_SLOTS; 195ccd979bdSMark Fasheh 196ccd979bdSMark Fasheh for(i = 0; i < si->si_num_slots; i++) 197ccd979bdSMark Fasheh si->si_global_node_nums[i] = OCFS2_INVALID_SLOT; 198ccd979bdSMark Fasheh 199ccd979bdSMark Fasheh inode = ocfs2_get_system_file_inode(osb, SLOT_MAP_SYSTEM_INODE, 200ccd979bdSMark Fasheh OCFS2_INVALID_SLOT); 201ccd979bdSMark Fasheh if (!inode) { 202ccd979bdSMark Fasheh status = -EINVAL; 203ccd979bdSMark Fasheh mlog_errno(status); 204ccd979bdSMark Fasheh goto bail; 205ccd979bdSMark Fasheh } 206ccd979bdSMark Fasheh 20749cb8d2dSMark Fasheh status = ocfs2_extent_map_get_blocks(inode, 0ULL, &blkno, NULL, NULL); 208ccd979bdSMark Fasheh if (status < 0) { 209ccd979bdSMark Fasheh mlog_errno(status); 210ccd979bdSMark Fasheh goto bail; 211ccd979bdSMark Fasheh } 212ccd979bdSMark Fasheh 213ccd979bdSMark Fasheh status = ocfs2_read_block(osb, blkno, &bh, 0, inode); 214ccd979bdSMark Fasheh if (status < 0) { 215ccd979bdSMark Fasheh mlog_errno(status); 216ccd979bdSMark Fasheh goto bail; 217ccd979bdSMark Fasheh } 218ccd979bdSMark Fasheh 219ccd979bdSMark Fasheh si->si_inode = inode; 220ccd979bdSMark Fasheh si->si_bh = bh; 221ccd979bdSMark Fasheh osb->slot_info = si; 222ccd979bdSMark Fasheh bail: 223ccd979bdSMark Fasheh if (status < 0 && si) 224ccd979bdSMark Fasheh ocfs2_free_slot_info(si); 225ccd979bdSMark Fasheh 226ccd979bdSMark Fasheh return status; 227ccd979bdSMark Fasheh } 228ccd979bdSMark Fasheh 229ccd979bdSMark Fasheh void ocfs2_free_slot_info(struct ocfs2_slot_info *si) 230ccd979bdSMark Fasheh { 231ccd979bdSMark Fasheh if (si->si_inode) 232ccd979bdSMark Fasheh iput(si->si_inode); 233ccd979bdSMark Fasheh if (si->si_bh) 234ccd979bdSMark Fasheh brelse(si->si_bh); 235ccd979bdSMark Fasheh kfree(si); 236ccd979bdSMark Fasheh } 237ccd979bdSMark Fasheh 238ccd979bdSMark Fasheh int ocfs2_find_slot(struct ocfs2_super *osb) 239ccd979bdSMark Fasheh { 240ccd979bdSMark Fasheh int status; 241ccd979bdSMark Fasheh s16 slot; 242ccd979bdSMark Fasheh struct ocfs2_slot_info *si; 243ccd979bdSMark Fasheh 244ccd979bdSMark Fasheh mlog_entry_void(); 245ccd979bdSMark Fasheh 246ccd979bdSMark Fasheh si = osb->slot_info; 247ccd979bdSMark Fasheh 248ccd979bdSMark Fasheh ocfs2_update_slot_info(si); 249ccd979bdSMark Fasheh 250ccd979bdSMark Fasheh spin_lock(&si->si_lock); 251ccd979bdSMark Fasheh /* search for ourselves first and take the slot if it already 252ccd979bdSMark Fasheh * exists. Perhaps we need to mark this in a variable for our 253ccd979bdSMark Fasheh * own journal recovery? Possibly not, though we certainly 254ccd979bdSMark Fasheh * need to warn to the user */ 255ccd979bdSMark Fasheh slot = __ocfs2_node_num_to_slot(si, osb->node_num); 256ccd979bdSMark Fasheh if (slot == OCFS2_INVALID_SLOT) { 257ccd979bdSMark Fasheh /* if no slot yet, then just take 1st available 258ccd979bdSMark Fasheh * one. */ 259*baf4661aSSunil Mushran slot = __ocfs2_find_empty_slot(si, osb->preferred_slot); 260ccd979bdSMark Fasheh if (slot == OCFS2_INVALID_SLOT) { 261ccd979bdSMark Fasheh spin_unlock(&si->si_lock); 262ccd979bdSMark Fasheh mlog(ML_ERROR, "no free slots available!\n"); 263ccd979bdSMark Fasheh status = -EINVAL; 264ccd979bdSMark Fasheh goto bail; 265ccd979bdSMark Fasheh } 266ccd979bdSMark Fasheh } else 267ccd979bdSMark Fasheh mlog(ML_NOTICE, "slot %d is already allocated to this node!\n", 268ccd979bdSMark Fasheh slot); 269ccd979bdSMark Fasheh 270ccd979bdSMark Fasheh __ocfs2_fill_slot(si, slot, osb->node_num); 271ccd979bdSMark Fasheh osb->slot_num = slot; 272ccd979bdSMark Fasheh spin_unlock(&si->si_lock); 273ccd979bdSMark Fasheh 274e7607ab3SMark Fasheh mlog(0, "taking node slot %d\n", osb->slot_num); 275ccd979bdSMark Fasheh 276ccd979bdSMark Fasheh status = ocfs2_update_disk_slots(osb, si); 277ccd979bdSMark Fasheh if (status < 0) 278ccd979bdSMark Fasheh mlog_errno(status); 279ccd979bdSMark Fasheh 280ccd979bdSMark Fasheh bail: 281ccd979bdSMark Fasheh mlog_exit(status); 282ccd979bdSMark Fasheh return status; 283ccd979bdSMark Fasheh } 284ccd979bdSMark Fasheh 285ccd979bdSMark Fasheh void ocfs2_put_slot(struct ocfs2_super *osb) 286ccd979bdSMark Fasheh { 287ccd979bdSMark Fasheh int status; 288ccd979bdSMark Fasheh struct ocfs2_slot_info *si = osb->slot_info; 289ccd979bdSMark Fasheh 290ccd979bdSMark Fasheh if (!si) 291ccd979bdSMark Fasheh return; 292ccd979bdSMark Fasheh 293ccd979bdSMark Fasheh ocfs2_update_slot_info(si); 294ccd979bdSMark Fasheh 295ccd979bdSMark Fasheh spin_lock(&si->si_lock); 296ccd979bdSMark Fasheh __ocfs2_fill_slot(si, osb->slot_num, OCFS2_INVALID_SLOT); 297ccd979bdSMark Fasheh osb->slot_num = OCFS2_INVALID_SLOT; 298ccd979bdSMark Fasheh spin_unlock(&si->si_lock); 299ccd979bdSMark Fasheh 300ccd979bdSMark Fasheh status = ocfs2_update_disk_slots(osb, si); 301ccd979bdSMark Fasheh if (status < 0) { 302ccd979bdSMark Fasheh mlog_errno(status); 303ccd979bdSMark Fasheh goto bail; 304ccd979bdSMark Fasheh } 305ccd979bdSMark Fasheh 306ccd979bdSMark Fasheh bail: 307ccd979bdSMark Fasheh osb->slot_info = NULL; 308ccd979bdSMark Fasheh ocfs2_free_slot_info(si); 309ccd979bdSMark Fasheh } 310ccd979bdSMark Fasheh 311