1ccd979bdSMark Fasheh /* -*- mode: c; c-basic-offset: 8; -*- 2ccd979bdSMark Fasheh * vim: noexpandtab sw=8 ts=8 sts=0: 3ccd979bdSMark Fasheh * 4ccd979bdSMark Fasheh * slot_map.c 5ccd979bdSMark Fasheh * 6ccd979bdSMark Fasheh * 7ccd979bdSMark Fasheh * 8ccd979bdSMark Fasheh * Copyright (C) 2002, 2004 Oracle. All rights reserved. 9ccd979bdSMark Fasheh * 10ccd979bdSMark Fasheh * This program is free software; you can redistribute it and/or 11ccd979bdSMark Fasheh * modify it under the terms of the GNU General Public 12ccd979bdSMark Fasheh * License as published by the Free Software Foundation; either 13ccd979bdSMark Fasheh * version 2 of the License, or (at your option) any later version. 14ccd979bdSMark Fasheh * 15ccd979bdSMark Fasheh * This program is distributed in the hope that it will be useful, 16ccd979bdSMark Fasheh * but WITHOUT ANY WARRANTY; without even the implied warranty of 17ccd979bdSMark Fasheh * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 18ccd979bdSMark Fasheh * General Public License for more details. 19ccd979bdSMark Fasheh * 20ccd979bdSMark Fasheh * You should have received a copy of the GNU General Public 21ccd979bdSMark Fasheh * License along with this program; if not, write to the 22ccd979bdSMark Fasheh * Free Software Foundation, Inc., 59 Temple Place - Suite 330, 23ccd979bdSMark Fasheh * Boston, MA 021110-1307, USA. 24ccd979bdSMark Fasheh */ 25ccd979bdSMark Fasheh 26ccd979bdSMark Fasheh #include <linux/types.h> 27ccd979bdSMark Fasheh #include <linux/slab.h> 28ccd979bdSMark Fasheh #include <linux/highmem.h> 29ccd979bdSMark Fasheh 30ccd979bdSMark Fasheh #define MLOG_MASK_PREFIX ML_SUPER 31ccd979bdSMark Fasheh #include <cluster/masklog.h> 32ccd979bdSMark Fasheh 33ccd979bdSMark Fasheh #include "ocfs2.h" 34ccd979bdSMark Fasheh 35ccd979bdSMark Fasheh #include "dlmglue.h" 36ccd979bdSMark Fasheh #include "extent_map.h" 37ccd979bdSMark Fasheh #include "heartbeat.h" 38ccd979bdSMark Fasheh #include "inode.h" 39ccd979bdSMark Fasheh #include "slot_map.h" 40ccd979bdSMark Fasheh #include "super.h" 41ccd979bdSMark Fasheh #include "sysfile.h" 42ccd979bdSMark Fasheh 43ccd979bdSMark Fasheh #include "buffer_head_io.h" 44ccd979bdSMark Fasheh 45*d85b20e4SJoel Becker struct ocfs2_slot_info { 46*d85b20e4SJoel Becker struct inode *si_inode; 47*d85b20e4SJoel Becker struct buffer_head *si_bh; 48*d85b20e4SJoel Becker unsigned int si_num_slots; 49*d85b20e4SJoel Becker unsigned int si_size; 50*d85b20e4SJoel Becker s16 si_global_node_nums[OCFS2_MAX_SLOTS]; 51*d85b20e4SJoel Becker }; 52*d85b20e4SJoel Becker 53*d85b20e4SJoel Becker 54ccd979bdSMark Fasheh static s16 __ocfs2_node_num_to_slot(struct ocfs2_slot_info *si, 55ccd979bdSMark Fasheh s16 global); 56ccd979bdSMark Fasheh static void __ocfs2_fill_slot(struct ocfs2_slot_info *si, 57ccd979bdSMark Fasheh s16 slot_num, 58ccd979bdSMark Fasheh s16 node_num); 59ccd979bdSMark Fasheh 60*d85b20e4SJoel Becker /* 61*d85b20e4SJoel Becker * Post the slot information on disk into our slot_info struct. 62*d85b20e4SJoel Becker * Must be protected by osb_lock. 63*d85b20e4SJoel Becker */ 648e8a4603SMark Fasheh static void ocfs2_update_slot_info(struct ocfs2_slot_info *si) 65ccd979bdSMark Fasheh { 66ccd979bdSMark Fasheh int i; 67ccd979bdSMark Fasheh __le16 *disk_info; 68ccd979bdSMark Fasheh 69ccd979bdSMark Fasheh /* we don't read the slot block here as ocfs2_super_lock 70ccd979bdSMark Fasheh * should've made sure we have the most recent copy. */ 71ccd979bdSMark Fasheh disk_info = (__le16 *) si->si_bh->b_data; 72ccd979bdSMark Fasheh 73ccd979bdSMark Fasheh for (i = 0; i < si->si_size; i++) 74ccd979bdSMark Fasheh si->si_global_node_nums[i] = le16_to_cpu(disk_info[i]); 75ccd979bdSMark Fasheh } 76ccd979bdSMark Fasheh 778e8a4603SMark Fasheh int ocfs2_refresh_slot_info(struct ocfs2_super *osb) 788e8a4603SMark Fasheh { 798e8a4603SMark Fasheh int ret; 808e8a4603SMark Fasheh struct ocfs2_slot_info *si = osb->slot_info; 818e8a4603SMark Fasheh struct buffer_head *bh; 828e8a4603SMark Fasheh 838e8a4603SMark Fasheh if (si == NULL) 848e8a4603SMark Fasheh return 0; 858e8a4603SMark Fasheh 868e8a4603SMark Fasheh bh = si->si_bh; 878e8a4603SMark Fasheh ret = ocfs2_read_block(osb, bh->b_blocknr, &bh, 0, si->si_inode); 88*d85b20e4SJoel Becker if (ret == 0) { 89*d85b20e4SJoel Becker spin_lock(&osb->osb_lock); 908e8a4603SMark Fasheh ocfs2_update_slot_info(si); 91*d85b20e4SJoel Becker spin_unlock(&osb->osb_lock); 92*d85b20e4SJoel Becker } 938e8a4603SMark Fasheh 948e8a4603SMark Fasheh return ret; 958e8a4603SMark Fasheh } 968e8a4603SMark Fasheh 97ccd979bdSMark Fasheh /* post the our slot info stuff into it's destination bh and write it 98ccd979bdSMark Fasheh * out. */ 998e8a4603SMark Fasheh static int ocfs2_update_disk_slots(struct ocfs2_super *osb, 100ccd979bdSMark Fasheh struct ocfs2_slot_info *si) 101ccd979bdSMark Fasheh { 102ccd979bdSMark Fasheh int status, i; 103ccd979bdSMark Fasheh __le16 *disk_info = (__le16 *) si->si_bh->b_data; 104ccd979bdSMark Fasheh 105*d85b20e4SJoel Becker spin_lock(&osb->osb_lock); 106ccd979bdSMark Fasheh for (i = 0; i < si->si_size; i++) 107ccd979bdSMark Fasheh disk_info[i] = cpu_to_le16(si->si_global_node_nums[i]); 108*d85b20e4SJoel Becker spin_unlock(&osb->osb_lock); 109ccd979bdSMark Fasheh 110ccd979bdSMark Fasheh status = ocfs2_write_block(osb, si->si_bh, si->si_inode); 111ccd979bdSMark Fasheh if (status < 0) 112ccd979bdSMark Fasheh mlog_errno(status); 113ccd979bdSMark Fasheh 114ccd979bdSMark Fasheh return status; 115ccd979bdSMark Fasheh } 116ccd979bdSMark Fasheh 117ccd979bdSMark Fasheh /* try to find global node in the slot info. Returns 118ccd979bdSMark Fasheh * OCFS2_INVALID_SLOT if nothing is found. */ 119ccd979bdSMark Fasheh static s16 __ocfs2_node_num_to_slot(struct ocfs2_slot_info *si, 120ccd979bdSMark Fasheh s16 global) 121ccd979bdSMark Fasheh { 122ccd979bdSMark Fasheh int i; 123ccd979bdSMark Fasheh s16 ret = OCFS2_INVALID_SLOT; 124ccd979bdSMark Fasheh 125ccd979bdSMark Fasheh for(i = 0; i < si->si_num_slots; i++) { 126ccd979bdSMark Fasheh if (global == si->si_global_node_nums[i]) { 127ccd979bdSMark Fasheh ret = (s16) i; 128ccd979bdSMark Fasheh break; 129ccd979bdSMark Fasheh } 130ccd979bdSMark Fasheh } 131ccd979bdSMark Fasheh return ret; 132ccd979bdSMark Fasheh } 133ccd979bdSMark Fasheh 134*d85b20e4SJoel Becker static s16 __ocfs2_find_empty_slot(struct ocfs2_slot_info *si, 135*d85b20e4SJoel Becker s16 preferred) 136ccd979bdSMark Fasheh { 137ccd979bdSMark Fasheh int i; 138ccd979bdSMark Fasheh s16 ret = OCFS2_INVALID_SLOT; 139ccd979bdSMark Fasheh 140baf4661aSSunil Mushran if (preferred >= 0 && preferred < si->si_num_slots) { 141baf4661aSSunil Mushran if (OCFS2_INVALID_SLOT == si->si_global_node_nums[preferred]) { 142baf4661aSSunil Mushran ret = preferred; 143baf4661aSSunil Mushran goto out; 144baf4661aSSunil Mushran } 145baf4661aSSunil Mushran } 146baf4661aSSunil Mushran 147ccd979bdSMark Fasheh for(i = 0; i < si->si_num_slots; i++) { 148ccd979bdSMark Fasheh if (OCFS2_INVALID_SLOT == si->si_global_node_nums[i]) { 149ccd979bdSMark Fasheh ret = (s16) i; 150ccd979bdSMark Fasheh break; 151ccd979bdSMark Fasheh } 152ccd979bdSMark Fasheh } 153baf4661aSSunil Mushran out: 154ccd979bdSMark Fasheh return ret; 155ccd979bdSMark Fasheh } 156ccd979bdSMark Fasheh 157*d85b20e4SJoel Becker int ocfs2_node_num_to_slot(struct ocfs2_super *osb, unsigned int node_num) 158ccd979bdSMark Fasheh { 159*d85b20e4SJoel Becker s16 slot; 160*d85b20e4SJoel Becker struct ocfs2_slot_info *si = osb->slot_info; 161ccd979bdSMark Fasheh 162*d85b20e4SJoel Becker spin_lock(&osb->osb_lock); 163*d85b20e4SJoel Becker slot = __ocfs2_node_num_to_slot(si, node_num); 164*d85b20e4SJoel Becker spin_unlock(&osb->osb_lock); 165*d85b20e4SJoel Becker 166*d85b20e4SJoel Becker if (slot == OCFS2_INVALID_SLOT) 167*d85b20e4SJoel Becker return -ENOENT; 168*d85b20e4SJoel Becker 169*d85b20e4SJoel Becker return slot; 170*d85b20e4SJoel Becker } 171*d85b20e4SJoel Becker 172*d85b20e4SJoel Becker int ocfs2_slot_to_node_num_locked(struct ocfs2_super *osb, int slot_num, 173*d85b20e4SJoel Becker unsigned int *node_num) 174*d85b20e4SJoel Becker { 175*d85b20e4SJoel Becker struct ocfs2_slot_info *si = osb->slot_info; 176*d85b20e4SJoel Becker 177*d85b20e4SJoel Becker assert_spin_locked(&osb->osb_lock); 178*d85b20e4SJoel Becker 179*d85b20e4SJoel Becker BUG_ON(slot_num < 0); 180*d85b20e4SJoel Becker BUG_ON(slot_num > osb->max_slots); 181*d85b20e4SJoel Becker 182*d85b20e4SJoel Becker if (si->si_global_node_nums[slot_num] == OCFS2_INVALID_SLOT) 183*d85b20e4SJoel Becker return -ENOENT; 184*d85b20e4SJoel Becker 185*d85b20e4SJoel Becker *node_num = si->si_global_node_nums[slot_num]; 186*d85b20e4SJoel Becker return 0; 187ccd979bdSMark Fasheh } 188ccd979bdSMark Fasheh 1898e8a4603SMark Fasheh static void __ocfs2_free_slot_info(struct ocfs2_slot_info *si) 1908e8a4603SMark Fasheh { 1918e8a4603SMark Fasheh if (si == NULL) 1928e8a4603SMark Fasheh return; 1938e8a4603SMark Fasheh 1948e8a4603SMark Fasheh if (si->si_inode) 1958e8a4603SMark Fasheh iput(si->si_inode); 1968e8a4603SMark Fasheh if (si->si_bh) 1978e8a4603SMark Fasheh brelse(si->si_bh); 1988e8a4603SMark Fasheh 1998e8a4603SMark Fasheh kfree(si); 2008e8a4603SMark Fasheh } 2018e8a4603SMark Fasheh 202ccd979bdSMark Fasheh static void __ocfs2_fill_slot(struct ocfs2_slot_info *si, 203ccd979bdSMark Fasheh s16 slot_num, 204ccd979bdSMark Fasheh s16 node_num) 205ccd979bdSMark Fasheh { 206ccd979bdSMark Fasheh BUG_ON(slot_num == OCFS2_INVALID_SLOT); 207ccd979bdSMark Fasheh BUG_ON(slot_num >= si->si_num_slots); 208ccd979bdSMark Fasheh BUG_ON((node_num != O2NM_INVALID_NODE_NUM) && 209ccd979bdSMark Fasheh (node_num >= O2NM_MAX_NODES)); 210ccd979bdSMark Fasheh 211ccd979bdSMark Fasheh si->si_global_node_nums[slot_num] = node_num; 212ccd979bdSMark Fasheh } 213ccd979bdSMark Fasheh 2148e8a4603SMark Fasheh int ocfs2_clear_slot(struct ocfs2_super *osb, s16 slot_num) 215ccd979bdSMark Fasheh { 2168e8a4603SMark Fasheh struct ocfs2_slot_info *si = osb->slot_info; 2178e8a4603SMark Fasheh 2188e8a4603SMark Fasheh if (si == NULL) 2198e8a4603SMark Fasheh return 0; 2208e8a4603SMark Fasheh 221*d85b20e4SJoel Becker spin_lock(&osb->osb_lock); 222ccd979bdSMark Fasheh __ocfs2_fill_slot(si, slot_num, OCFS2_INVALID_SLOT); 223*d85b20e4SJoel Becker spin_unlock(&osb->osb_lock); 2248e8a4603SMark Fasheh 2258e8a4603SMark Fasheh return ocfs2_update_disk_slots(osb, osb->slot_info); 226ccd979bdSMark Fasheh } 227ccd979bdSMark Fasheh 228ccd979bdSMark Fasheh int ocfs2_init_slot_info(struct ocfs2_super *osb) 229ccd979bdSMark Fasheh { 230ccd979bdSMark Fasheh int status, i; 231ccd979bdSMark Fasheh u64 blkno; 232ccd979bdSMark Fasheh struct inode *inode = NULL; 233ccd979bdSMark Fasheh struct buffer_head *bh = NULL; 234ccd979bdSMark Fasheh struct ocfs2_slot_info *si; 235ccd979bdSMark Fasheh 236cd861280SRobert P. J. Day si = kzalloc(sizeof(struct ocfs2_slot_info), GFP_KERNEL); 237ccd979bdSMark Fasheh if (!si) { 238ccd979bdSMark Fasheh status = -ENOMEM; 239ccd979bdSMark Fasheh mlog_errno(status); 240ccd979bdSMark Fasheh goto bail; 241ccd979bdSMark Fasheh } 242ccd979bdSMark Fasheh 243ccd979bdSMark Fasheh si->si_num_slots = osb->max_slots; 244ccd979bdSMark Fasheh si->si_size = OCFS2_MAX_SLOTS; 245ccd979bdSMark Fasheh 246ccd979bdSMark Fasheh for(i = 0; i < si->si_num_slots; i++) 247ccd979bdSMark Fasheh si->si_global_node_nums[i] = OCFS2_INVALID_SLOT; 248ccd979bdSMark Fasheh 249ccd979bdSMark Fasheh inode = ocfs2_get_system_file_inode(osb, SLOT_MAP_SYSTEM_INODE, 250ccd979bdSMark Fasheh OCFS2_INVALID_SLOT); 251ccd979bdSMark Fasheh if (!inode) { 252ccd979bdSMark Fasheh status = -EINVAL; 253ccd979bdSMark Fasheh mlog_errno(status); 254ccd979bdSMark Fasheh goto bail; 255ccd979bdSMark Fasheh } 256ccd979bdSMark Fasheh 25749cb8d2dSMark Fasheh status = ocfs2_extent_map_get_blocks(inode, 0ULL, &blkno, NULL, NULL); 258ccd979bdSMark Fasheh if (status < 0) { 259ccd979bdSMark Fasheh mlog_errno(status); 260ccd979bdSMark Fasheh goto bail; 261ccd979bdSMark Fasheh } 262ccd979bdSMark Fasheh 263ccd979bdSMark Fasheh status = ocfs2_read_block(osb, blkno, &bh, 0, inode); 264ccd979bdSMark Fasheh if (status < 0) { 265ccd979bdSMark Fasheh mlog_errno(status); 266ccd979bdSMark Fasheh goto bail; 267ccd979bdSMark Fasheh } 268ccd979bdSMark Fasheh 269ccd979bdSMark Fasheh si->si_inode = inode; 270ccd979bdSMark Fasheh si->si_bh = bh; 271*d85b20e4SJoel Becker osb->slot_info = (struct ocfs2_slot_info *)si; 272ccd979bdSMark Fasheh bail: 273ccd979bdSMark Fasheh if (status < 0 && si) 2748e8a4603SMark Fasheh __ocfs2_free_slot_info(si); 275ccd979bdSMark Fasheh 276ccd979bdSMark Fasheh return status; 277ccd979bdSMark Fasheh } 278ccd979bdSMark Fasheh 2798e8a4603SMark Fasheh void ocfs2_free_slot_info(struct ocfs2_super *osb) 280ccd979bdSMark Fasheh { 2818e8a4603SMark Fasheh struct ocfs2_slot_info *si = osb->slot_info; 2828e8a4603SMark Fasheh 2838e8a4603SMark Fasheh osb->slot_info = NULL; 2848e8a4603SMark Fasheh __ocfs2_free_slot_info(si); 285ccd979bdSMark Fasheh } 286ccd979bdSMark Fasheh 287ccd979bdSMark Fasheh int ocfs2_find_slot(struct ocfs2_super *osb) 288ccd979bdSMark Fasheh { 289ccd979bdSMark Fasheh int status; 290ccd979bdSMark Fasheh s16 slot; 291ccd979bdSMark Fasheh struct ocfs2_slot_info *si; 292ccd979bdSMark Fasheh 293ccd979bdSMark Fasheh mlog_entry_void(); 294ccd979bdSMark Fasheh 295ccd979bdSMark Fasheh si = osb->slot_info; 296ccd979bdSMark Fasheh 297*d85b20e4SJoel Becker spin_lock(&osb->osb_lock); 298ccd979bdSMark Fasheh ocfs2_update_slot_info(si); 299ccd979bdSMark Fasheh 300ccd979bdSMark Fasheh /* search for ourselves first and take the slot if it already 301ccd979bdSMark Fasheh * exists. Perhaps we need to mark this in a variable for our 302ccd979bdSMark Fasheh * own journal recovery? Possibly not, though we certainly 303ccd979bdSMark Fasheh * need to warn to the user */ 304ccd979bdSMark Fasheh slot = __ocfs2_node_num_to_slot(si, osb->node_num); 305ccd979bdSMark Fasheh if (slot == OCFS2_INVALID_SLOT) { 306ccd979bdSMark Fasheh /* if no slot yet, then just take 1st available 307ccd979bdSMark Fasheh * one. */ 308baf4661aSSunil Mushran slot = __ocfs2_find_empty_slot(si, osb->preferred_slot); 309ccd979bdSMark Fasheh if (slot == OCFS2_INVALID_SLOT) { 310*d85b20e4SJoel Becker spin_unlock(&osb->osb_lock); 311ccd979bdSMark Fasheh mlog(ML_ERROR, "no free slots available!\n"); 312ccd979bdSMark Fasheh status = -EINVAL; 313ccd979bdSMark Fasheh goto bail; 314ccd979bdSMark Fasheh } 315ccd979bdSMark Fasheh } else 316ccd979bdSMark Fasheh mlog(ML_NOTICE, "slot %d is already allocated to this node!\n", 317ccd979bdSMark Fasheh slot); 318ccd979bdSMark Fasheh 319ccd979bdSMark Fasheh __ocfs2_fill_slot(si, slot, osb->node_num); 320ccd979bdSMark Fasheh osb->slot_num = slot; 321*d85b20e4SJoel Becker spin_unlock(&osb->osb_lock); 322ccd979bdSMark Fasheh 323e7607ab3SMark Fasheh mlog(0, "taking node slot %d\n", osb->slot_num); 324ccd979bdSMark Fasheh 325ccd979bdSMark Fasheh status = ocfs2_update_disk_slots(osb, si); 326ccd979bdSMark Fasheh if (status < 0) 327ccd979bdSMark Fasheh mlog_errno(status); 328ccd979bdSMark Fasheh 329ccd979bdSMark Fasheh bail: 330ccd979bdSMark Fasheh mlog_exit(status); 331ccd979bdSMark Fasheh return status; 332ccd979bdSMark Fasheh } 333ccd979bdSMark Fasheh 334ccd979bdSMark Fasheh void ocfs2_put_slot(struct ocfs2_super *osb) 335ccd979bdSMark Fasheh { 336ccd979bdSMark Fasheh int status; 337ccd979bdSMark Fasheh struct ocfs2_slot_info *si = osb->slot_info; 338ccd979bdSMark Fasheh 339ccd979bdSMark Fasheh if (!si) 340ccd979bdSMark Fasheh return; 341ccd979bdSMark Fasheh 342*d85b20e4SJoel Becker spin_lock(&osb->osb_lock); 343ccd979bdSMark Fasheh ocfs2_update_slot_info(si); 344ccd979bdSMark Fasheh 345ccd979bdSMark Fasheh __ocfs2_fill_slot(si, osb->slot_num, OCFS2_INVALID_SLOT); 346ccd979bdSMark Fasheh osb->slot_num = OCFS2_INVALID_SLOT; 347*d85b20e4SJoel Becker spin_unlock(&osb->osb_lock); 348ccd979bdSMark Fasheh 349ccd979bdSMark Fasheh status = ocfs2_update_disk_slots(osb, si); 350ccd979bdSMark Fasheh if (status < 0) { 351ccd979bdSMark Fasheh mlog_errno(status); 352ccd979bdSMark Fasheh goto bail; 353ccd979bdSMark Fasheh } 354ccd979bdSMark Fasheh 355ccd979bdSMark Fasheh bail: 3568e8a4603SMark Fasheh ocfs2_free_slot_info(osb); 357ccd979bdSMark Fasheh } 358ccd979bdSMark Fasheh 359