1e7fd4179SDavid Teigland /****************************************************************************** 2e7fd4179SDavid Teigland ******************************************************************************* 3e7fd4179SDavid Teigland ** 4e7fd4179SDavid Teigland ** Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved. 5dbcfc347SDavid Teigland ** Copyright (C) 2005-2008 Red Hat, Inc. All rights reserved. 6e7fd4179SDavid Teigland ** 7e7fd4179SDavid Teigland ** This copyrighted material is made available to anyone wishing to use, 8e7fd4179SDavid Teigland ** modify, copy, or redistribute it subject to the terms and conditions 9e7fd4179SDavid Teigland ** of the GNU General Public License v.2. 10e7fd4179SDavid Teigland ** 11e7fd4179SDavid Teigland ******************************************************************************* 12e7fd4179SDavid Teigland ******************************************************************************/ 13e7fd4179SDavid Teigland 14e7fd4179SDavid Teigland #include "dlm_internal.h" 15e7fd4179SDavid Teigland #include "lockspace.h" 16e7fd4179SDavid Teigland #include "member.h" 17e7fd4179SDavid Teigland #include "lowcomms.h" 18e7fd4179SDavid Teigland #include "midcomms.h" 19e7fd4179SDavid Teigland #include "rcom.h" 20e7fd4179SDavid Teigland #include "recover.h" 21e7fd4179SDavid Teigland #include "dir.h" 22e7fd4179SDavid Teigland #include "config.h" 23e7fd4179SDavid Teigland #include "memory.h" 24e7fd4179SDavid Teigland #include "lock.h" 25e7fd4179SDavid Teigland #include "util.h" 26e7fd4179SDavid Teigland 27e7fd4179SDavid Teigland static int rcom_response(struct dlm_ls *ls) 28e7fd4179SDavid Teigland { 29e7fd4179SDavid Teigland return test_bit(LSFL_RCOM_READY, &ls->ls_flags); 30e7fd4179SDavid Teigland } 31e7fd4179SDavid Teigland 32e7fd4179SDavid Teigland static int create_rcom(struct dlm_ls *ls, int to_nodeid, int type, int len, 33e7fd4179SDavid Teigland struct dlm_rcom **rc_ret, struct dlm_mhandle **mh_ret) 34e7fd4179SDavid Teigland { 35e7fd4179SDavid Teigland struct dlm_rcom *rc; 36e7fd4179SDavid Teigland struct dlm_mhandle *mh; 37e7fd4179SDavid Teigland char *mb; 38e7fd4179SDavid Teigland int mb_len = sizeof(struct dlm_rcom) + len; 39e7fd4179SDavid Teigland 40573c24c4SDavid Teigland mh = dlm_lowcomms_get_buffer(to_nodeid, mb_len, GFP_NOFS, &mb); 41e7fd4179SDavid Teigland if (!mh) { 42e7fd4179SDavid Teigland log_print("create_rcom to %d type %d len %d ENOBUFS", 43e7fd4179SDavid Teigland to_nodeid, type, len); 44e7fd4179SDavid Teigland return -ENOBUFS; 45e7fd4179SDavid Teigland } 46e7fd4179SDavid Teigland memset(mb, 0, mb_len); 47e7fd4179SDavid Teigland 48e7fd4179SDavid Teigland rc = (struct dlm_rcom *) mb; 49e7fd4179SDavid Teigland 50e7fd4179SDavid Teigland rc->rc_header.h_version = (DLM_HEADER_MAJOR | DLM_HEADER_MINOR); 51e7fd4179SDavid Teigland rc->rc_header.h_lockspace = ls->ls_global_id; 52e7fd4179SDavid Teigland rc->rc_header.h_nodeid = dlm_our_nodeid(); 53e7fd4179SDavid Teigland rc->rc_header.h_length = mb_len; 54e7fd4179SDavid Teigland rc->rc_header.h_cmd = DLM_RCOM; 55e7fd4179SDavid Teigland 56e7fd4179SDavid Teigland rc->rc_type = type; 57e7fd4179SDavid Teigland 5838aa8b0cSDavid Teigland spin_lock(&ls->ls_recover_lock); 5938aa8b0cSDavid Teigland rc->rc_seq = ls->ls_recover_seq; 6038aa8b0cSDavid Teigland spin_unlock(&ls->ls_recover_lock); 6138aa8b0cSDavid Teigland 62e7fd4179SDavid Teigland *mh_ret = mh; 63e7fd4179SDavid Teigland *rc_ret = rc; 64e7fd4179SDavid Teigland return 0; 65e7fd4179SDavid Teigland } 66e7fd4179SDavid Teigland 67e7fd4179SDavid Teigland static void send_rcom(struct dlm_ls *ls, struct dlm_mhandle *mh, 68e7fd4179SDavid Teigland struct dlm_rcom *rc) 69e7fd4179SDavid Teigland { 70e7fd4179SDavid Teigland dlm_rcom_out(rc); 71e7fd4179SDavid Teigland dlm_lowcomms_commit_buffer(mh); 72e7fd4179SDavid Teigland } 73e7fd4179SDavid Teigland 74757a4271SDavid Teigland static void set_rcom_status(struct dlm_ls *ls, struct rcom_status *rs, 75757a4271SDavid Teigland uint32_t flags) 76757a4271SDavid Teigland { 77757a4271SDavid Teigland rs->rs_flags = cpu_to_le32(flags); 78757a4271SDavid Teigland } 79757a4271SDavid Teigland 80e7fd4179SDavid Teigland /* When replying to a status request, a node also sends back its 81e7fd4179SDavid Teigland configuration values. The requesting node then checks that the remote 82e7fd4179SDavid Teigland node is configured the same way as itself. */ 83e7fd4179SDavid Teigland 84757a4271SDavid Teigland static void set_rcom_config(struct dlm_ls *ls, struct rcom_config *rf, 85757a4271SDavid Teigland uint32_t num_slots) 86e7fd4179SDavid Teigland { 8793ff2971SAl Viro rf->rf_lvblen = cpu_to_le32(ls->ls_lvblen); 8893ff2971SAl Viro rf->rf_lsflags = cpu_to_le32(ls->ls_exflags); 89757a4271SDavid Teigland 90757a4271SDavid Teigland rf->rf_our_slot = cpu_to_le16(ls->ls_slot); 91757a4271SDavid Teigland rf->rf_num_slots = cpu_to_le16(num_slots); 92757a4271SDavid Teigland rf->rf_generation = cpu_to_le32(ls->ls_generation); 93e7fd4179SDavid Teigland } 94e7fd4179SDavid Teigland 95757a4271SDavid Teigland static int check_rcom_config(struct dlm_ls *ls, struct dlm_rcom *rc, int nodeid) 96e7fd4179SDavid Teigland { 979e971b71SDavid Teigland struct rcom_config *rf = (struct rcom_config *) rc->rc_buf; 989e971b71SDavid Teigland 999e971b71SDavid Teigland if ((rc->rc_header.h_version & 0xFFFF0000) != DLM_HEADER_MAJOR) { 1009e971b71SDavid Teigland log_error(ls, "version mismatch: %x nodeid %d: %x", 1019e971b71SDavid Teigland DLM_HEADER_MAJOR | DLM_HEADER_MINOR, nodeid, 1029e971b71SDavid Teigland rc->rc_header.h_version); 1038b0e7b2cSDavid Teigland return -EPROTO; 1049e971b71SDavid Teigland } 1059e971b71SDavid Teigland 10693ff2971SAl Viro if (le32_to_cpu(rf->rf_lvblen) != ls->ls_lvblen || 10793ff2971SAl Viro le32_to_cpu(rf->rf_lsflags) != ls->ls_exflags) { 108e7fd4179SDavid Teigland log_error(ls, "config mismatch: %d,%x nodeid %d: %d,%x", 10993ff2971SAl Viro ls->ls_lvblen, ls->ls_exflags, nodeid, 11093ff2971SAl Viro le32_to_cpu(rf->rf_lvblen), 11193ff2971SAl Viro le32_to_cpu(rf->rf_lsflags)); 1128b0e7b2cSDavid Teigland return -EPROTO; 113e7fd4179SDavid Teigland } 114e7fd4179SDavid Teigland return 0; 115e7fd4179SDavid Teigland } 116e7fd4179SDavid Teigland 11798f176fbSDavid Teigland static void allow_sync_reply(struct dlm_ls *ls, uint64_t *new_seq) 11898f176fbSDavid Teigland { 11998f176fbSDavid Teigland spin_lock(&ls->ls_rcom_spin); 12098f176fbSDavid Teigland *new_seq = ++ls->ls_rcom_seq; 12198f176fbSDavid Teigland set_bit(LSFL_RCOM_WAIT, &ls->ls_flags); 12298f176fbSDavid Teigland spin_unlock(&ls->ls_rcom_spin); 12398f176fbSDavid Teigland } 12498f176fbSDavid Teigland 12598f176fbSDavid Teigland static void disallow_sync_reply(struct dlm_ls *ls) 12698f176fbSDavid Teigland { 12798f176fbSDavid Teigland spin_lock(&ls->ls_rcom_spin); 12898f176fbSDavid Teigland clear_bit(LSFL_RCOM_WAIT, &ls->ls_flags); 12998f176fbSDavid Teigland clear_bit(LSFL_RCOM_READY, &ls->ls_flags); 13098f176fbSDavid Teigland spin_unlock(&ls->ls_rcom_spin); 13198f176fbSDavid Teigland } 13298f176fbSDavid Teigland 133757a4271SDavid Teigland /* 134757a4271SDavid Teigland * low nodeid gathers one slot value at a time from each node. 135757a4271SDavid Teigland * it sets need_slots=0, and saves rf_our_slot returned from each 136757a4271SDavid Teigland * rcom_config. 137757a4271SDavid Teigland * 138757a4271SDavid Teigland * other nodes gather all slot values at once from the low nodeid. 139757a4271SDavid Teigland * they set need_slots=1, and ignore the rf_our_slot returned from each 140757a4271SDavid Teigland * rcom_config. they use the rf_num_slots returned from the low 141757a4271SDavid Teigland * node's rcom_config. 142757a4271SDavid Teigland */ 143757a4271SDavid Teigland 144757a4271SDavid Teigland int dlm_rcom_status(struct dlm_ls *ls, int nodeid, uint32_t status_flags) 145e7fd4179SDavid Teigland { 146e7fd4179SDavid Teigland struct dlm_rcom *rc; 147e7fd4179SDavid Teigland struct dlm_mhandle *mh; 148e7fd4179SDavid Teigland int error = 0; 149e7fd4179SDavid Teigland 150faa0f267SDavid Teigland ls->ls_recover_nodeid = nodeid; 151e7fd4179SDavid Teigland 152e7fd4179SDavid Teigland if (nodeid == dlm_our_nodeid()) { 1534007685cSAl Viro rc = ls->ls_recover_buf; 154e7fd4179SDavid Teigland rc->rc_result = dlm_recover_status(ls); 155e7fd4179SDavid Teigland goto out; 156e7fd4179SDavid Teigland } 157e7fd4179SDavid Teigland 15859661212Stsutomu.owa@toshiba.co.jp retry: 159757a4271SDavid Teigland error = create_rcom(ls, nodeid, DLM_RCOM_STATUS, 160757a4271SDavid Teigland sizeof(struct rcom_status), &rc, &mh); 161e7fd4179SDavid Teigland if (error) 162e7fd4179SDavid Teigland goto out; 16398f176fbSDavid Teigland 164757a4271SDavid Teigland set_rcom_status(ls, (struct rcom_status *)rc->rc_buf, status_flags); 165757a4271SDavid Teigland 16698f176fbSDavid Teigland allow_sync_reply(ls, &rc->rc_id); 16768c817a1SDavid Teigland memset(ls->ls_recover_buf, 0, dlm_config.ci_buffer_size); 168e7fd4179SDavid Teigland 169e7fd4179SDavid Teigland send_rcom(ls, mh, rc); 170e7fd4179SDavid Teigland 171e7fd4179SDavid Teigland error = dlm_wait_function(ls, &rcom_response); 17298f176fbSDavid Teigland disallow_sync_reply(ls); 17359661212Stsutomu.owa@toshiba.co.jp if (error == -ETIMEDOUT) 17459661212Stsutomu.owa@toshiba.co.jp goto retry; 175e7fd4179SDavid Teigland if (error) 176e7fd4179SDavid Teigland goto out; 177e7fd4179SDavid Teigland 1784007685cSAl Viro rc = ls->ls_recover_buf; 179e7fd4179SDavid Teigland 180e7fd4179SDavid Teigland if (rc->rc_result == -ESRCH) { 181e7fd4179SDavid Teigland /* we pretend the remote lockspace exists with 0 status */ 182e7fd4179SDavid Teigland log_debug(ls, "remote node %d not ready", nodeid); 183e7fd4179SDavid Teigland rc->rc_result = 0; 184757a4271SDavid Teigland error = 0; 185757a4271SDavid Teigland } else { 186757a4271SDavid Teigland error = check_rcom_config(ls, rc, nodeid); 187757a4271SDavid Teigland } 188757a4271SDavid Teigland 189e7fd4179SDavid Teigland /* the caller looks at rc_result for the remote recovery status */ 190e7fd4179SDavid Teigland out: 191e7fd4179SDavid Teigland return error; 192e7fd4179SDavid Teigland } 193e7fd4179SDavid Teigland 194e7fd4179SDavid Teigland static void receive_rcom_status(struct dlm_ls *ls, struct dlm_rcom *rc_in) 195e7fd4179SDavid Teigland { 196e7fd4179SDavid Teigland struct dlm_rcom *rc; 197e7fd4179SDavid Teigland struct dlm_mhandle *mh; 198757a4271SDavid Teigland struct rcom_status *rs; 199757a4271SDavid Teigland uint32_t status; 200757a4271SDavid Teigland int nodeid = rc_in->rc_header.h_nodeid; 201757a4271SDavid Teigland int len = sizeof(struct rcom_config); 202757a4271SDavid Teigland int num_slots = 0; 203757a4271SDavid Teigland int error; 204e7fd4179SDavid Teigland 205757a4271SDavid Teigland if (!dlm_slots_version(&rc_in->rc_header)) { 206757a4271SDavid Teigland status = dlm_recover_status(ls); 207757a4271SDavid Teigland goto do_create; 208757a4271SDavid Teigland } 209757a4271SDavid Teigland 210757a4271SDavid Teigland rs = (struct rcom_status *)rc_in->rc_buf; 211757a4271SDavid Teigland 212c07127b4SNeale Ferguson if (!(le32_to_cpu(rs->rs_flags) & DLM_RSF_NEED_SLOTS)) { 213757a4271SDavid Teigland status = dlm_recover_status(ls); 214757a4271SDavid Teigland goto do_create; 215757a4271SDavid Teigland } 216757a4271SDavid Teigland 217757a4271SDavid Teigland spin_lock(&ls->ls_recover_lock); 218757a4271SDavid Teigland status = ls->ls_recover_status; 219757a4271SDavid Teigland num_slots = ls->ls_num_slots; 220757a4271SDavid Teigland spin_unlock(&ls->ls_recover_lock); 221757a4271SDavid Teigland len += num_slots * sizeof(struct rcom_slot); 222757a4271SDavid Teigland 223757a4271SDavid Teigland do_create: 224e7fd4179SDavid Teigland error = create_rcom(ls, nodeid, DLM_RCOM_STATUS_REPLY, 225757a4271SDavid Teigland len, &rc, &mh); 226e7fd4179SDavid Teigland if (error) 227e7fd4179SDavid Teigland return; 228757a4271SDavid Teigland 2294a99c3d9SDavid Teigland rc->rc_id = rc_in->rc_id; 23038aa8b0cSDavid Teigland rc->rc_seq_reply = rc_in->rc_seq; 231757a4271SDavid Teigland rc->rc_result = status; 232e7fd4179SDavid Teigland 233757a4271SDavid Teigland set_rcom_config(ls, (struct rcom_config *)rc->rc_buf, num_slots); 234757a4271SDavid Teigland 235757a4271SDavid Teigland if (!num_slots) 236757a4271SDavid Teigland goto do_send; 237757a4271SDavid Teigland 238757a4271SDavid Teigland spin_lock(&ls->ls_recover_lock); 239757a4271SDavid Teigland if (ls->ls_num_slots != num_slots) { 240757a4271SDavid Teigland spin_unlock(&ls->ls_recover_lock); 241757a4271SDavid Teigland log_debug(ls, "receive_rcom_status num_slots %d to %d", 242757a4271SDavid Teigland num_slots, ls->ls_num_slots); 243757a4271SDavid Teigland rc->rc_result = 0; 244757a4271SDavid Teigland set_rcom_config(ls, (struct rcom_config *)rc->rc_buf, 0); 245757a4271SDavid Teigland goto do_send; 246757a4271SDavid Teigland } 247757a4271SDavid Teigland 248757a4271SDavid Teigland dlm_slots_copy_out(ls, rc); 249757a4271SDavid Teigland spin_unlock(&ls->ls_recover_lock); 250757a4271SDavid Teigland 251757a4271SDavid Teigland do_send: 252e7fd4179SDavid Teigland send_rcom(ls, mh, rc); 253e7fd4179SDavid Teigland } 254e7fd4179SDavid Teigland 2554a99c3d9SDavid Teigland static void receive_sync_reply(struct dlm_ls *ls, struct dlm_rcom *rc_in) 256e7fd4179SDavid Teigland { 25798f176fbSDavid Teigland spin_lock(&ls->ls_rcom_spin); 25898f176fbSDavid Teigland if (!test_bit(LSFL_RCOM_WAIT, &ls->ls_flags) || 25998f176fbSDavid Teigland rc_in->rc_id != ls->ls_rcom_seq) { 26098f176fbSDavid Teigland log_debug(ls, "reject reply %d from %d seq %llx expect %llx", 26198f176fbSDavid Teigland rc_in->rc_type, rc_in->rc_header.h_nodeid, 26257adf7eeSRyusuke Konishi (unsigned long long)rc_in->rc_id, 26357adf7eeSRyusuke Konishi (unsigned long long)ls->ls_rcom_seq); 26498f176fbSDavid Teigland goto out; 2654a99c3d9SDavid Teigland } 266e7fd4179SDavid Teigland memcpy(ls->ls_recover_buf, rc_in, rc_in->rc_header.h_length); 267e7fd4179SDavid Teigland set_bit(LSFL_RCOM_READY, &ls->ls_flags); 26898f176fbSDavid Teigland clear_bit(LSFL_RCOM_WAIT, &ls->ls_flags); 269e7fd4179SDavid Teigland wake_up(&ls->ls_wait_general); 27098f176fbSDavid Teigland out: 27198f176fbSDavid Teigland spin_unlock(&ls->ls_rcom_spin); 272e7fd4179SDavid Teigland } 273e7fd4179SDavid Teigland 274e7fd4179SDavid Teigland int dlm_rcom_names(struct dlm_ls *ls, int nodeid, char *last_name, int last_len) 275e7fd4179SDavid Teigland { 276e7fd4179SDavid Teigland struct dlm_rcom *rc; 277e7fd4179SDavid Teigland struct dlm_mhandle *mh; 2784007685cSAl Viro int error = 0; 279e7fd4179SDavid Teigland 280faa0f267SDavid Teigland ls->ls_recover_nodeid = nodeid; 281e7fd4179SDavid Teigland 28259661212Stsutomu.owa@toshiba.co.jp retry: 283e7fd4179SDavid Teigland error = create_rcom(ls, nodeid, DLM_RCOM_NAMES, last_len, &rc, &mh); 284e7fd4179SDavid Teigland if (error) 285e7fd4179SDavid Teigland goto out; 286e7fd4179SDavid Teigland memcpy(rc->rc_buf, last_name, last_len); 28798f176fbSDavid Teigland 28898f176fbSDavid Teigland allow_sync_reply(ls, &rc->rc_id); 28968c817a1SDavid Teigland memset(ls->ls_recover_buf, 0, dlm_config.ci_buffer_size); 290e7fd4179SDavid Teigland 291e7fd4179SDavid Teigland send_rcom(ls, mh, rc); 292e7fd4179SDavid Teigland 293e7fd4179SDavid Teigland error = dlm_wait_function(ls, &rcom_response); 29498f176fbSDavid Teigland disallow_sync_reply(ls); 29559661212Stsutomu.owa@toshiba.co.jp if (error == -ETIMEDOUT) 29659661212Stsutomu.owa@toshiba.co.jp goto retry; 297e7fd4179SDavid Teigland out: 298e7fd4179SDavid Teigland return error; 299e7fd4179SDavid Teigland } 300e7fd4179SDavid Teigland 301e7fd4179SDavid Teigland static void receive_rcom_names(struct dlm_ls *ls, struct dlm_rcom *rc_in) 302e7fd4179SDavid Teigland { 303e7fd4179SDavid Teigland struct dlm_rcom *rc; 304e7fd4179SDavid Teigland struct dlm_mhandle *mh; 30538aa8b0cSDavid Teigland int error, inlen, outlen, nodeid; 306e7fd4179SDavid Teigland 307e7fd4179SDavid Teigland nodeid = rc_in->rc_header.h_nodeid; 308e7fd4179SDavid Teigland inlen = rc_in->rc_header.h_length - sizeof(struct dlm_rcom); 30968c817a1SDavid Teigland outlen = dlm_config.ci_buffer_size - sizeof(struct dlm_rcom); 310e7fd4179SDavid Teigland 311e7fd4179SDavid Teigland error = create_rcom(ls, nodeid, DLM_RCOM_NAMES_REPLY, outlen, &rc, &mh); 312e7fd4179SDavid Teigland if (error) 313e7fd4179SDavid Teigland return; 3144a99c3d9SDavid Teigland rc->rc_id = rc_in->rc_id; 31538aa8b0cSDavid Teigland rc->rc_seq_reply = rc_in->rc_seq; 316e7fd4179SDavid Teigland 317e7fd4179SDavid Teigland dlm_copy_master_names(ls, rc_in->rc_buf, inlen, rc->rc_buf, outlen, 318e7fd4179SDavid Teigland nodeid); 319e7fd4179SDavid Teigland send_rcom(ls, mh, rc); 320e7fd4179SDavid Teigland } 321e7fd4179SDavid Teigland 322e7fd4179SDavid Teigland int dlm_send_rcom_lookup(struct dlm_rsb *r, int dir_nodeid) 323e7fd4179SDavid Teigland { 324e7fd4179SDavid Teigland struct dlm_rcom *rc; 325e7fd4179SDavid Teigland struct dlm_mhandle *mh; 326e7fd4179SDavid Teigland struct dlm_ls *ls = r->res_ls; 327e7fd4179SDavid Teigland int error; 328e7fd4179SDavid Teigland 329e7fd4179SDavid Teigland error = create_rcom(ls, dir_nodeid, DLM_RCOM_LOOKUP, r->res_length, 330e7fd4179SDavid Teigland &rc, &mh); 331e7fd4179SDavid Teigland if (error) 332e7fd4179SDavid Teigland goto out; 333e7fd4179SDavid Teigland memcpy(rc->rc_buf, r->res_name, r->res_length); 3341d7c484eSDavid Teigland rc->rc_id = (unsigned long) r->res_id; 335e7fd4179SDavid Teigland 336e7fd4179SDavid Teigland send_rcom(ls, mh, rc); 337e7fd4179SDavid Teigland out: 338e7fd4179SDavid Teigland return error; 339e7fd4179SDavid Teigland } 340e7fd4179SDavid Teigland 341e7fd4179SDavid Teigland static void receive_rcom_lookup(struct dlm_ls *ls, struct dlm_rcom *rc_in) 342e7fd4179SDavid Teigland { 343e7fd4179SDavid Teigland struct dlm_rcom *rc; 344e7fd4179SDavid Teigland struct dlm_mhandle *mh; 345e7fd4179SDavid Teigland int error, ret_nodeid, nodeid = rc_in->rc_header.h_nodeid; 346e7fd4179SDavid Teigland int len = rc_in->rc_header.h_length - sizeof(struct dlm_rcom); 347e7fd4179SDavid Teigland 348e7fd4179SDavid Teigland error = create_rcom(ls, nodeid, DLM_RCOM_LOOKUP_REPLY, 0, &rc, &mh); 349e7fd4179SDavid Teigland if (error) 350e7fd4179SDavid Teigland return; 351e7fd4179SDavid Teigland 352*9250e523SDavid Teigland /* Old code would send this special id to trigger a debug dump. */ 353c04fecb4SDavid Teigland if (rc_in->rc_id == 0xFFFFFFFF) { 354c04fecb4SDavid Teigland log_error(ls, "receive_rcom_lookup dump from %d", nodeid); 355c04fecb4SDavid Teigland dlm_dump_rsb_name(ls, rc_in->rc_buf, len); 356c04fecb4SDavid Teigland return; 357c04fecb4SDavid Teigland } 358c04fecb4SDavid Teigland 359c04fecb4SDavid Teigland error = dlm_master_lookup(ls, nodeid, rc_in->rc_buf, len, 360c04fecb4SDavid Teigland DLM_LU_RECOVER_MASTER, &ret_nodeid, NULL); 361e7fd4179SDavid Teigland if (error) 362e7fd4179SDavid Teigland ret_nodeid = error; 363e7fd4179SDavid Teigland rc->rc_result = ret_nodeid; 364e7fd4179SDavid Teigland rc->rc_id = rc_in->rc_id; 36538aa8b0cSDavid Teigland rc->rc_seq_reply = rc_in->rc_seq; 366e7fd4179SDavid Teigland 367e7fd4179SDavid Teigland send_rcom(ls, mh, rc); 368e7fd4179SDavid Teigland } 369e7fd4179SDavid Teigland 370e7fd4179SDavid Teigland static void receive_rcom_lookup_reply(struct dlm_ls *ls, struct dlm_rcom *rc_in) 371e7fd4179SDavid Teigland { 372e7fd4179SDavid Teigland dlm_recover_master_reply(ls, rc_in); 373e7fd4179SDavid Teigland } 374e7fd4179SDavid Teigland 375e7fd4179SDavid Teigland static void pack_rcom_lock(struct dlm_rsb *r, struct dlm_lkb *lkb, 376e7fd4179SDavid Teigland struct rcom_lock *rl) 377e7fd4179SDavid Teigland { 378e7fd4179SDavid Teigland memset(rl, 0, sizeof(*rl)); 379e7fd4179SDavid Teigland 380163a1859SAl Viro rl->rl_ownpid = cpu_to_le32(lkb->lkb_ownpid); 381163a1859SAl Viro rl->rl_lkid = cpu_to_le32(lkb->lkb_id); 382163a1859SAl Viro rl->rl_exflags = cpu_to_le32(lkb->lkb_exflags); 383163a1859SAl Viro rl->rl_flags = cpu_to_le32(lkb->lkb_flags); 384163a1859SAl Viro rl->rl_lvbseq = cpu_to_le32(lkb->lkb_lvbseq); 385e7fd4179SDavid Teigland rl->rl_rqmode = lkb->lkb_rqmode; 386e7fd4179SDavid Teigland rl->rl_grmode = lkb->lkb_grmode; 387e7fd4179SDavid Teigland rl->rl_status = lkb->lkb_status; 388163a1859SAl Viro rl->rl_wait_type = cpu_to_le16(lkb->lkb_wait_type); 389e7fd4179SDavid Teigland 390e5dae548SDavid Teigland if (lkb->lkb_bastfn) 3918304d6f2SDavid Teigland rl->rl_asts |= DLM_CB_BAST; 392e5dae548SDavid Teigland if (lkb->lkb_astfn) 3938304d6f2SDavid Teigland rl->rl_asts |= DLM_CB_CAST; 394e7fd4179SDavid Teigland 395163a1859SAl Viro rl->rl_namelen = cpu_to_le16(r->res_length); 396e7fd4179SDavid Teigland memcpy(rl->rl_name, r->res_name, r->res_length); 397e7fd4179SDavid Teigland 398e7fd4179SDavid Teigland /* FIXME: might we have an lvb without DLM_LKF_VALBLK set ? 399e7fd4179SDavid Teigland If so, receive_rcom_lock_args() won't take this copy. */ 400e7fd4179SDavid Teigland 401e7fd4179SDavid Teigland if (lkb->lkb_lvbptr) 402e7fd4179SDavid Teigland memcpy(rl->rl_lvb, lkb->lkb_lvbptr, r->res_ls->ls_lvblen); 403e7fd4179SDavid Teigland } 404e7fd4179SDavid Teigland 405e7fd4179SDavid Teigland int dlm_send_rcom_lock(struct dlm_rsb *r, struct dlm_lkb *lkb) 406e7fd4179SDavid Teigland { 407e7fd4179SDavid Teigland struct dlm_ls *ls = r->res_ls; 408e7fd4179SDavid Teigland struct dlm_rcom *rc; 409e7fd4179SDavid Teigland struct dlm_mhandle *mh; 410e7fd4179SDavid Teigland struct rcom_lock *rl; 411e7fd4179SDavid Teigland int error, len = sizeof(struct rcom_lock); 412e7fd4179SDavid Teigland 413e7fd4179SDavid Teigland if (lkb->lkb_lvbptr) 414e7fd4179SDavid Teigland len += ls->ls_lvblen; 415e7fd4179SDavid Teigland 416e7fd4179SDavid Teigland error = create_rcom(ls, r->res_nodeid, DLM_RCOM_LOCK, len, &rc, &mh); 417e7fd4179SDavid Teigland if (error) 418e7fd4179SDavid Teigland goto out; 419e7fd4179SDavid Teigland 420e7fd4179SDavid Teigland rl = (struct rcom_lock *) rc->rc_buf; 421e7fd4179SDavid Teigland pack_rcom_lock(r, lkb, rl); 422e7fd4179SDavid Teigland rc->rc_id = (unsigned long) r; 423e7fd4179SDavid Teigland 424e7fd4179SDavid Teigland send_rcom(ls, mh, rc); 425e7fd4179SDavid Teigland out: 426e7fd4179SDavid Teigland return error; 427e7fd4179SDavid Teigland } 428e7fd4179SDavid Teigland 429ae773d0bSAl Viro /* needs at least dlm_rcom + rcom_lock */ 430e7fd4179SDavid Teigland static void receive_rcom_lock(struct dlm_ls *ls, struct dlm_rcom *rc_in) 431e7fd4179SDavid Teigland { 432e7fd4179SDavid Teigland struct dlm_rcom *rc; 433e7fd4179SDavid Teigland struct dlm_mhandle *mh; 434e7fd4179SDavid Teigland int error, nodeid = rc_in->rc_header.h_nodeid; 435e7fd4179SDavid Teigland 436e7fd4179SDavid Teigland dlm_recover_master_copy(ls, rc_in); 437e7fd4179SDavid Teigland 438e7fd4179SDavid Teigland error = create_rcom(ls, nodeid, DLM_RCOM_LOCK_REPLY, 439e7fd4179SDavid Teigland sizeof(struct rcom_lock), &rc, &mh); 440e7fd4179SDavid Teigland if (error) 441e7fd4179SDavid Teigland return; 442e7fd4179SDavid Teigland 443e7fd4179SDavid Teigland /* We send back the same rcom_lock struct we received, but 444e7fd4179SDavid Teigland dlm_recover_master_copy() has filled in rl_remid and rl_result */ 445e7fd4179SDavid Teigland 446e7fd4179SDavid Teigland memcpy(rc->rc_buf, rc_in->rc_buf, sizeof(struct rcom_lock)); 447e7fd4179SDavid Teigland rc->rc_id = rc_in->rc_id; 44838aa8b0cSDavid Teigland rc->rc_seq_reply = rc_in->rc_seq; 449e7fd4179SDavid Teigland 450e7fd4179SDavid Teigland send_rcom(ls, mh, rc); 451e7fd4179SDavid Teigland } 452e7fd4179SDavid Teigland 453c36258b5SDavid Teigland /* If the lockspace doesn't exist then still send a status message 454c36258b5SDavid Teigland back; it's possible that it just doesn't have its global_id yet. */ 455c36258b5SDavid Teigland 456c36258b5SDavid Teigland int dlm_send_ls_not_ready(int nodeid, struct dlm_rcom *rc_in) 457e7fd4179SDavid Teigland { 458e7fd4179SDavid Teigland struct dlm_rcom *rc; 4591babdb45SDavid Teigland struct rcom_config *rf; 460e7fd4179SDavid Teigland struct dlm_mhandle *mh; 461e7fd4179SDavid Teigland char *mb; 4621babdb45SDavid Teigland int mb_len = sizeof(struct dlm_rcom) + sizeof(struct rcom_config); 463e7fd4179SDavid Teigland 46441684f95SDavid Teigland mh = dlm_lowcomms_get_buffer(nodeid, mb_len, GFP_NOFS, &mb); 465e7fd4179SDavid Teigland if (!mh) 466e7fd4179SDavid Teigland return -ENOBUFS; 467e7fd4179SDavid Teigland memset(mb, 0, mb_len); 468e7fd4179SDavid Teigland 469e7fd4179SDavid Teigland rc = (struct dlm_rcom *) mb; 470e7fd4179SDavid Teigland 471e7fd4179SDavid Teigland rc->rc_header.h_version = (DLM_HEADER_MAJOR | DLM_HEADER_MINOR); 472e7fd4179SDavid Teigland rc->rc_header.h_lockspace = rc_in->rc_header.h_lockspace; 473e7fd4179SDavid Teigland rc->rc_header.h_nodeid = dlm_our_nodeid(); 474e7fd4179SDavid Teigland rc->rc_header.h_length = mb_len; 475e7fd4179SDavid Teigland rc->rc_header.h_cmd = DLM_RCOM; 476e7fd4179SDavid Teigland 477e7fd4179SDavid Teigland rc->rc_type = DLM_RCOM_STATUS_REPLY; 478f5888750SDavid Teigland rc->rc_id = rc_in->rc_id; 47938aa8b0cSDavid Teigland rc->rc_seq_reply = rc_in->rc_seq; 480e7fd4179SDavid Teigland rc->rc_result = -ESRCH; 481e7fd4179SDavid Teigland 4821babdb45SDavid Teigland rf = (struct rcom_config *) rc->rc_buf; 48393ff2971SAl Viro rf->rf_lvblen = cpu_to_le32(~0U); 4841babdb45SDavid Teigland 485e7fd4179SDavid Teigland dlm_rcom_out(rc); 486e7fd4179SDavid Teigland dlm_lowcomms_commit_buffer(mh); 487e7fd4179SDavid Teigland 488e7fd4179SDavid Teigland return 0; 489e7fd4179SDavid Teigland } 490e7fd4179SDavid Teigland 491c04fecb4SDavid Teigland /* 492c04fecb4SDavid Teigland * Ignore messages for stage Y before we set 493c04fecb4SDavid Teigland * recover_status bit for stage X: 494c04fecb4SDavid Teigland * 495c04fecb4SDavid Teigland * recover_status = 0 496c04fecb4SDavid Teigland * 497c04fecb4SDavid Teigland * dlm_recover_members() 498c04fecb4SDavid Teigland * - send nothing 499c04fecb4SDavid Teigland * - recv nothing 500c04fecb4SDavid Teigland * - ignore NAMES, NAMES_REPLY 501c04fecb4SDavid Teigland * - ignore LOOKUP, LOOKUP_REPLY 502c04fecb4SDavid Teigland * - ignore LOCK, LOCK_REPLY 503c04fecb4SDavid Teigland * 504c04fecb4SDavid Teigland * recover_status |= NODES 505c04fecb4SDavid Teigland * 506c04fecb4SDavid Teigland * dlm_recover_members_wait() 507c04fecb4SDavid Teigland * 508c04fecb4SDavid Teigland * dlm_recover_directory() 509c04fecb4SDavid Teigland * - send NAMES 510c04fecb4SDavid Teigland * - recv NAMES_REPLY 511c04fecb4SDavid Teigland * - ignore LOOKUP, LOOKUP_REPLY 512c04fecb4SDavid Teigland * - ignore LOCK, LOCK_REPLY 513c04fecb4SDavid Teigland * 514c04fecb4SDavid Teigland * recover_status |= DIR 515c04fecb4SDavid Teigland * 516c04fecb4SDavid Teigland * dlm_recover_directory_wait() 517c04fecb4SDavid Teigland * 518c04fecb4SDavid Teigland * dlm_recover_masters() 519c04fecb4SDavid Teigland * - send LOOKUP 520c04fecb4SDavid Teigland * - recv LOOKUP_REPLY 521c04fecb4SDavid Teigland * 522c04fecb4SDavid Teigland * dlm_recover_locks() 523c04fecb4SDavid Teigland * - send LOCKS 524c04fecb4SDavid Teigland * - recv LOCKS_REPLY 525c04fecb4SDavid Teigland * 526c04fecb4SDavid Teigland * recover_status |= LOCKS 527c04fecb4SDavid Teigland * 528c04fecb4SDavid Teigland * dlm_recover_locks_wait() 529c04fecb4SDavid Teigland * 530c04fecb4SDavid Teigland * recover_status |= DONE 531c04fecb4SDavid Teigland */ 532c04fecb4SDavid Teigland 533c36258b5SDavid Teigland /* Called by dlm_recv; corresponds to dlm_receive_message() but special 534e7fd4179SDavid Teigland recovery-only comms are sent through here. */ 535e7fd4179SDavid Teigland 536c36258b5SDavid Teigland void dlm_receive_rcom(struct dlm_ls *ls, struct dlm_rcom *rc, int nodeid) 537e7fd4179SDavid Teigland { 538ae773d0bSAl Viro int lock_size = sizeof(struct dlm_rcom) + sizeof(struct rcom_lock); 539c04fecb4SDavid Teigland int stop, reply = 0, names = 0, lookup = 0, lock = 0; 5404875647aSDavid Teigland uint32_t status; 541d6e24788SDavid Teigland uint64_t seq; 542ae773d0bSAl Viro 543d6e24788SDavid Teigland switch (rc->rc_type) { 544c04fecb4SDavid Teigland case DLM_RCOM_STATUS_REPLY: 545c04fecb4SDavid Teigland reply = 1; 546c04fecb4SDavid Teigland break; 547c04fecb4SDavid Teigland case DLM_RCOM_NAMES: 548c04fecb4SDavid Teigland names = 1; 549c04fecb4SDavid Teigland break; 550c04fecb4SDavid Teigland case DLM_RCOM_NAMES_REPLY: 551c04fecb4SDavid Teigland names = 1; 552c04fecb4SDavid Teigland reply = 1; 553c04fecb4SDavid Teigland break; 554c04fecb4SDavid Teigland case DLM_RCOM_LOOKUP: 555c04fecb4SDavid Teigland lookup = 1; 556c04fecb4SDavid Teigland break; 557c04fecb4SDavid Teigland case DLM_RCOM_LOOKUP_REPLY: 558c04fecb4SDavid Teigland lookup = 1; 559c04fecb4SDavid Teigland reply = 1; 560c04fecb4SDavid Teigland break; 5614875647aSDavid Teigland case DLM_RCOM_LOCK: 5624875647aSDavid Teigland lock = 1; 5634875647aSDavid Teigland break; 5644875647aSDavid Teigland case DLM_RCOM_LOCK_REPLY: 5654875647aSDavid Teigland lock = 1; 5664875647aSDavid Teigland reply = 1; 5674875647aSDavid Teigland break; 568d6e24788SDavid Teigland }; 569d6e24788SDavid Teigland 570d6e24788SDavid Teigland spin_lock(&ls->ls_recover_lock); 5714875647aSDavid Teigland status = ls->ls_recover_status; 572475f230cSDavid Teigland stop = test_bit(LSFL_RECOVER_STOP, &ls->ls_flags); 573d6e24788SDavid Teigland seq = ls->ls_recover_seq; 574d6e24788SDavid Teigland spin_unlock(&ls->ls_recover_lock); 575d6e24788SDavid Teigland 576c04fecb4SDavid Teigland if (stop && (rc->rc_type != DLM_RCOM_STATUS)) 577c04fecb4SDavid Teigland goto ignore; 578c04fecb4SDavid Teigland 579c04fecb4SDavid Teigland if (reply && (rc->rc_seq_reply != seq)) 580c04fecb4SDavid Teigland goto ignore; 581c04fecb4SDavid Teigland 582c04fecb4SDavid Teigland if (!(status & DLM_RS_NODES) && (names || lookup || lock)) 583c04fecb4SDavid Teigland goto ignore; 584c04fecb4SDavid Teigland 585c04fecb4SDavid Teigland if (!(status & DLM_RS_DIR) && (lookup || lock)) 586c04fecb4SDavid Teigland goto ignore; 587e7fd4179SDavid Teigland 588e7fd4179SDavid Teigland switch (rc->rc_type) { 589e7fd4179SDavid Teigland case DLM_RCOM_STATUS: 590e7fd4179SDavid Teigland receive_rcom_status(ls, rc); 591e7fd4179SDavid Teigland break; 592e7fd4179SDavid Teigland 593e7fd4179SDavid Teigland case DLM_RCOM_NAMES: 594e7fd4179SDavid Teigland receive_rcom_names(ls, rc); 595e7fd4179SDavid Teigland break; 596e7fd4179SDavid Teigland 597e7fd4179SDavid Teigland case DLM_RCOM_LOOKUP: 598e7fd4179SDavid Teigland receive_rcom_lookup(ls, rc); 599e7fd4179SDavid Teigland break; 600e7fd4179SDavid Teigland 601e7fd4179SDavid Teigland case DLM_RCOM_LOCK: 602ae773d0bSAl Viro if (rc->rc_header.h_length < lock_size) 603ae773d0bSAl Viro goto Eshort; 604e7fd4179SDavid Teigland receive_rcom_lock(ls, rc); 605e7fd4179SDavid Teigland break; 606e7fd4179SDavid Teigland 607e7fd4179SDavid Teigland case DLM_RCOM_STATUS_REPLY: 608dbcfc347SDavid Teigland receive_sync_reply(ls, rc); 609e7fd4179SDavid Teigland break; 610e7fd4179SDavid Teigland 611e7fd4179SDavid Teigland case DLM_RCOM_NAMES_REPLY: 612dbcfc347SDavid Teigland receive_sync_reply(ls, rc); 613e7fd4179SDavid Teigland break; 614e7fd4179SDavid Teigland 615e7fd4179SDavid Teigland case DLM_RCOM_LOOKUP_REPLY: 616e7fd4179SDavid Teigland receive_rcom_lookup_reply(ls, rc); 617e7fd4179SDavid Teigland break; 618e7fd4179SDavid Teigland 619e7fd4179SDavid Teigland case DLM_RCOM_LOCK_REPLY: 620ae773d0bSAl Viro if (rc->rc_header.h_length < lock_size) 621ae773d0bSAl Viro goto Eshort; 622dbcfc347SDavid Teigland dlm_recover_process_copy(ls, rc); 623e7fd4179SDavid Teigland break; 624e7fd4179SDavid Teigland 625e7fd4179SDavid Teigland default: 626dbcfc347SDavid Teigland log_error(ls, "receive_rcom bad type %d", rc->rc_type); 627e7fd4179SDavid Teigland } 628c04fecb4SDavid Teigland return; 629c04fecb4SDavid Teigland 630c04fecb4SDavid Teigland ignore: 631c04fecb4SDavid Teigland log_limit(ls, "dlm_receive_rcom ignore msg %d " 632c04fecb4SDavid Teigland "from %d %llu %llu recover seq %llu sts %x gen %u", 633c04fecb4SDavid Teigland rc->rc_type, 634c04fecb4SDavid Teigland nodeid, 635c04fecb4SDavid Teigland (unsigned long long)rc->rc_seq, 636c04fecb4SDavid Teigland (unsigned long long)rc->rc_seq_reply, 637c04fecb4SDavid Teigland (unsigned long long)seq, 638c04fecb4SDavid Teigland status, ls->ls_generation); 639c36258b5SDavid Teigland return; 640ae773d0bSAl Viro Eshort: 641c04fecb4SDavid Teigland log_error(ls, "recovery message %d from %d is too short", 642ae773d0bSAl Viro rc->rc_type, nodeid); 643e7fd4179SDavid Teigland } 644e7fd4179SDavid Teigland 645