xref: /openbmc/linux/fs/dlm/rcom.c (revision 88aa023a2556aae92664f135eae794be9449e4f3)
12522fe45SThomas Gleixner // SPDX-License-Identifier: GPL-2.0-only
2e7fd4179SDavid Teigland /******************************************************************************
3e7fd4179SDavid Teigland *******************************************************************************
4e7fd4179SDavid Teigland **
5e7fd4179SDavid Teigland **  Copyright (C) Sistina Software, Inc.  1997-2003  All rights reserved.
6dbcfc347SDavid Teigland **  Copyright (C) 2005-2008 Red Hat, Inc.  All rights reserved.
7e7fd4179SDavid Teigland **
8e7fd4179SDavid Teigland **
9e7fd4179SDavid Teigland *******************************************************************************
10e7fd4179SDavid Teigland ******************************************************************************/
11e7fd4179SDavid Teigland 
12e7fd4179SDavid Teigland #include "dlm_internal.h"
13e7fd4179SDavid Teigland #include "lockspace.h"
14e7fd4179SDavid Teigland #include "member.h"
15e7fd4179SDavid Teigland #include "lowcomms.h"
16e7fd4179SDavid Teigland #include "midcomms.h"
17e7fd4179SDavid Teigland #include "rcom.h"
18e7fd4179SDavid Teigland #include "recover.h"
19e7fd4179SDavid Teigland #include "dir.h"
20e7fd4179SDavid Teigland #include "config.h"
21e7fd4179SDavid Teigland #include "memory.h"
22e7fd4179SDavid Teigland #include "lock.h"
23e7fd4179SDavid Teigland #include "util.h"
24e7fd4179SDavid Teigland 
25e7fd4179SDavid Teigland static int rcom_response(struct dlm_ls *ls)
26e7fd4179SDavid Teigland {
27e7fd4179SDavid Teigland 	return test_bit(LSFL_RCOM_READY, &ls->ls_flags);
28e7fd4179SDavid Teigland }
29e7fd4179SDavid Teigland 
30a070a91cSAlexander Aring static void _create_rcom(struct dlm_ls *ls, int to_nodeid, int type, int len,
31a070a91cSAlexander Aring 			 struct dlm_rcom **rc_ret, char *mb, int mb_len)
32e7fd4179SDavid Teigland {
33e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
34e7fd4179SDavid Teigland 
35e7fd4179SDavid Teigland 	rc = (struct dlm_rcom *) mb;
36e7fd4179SDavid Teigland 
37e7fd4179SDavid Teigland 	rc->rc_header.h_version = (DLM_HEADER_MAJOR | DLM_HEADER_MINOR);
388e2e4086SAlexander Aring 	rc->rc_header.u.h_lockspace = ls->ls_global_id;
39e7fd4179SDavid Teigland 	rc->rc_header.h_nodeid = dlm_our_nodeid();
40e7fd4179SDavid Teigland 	rc->rc_header.h_length = mb_len;
41e7fd4179SDavid Teigland 	rc->rc_header.h_cmd = DLM_RCOM;
42e7fd4179SDavid Teigland 
43e7fd4179SDavid Teigland 	rc->rc_type = type;
44e7fd4179SDavid Teigland 
4538aa8b0cSDavid Teigland 	spin_lock(&ls->ls_recover_lock);
4638aa8b0cSDavid Teigland 	rc->rc_seq = ls->ls_recover_seq;
4738aa8b0cSDavid Teigland 	spin_unlock(&ls->ls_recover_lock);
4838aa8b0cSDavid Teigland 
49e7fd4179SDavid Teigland 	*rc_ret = rc;
50a070a91cSAlexander Aring }
51a070a91cSAlexander Aring 
52a070a91cSAlexander Aring static int create_rcom(struct dlm_ls *ls, int to_nodeid, int type, int len,
53a070a91cSAlexander Aring 		       struct dlm_rcom **rc_ret, struct dlm_mhandle **mh_ret)
54a070a91cSAlexander Aring {
55a070a91cSAlexander Aring 	int mb_len = sizeof(struct dlm_rcom) + len;
56a070a91cSAlexander Aring 	struct dlm_mhandle *mh;
57a070a91cSAlexander Aring 	char *mb;
58a070a91cSAlexander Aring 
59a070a91cSAlexander Aring 	mh = dlm_midcomms_get_mhandle(to_nodeid, mb_len, GFP_NOFS, &mb);
60a070a91cSAlexander Aring 	if (!mh) {
61a070a91cSAlexander Aring 		log_print("%s to %d type %d len %d ENOBUFS",
62a070a91cSAlexander Aring 			  __func__, to_nodeid, type, len);
63a070a91cSAlexander Aring 		return -ENOBUFS;
64a070a91cSAlexander Aring 	}
65a070a91cSAlexander Aring 
66a070a91cSAlexander Aring 	_create_rcom(ls, to_nodeid, type, len, rc_ret, mb, mb_len);
67a070a91cSAlexander Aring 	*mh_ret = mh;
68e7fd4179SDavid Teigland 	return 0;
69e7fd4179SDavid Teigland }
70e7fd4179SDavid Teigland 
71a070a91cSAlexander Aring static int create_rcom_stateless(struct dlm_ls *ls, int to_nodeid, int type,
72a070a91cSAlexander Aring 				 int len, struct dlm_rcom **rc_ret,
738f2dc78dSAlexander Aring 				 struct dlm_msg **msg_ret)
74a070a91cSAlexander Aring {
75a070a91cSAlexander Aring 	int mb_len = sizeof(struct dlm_rcom) + len;
768f2dc78dSAlexander Aring 	struct dlm_msg *msg;
77a070a91cSAlexander Aring 	char *mb;
78a070a91cSAlexander Aring 
798f2dc78dSAlexander Aring 	msg = dlm_lowcomms_new_msg(to_nodeid, mb_len, GFP_NOFS, &mb,
808f2dc78dSAlexander Aring 				   NULL, NULL);
818f2dc78dSAlexander Aring 	if (!msg) {
82a070a91cSAlexander Aring 		log_print("create_rcom to %d type %d len %d ENOBUFS",
83a070a91cSAlexander Aring 			  to_nodeid, type, len);
84a070a91cSAlexander Aring 		return -ENOBUFS;
85a070a91cSAlexander Aring 	}
86a070a91cSAlexander Aring 
87a070a91cSAlexander Aring 	_create_rcom(ls, to_nodeid, type, len, rc_ret, mb, mb_len);
888f2dc78dSAlexander Aring 	*msg_ret = msg;
89a070a91cSAlexander Aring 	return 0;
90a070a91cSAlexander Aring }
91a070a91cSAlexander Aring 
/*
 * Send an rcom built by create_rcom(): run dlm_rcom_out() on the message,
 * then commit the midcomms handle it was built in.
 */
static void send_rcom(struct dlm_mhandle *mh, struct dlm_rcom *rc)
{
	dlm_rcom_out(rc);

	dlm_midcomms_commit_mhandle(mh);
}
97a070a91cSAlexander Aring 
/*
 * Send an rcom built by create_rcom_stateless(): run dlm_rcom_out() on the
 * message, commit the lowcomms message and then put it.
 */
static void send_rcom_stateless(struct dlm_msg *msg, struct dlm_rcom *rc)
{
	dlm_rcom_out(rc);

	dlm_lowcomms_commit_msg(msg);
	dlm_lowcomms_put_msg(msg);
}
104e7fd4179SDavid Teigland 
105757a4271SDavid Teigland static void set_rcom_status(struct dlm_ls *ls, struct rcom_status *rs,
106757a4271SDavid Teigland 			    uint32_t flags)
107757a4271SDavid Teigland {
108757a4271SDavid Teigland 	rs->rs_flags = cpu_to_le32(flags);
109757a4271SDavid Teigland }
110757a4271SDavid Teigland 
111e7fd4179SDavid Teigland /* When replying to a status request, a node also sends back its
112e7fd4179SDavid Teigland    configuration values.  The requesting node then checks that the remote
113e7fd4179SDavid Teigland    node is configured the same way as itself. */
114e7fd4179SDavid Teigland 
115757a4271SDavid Teigland static void set_rcom_config(struct dlm_ls *ls, struct rcom_config *rf,
116757a4271SDavid Teigland 			    uint32_t num_slots)
117e7fd4179SDavid Teigland {
11893ff2971SAl Viro 	rf->rf_lvblen = cpu_to_le32(ls->ls_lvblen);
11993ff2971SAl Viro 	rf->rf_lsflags = cpu_to_le32(ls->ls_exflags);
120757a4271SDavid Teigland 
121757a4271SDavid Teigland 	rf->rf_our_slot = cpu_to_le16(ls->ls_slot);
122757a4271SDavid Teigland 	rf->rf_num_slots = cpu_to_le16(num_slots);
123757a4271SDavid Teigland 	rf->rf_generation =  cpu_to_le32(ls->ls_generation);
124e7fd4179SDavid Teigland }
125e7fd4179SDavid Teigland 
126757a4271SDavid Teigland static int check_rcom_config(struct dlm_ls *ls, struct dlm_rcom *rc, int nodeid)
127e7fd4179SDavid Teigland {
1289e971b71SDavid Teigland 	struct rcom_config *rf = (struct rcom_config *) rc->rc_buf;
1299e971b71SDavid Teigland 
1309e971b71SDavid Teigland 	if ((rc->rc_header.h_version & 0xFFFF0000) != DLM_HEADER_MAJOR) {
1319e971b71SDavid Teigland 		log_error(ls, "version mismatch: %x nodeid %d: %x",
1329e971b71SDavid Teigland 			  DLM_HEADER_MAJOR | DLM_HEADER_MINOR, nodeid,
1339e971b71SDavid Teigland 			  rc->rc_header.h_version);
1348b0e7b2cSDavid Teigland 		return -EPROTO;
1359e971b71SDavid Teigland 	}
1369e971b71SDavid Teigland 
13793ff2971SAl Viro 	if (le32_to_cpu(rf->rf_lvblen) != ls->ls_lvblen ||
13893ff2971SAl Viro 	    le32_to_cpu(rf->rf_lsflags) != ls->ls_exflags) {
139e7fd4179SDavid Teigland 		log_error(ls, "config mismatch: %d,%x nodeid %d: %d,%x",
14093ff2971SAl Viro 			  ls->ls_lvblen, ls->ls_exflags, nodeid,
14193ff2971SAl Viro 			  le32_to_cpu(rf->rf_lvblen),
14293ff2971SAl Viro 			  le32_to_cpu(rf->rf_lsflags));
1438b0e7b2cSDavid Teigland 		return -EPROTO;
144e7fd4179SDavid Teigland 	}
145e7fd4179SDavid Teigland 	return 0;
146e7fd4179SDavid Teigland }
147e7fd4179SDavid Teigland 
14898f176fbSDavid Teigland static void allow_sync_reply(struct dlm_ls *ls, uint64_t *new_seq)
14998f176fbSDavid Teigland {
15098f176fbSDavid Teigland 	spin_lock(&ls->ls_rcom_spin);
15198f176fbSDavid Teigland 	*new_seq = ++ls->ls_rcom_seq;
15298f176fbSDavid Teigland 	set_bit(LSFL_RCOM_WAIT, &ls->ls_flags);
15398f176fbSDavid Teigland 	spin_unlock(&ls->ls_rcom_spin);
15498f176fbSDavid Teigland }
15598f176fbSDavid Teigland 
15698f176fbSDavid Teigland static void disallow_sync_reply(struct dlm_ls *ls)
15798f176fbSDavid Teigland {
15898f176fbSDavid Teigland 	spin_lock(&ls->ls_rcom_spin);
15998f176fbSDavid Teigland 	clear_bit(LSFL_RCOM_WAIT, &ls->ls_flags);
16098f176fbSDavid Teigland 	clear_bit(LSFL_RCOM_READY, &ls->ls_flags);
16198f176fbSDavid Teigland 	spin_unlock(&ls->ls_rcom_spin);
16298f176fbSDavid Teigland }
16398f176fbSDavid Teigland 
164757a4271SDavid Teigland /*
165757a4271SDavid Teigland  * low nodeid gathers one slot value at a time from each node.
166757a4271SDavid Teigland  * it sets need_slots=0, and saves rf_our_slot returned from each
167757a4271SDavid Teigland  * rcom_config.
168757a4271SDavid Teigland  *
169757a4271SDavid Teigland  * other nodes gather all slot values at once from the low nodeid.
170757a4271SDavid Teigland  * they set need_slots=1, and ignore the rf_our_slot returned from each
171757a4271SDavid Teigland  * rcom_config.  they use the rf_num_slots returned from the low
172757a4271SDavid Teigland  * node's rcom_config.
173757a4271SDavid Teigland  */
174757a4271SDavid Teigland 
175757a4271SDavid Teigland int dlm_rcom_status(struct dlm_ls *ls, int nodeid, uint32_t status_flags)
176e7fd4179SDavid Teigland {
177e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
1788f2dc78dSAlexander Aring 	struct dlm_msg *msg;
179e7fd4179SDavid Teigland 	int error = 0;
180e7fd4179SDavid Teigland 
181faa0f267SDavid Teigland 	ls->ls_recover_nodeid = nodeid;
182e7fd4179SDavid Teigland 
183e7fd4179SDavid Teigland 	if (nodeid == dlm_our_nodeid()) {
1844007685cSAl Viro 		rc = ls->ls_recover_buf;
185e7fd4179SDavid Teigland 		rc->rc_result = dlm_recover_status(ls);
186e7fd4179SDavid Teigland 		goto out;
187e7fd4179SDavid Teigland 	}
188e7fd4179SDavid Teigland 
18959661212Stsutomu.owa@toshiba.co.jp retry:
190a070a91cSAlexander Aring 	error = create_rcom_stateless(ls, nodeid, DLM_RCOM_STATUS,
1918f2dc78dSAlexander Aring 				      sizeof(struct rcom_status), &rc, &msg);
192e7fd4179SDavid Teigland 	if (error)
193e7fd4179SDavid Teigland 		goto out;
19498f176fbSDavid Teigland 
195757a4271SDavid Teigland 	set_rcom_status(ls, (struct rcom_status *)rc->rc_buf, status_flags);
196757a4271SDavid Teigland 
19798f176fbSDavid Teigland 	allow_sync_reply(ls, &rc->rc_id);
198d10a0b88SAlexander Aring 	memset(ls->ls_recover_buf, 0, DLM_MAX_SOCKET_BUFSIZE);
199e7fd4179SDavid Teigland 
200*88aa023aSAlexander Aring 	send_rcom_stateless(msg, rc);
201e7fd4179SDavid Teigland 
202e7fd4179SDavid Teigland 	error = dlm_wait_function(ls, &rcom_response);
20398f176fbSDavid Teigland 	disallow_sync_reply(ls);
20459661212Stsutomu.owa@toshiba.co.jp 	if (error == -ETIMEDOUT)
20559661212Stsutomu.owa@toshiba.co.jp 		goto retry;
206e7fd4179SDavid Teigland 	if (error)
207e7fd4179SDavid Teigland 		goto out;
208e7fd4179SDavid Teigland 
2094007685cSAl Viro 	rc = ls->ls_recover_buf;
210e7fd4179SDavid Teigland 
211e7fd4179SDavid Teigland 	if (rc->rc_result == -ESRCH) {
212e7fd4179SDavid Teigland 		/* we pretend the remote lockspace exists with 0 status */
213e7fd4179SDavid Teigland 		log_debug(ls, "remote node %d not ready", nodeid);
214e7fd4179SDavid Teigland 		rc->rc_result = 0;
215757a4271SDavid Teigland 		error = 0;
216757a4271SDavid Teigland 	} else {
217757a4271SDavid Teigland 		error = check_rcom_config(ls, rc, nodeid);
218757a4271SDavid Teigland 	}
219757a4271SDavid Teigland 
220e7fd4179SDavid Teigland 	/* the caller looks at rc_result for the remote recovery status */
221e7fd4179SDavid Teigland  out:
222e7fd4179SDavid Teigland 	return error;
223e7fd4179SDavid Teigland }
224e7fd4179SDavid Teigland 
225e7fd4179SDavid Teigland static void receive_rcom_status(struct dlm_ls *ls, struct dlm_rcom *rc_in)
226e7fd4179SDavid Teigland {
227e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
228757a4271SDavid Teigland 	struct rcom_status *rs;
229757a4271SDavid Teigland 	uint32_t status;
230757a4271SDavid Teigland 	int nodeid = rc_in->rc_header.h_nodeid;
231757a4271SDavid Teigland 	int len = sizeof(struct rcom_config);
2328f2dc78dSAlexander Aring 	struct dlm_msg *msg;
233757a4271SDavid Teigland 	int num_slots = 0;
234757a4271SDavid Teigland 	int error;
235e7fd4179SDavid Teigland 
236757a4271SDavid Teigland 	if (!dlm_slots_version(&rc_in->rc_header)) {
237757a4271SDavid Teigland 		status = dlm_recover_status(ls);
238757a4271SDavid Teigland 		goto do_create;
239757a4271SDavid Teigland 	}
240757a4271SDavid Teigland 
241757a4271SDavid Teigland 	rs = (struct rcom_status *)rc_in->rc_buf;
242757a4271SDavid Teigland 
243c07127b4SNeale Ferguson 	if (!(le32_to_cpu(rs->rs_flags) & DLM_RSF_NEED_SLOTS)) {
244757a4271SDavid Teigland 		status = dlm_recover_status(ls);
245757a4271SDavid Teigland 		goto do_create;
246757a4271SDavid Teigland 	}
247757a4271SDavid Teigland 
248757a4271SDavid Teigland 	spin_lock(&ls->ls_recover_lock);
249757a4271SDavid Teigland 	status = ls->ls_recover_status;
250757a4271SDavid Teigland 	num_slots = ls->ls_num_slots;
251757a4271SDavid Teigland 	spin_unlock(&ls->ls_recover_lock);
252757a4271SDavid Teigland 	len += num_slots * sizeof(struct rcom_slot);
253757a4271SDavid Teigland 
254757a4271SDavid Teigland  do_create:
255a070a91cSAlexander Aring 	error = create_rcom_stateless(ls, nodeid, DLM_RCOM_STATUS_REPLY,
2568f2dc78dSAlexander Aring 				      len, &rc, &msg);
257e7fd4179SDavid Teigland 	if (error)
258e7fd4179SDavid Teigland 		return;
259757a4271SDavid Teigland 
2604a99c3d9SDavid Teigland 	rc->rc_id = rc_in->rc_id;
26138aa8b0cSDavid Teigland 	rc->rc_seq_reply = rc_in->rc_seq;
262757a4271SDavid Teigland 	rc->rc_result = status;
263e7fd4179SDavid Teigland 
264757a4271SDavid Teigland 	set_rcom_config(ls, (struct rcom_config *)rc->rc_buf, num_slots);
265757a4271SDavid Teigland 
266757a4271SDavid Teigland 	if (!num_slots)
267757a4271SDavid Teigland 		goto do_send;
268757a4271SDavid Teigland 
269757a4271SDavid Teigland 	spin_lock(&ls->ls_recover_lock);
270757a4271SDavid Teigland 	if (ls->ls_num_slots != num_slots) {
271757a4271SDavid Teigland 		spin_unlock(&ls->ls_recover_lock);
272757a4271SDavid Teigland 		log_debug(ls, "receive_rcom_status num_slots %d to %d",
273757a4271SDavid Teigland 			  num_slots, ls->ls_num_slots);
274757a4271SDavid Teigland 		rc->rc_result = 0;
275757a4271SDavid Teigland 		set_rcom_config(ls, (struct rcom_config *)rc->rc_buf, 0);
276757a4271SDavid Teigland 		goto do_send;
277757a4271SDavid Teigland 	}
278757a4271SDavid Teigland 
279757a4271SDavid Teigland 	dlm_slots_copy_out(ls, rc);
280757a4271SDavid Teigland 	spin_unlock(&ls->ls_recover_lock);
281757a4271SDavid Teigland 
282757a4271SDavid Teigland  do_send:
283*88aa023aSAlexander Aring 	send_rcom_stateless(msg, rc);
284e7fd4179SDavid Teigland }
285e7fd4179SDavid Teigland 
2864a99c3d9SDavid Teigland static void receive_sync_reply(struct dlm_ls *ls, struct dlm_rcom *rc_in)
287e7fd4179SDavid Teigland {
28898f176fbSDavid Teigland 	spin_lock(&ls->ls_rcom_spin);
28998f176fbSDavid Teigland 	if (!test_bit(LSFL_RCOM_WAIT, &ls->ls_flags) ||
29098f176fbSDavid Teigland 	    rc_in->rc_id != ls->ls_rcom_seq) {
29198f176fbSDavid Teigland 		log_debug(ls, "reject reply %d from %d seq %llx expect %llx",
29298f176fbSDavid Teigland 			  rc_in->rc_type, rc_in->rc_header.h_nodeid,
29357adf7eeSRyusuke Konishi 			  (unsigned long long)rc_in->rc_id,
29457adf7eeSRyusuke Konishi 			  (unsigned long long)ls->ls_rcom_seq);
29598f176fbSDavid Teigland 		goto out;
2964a99c3d9SDavid Teigland 	}
297e7fd4179SDavid Teigland 	memcpy(ls->ls_recover_buf, rc_in, rc_in->rc_header.h_length);
298e7fd4179SDavid Teigland 	set_bit(LSFL_RCOM_READY, &ls->ls_flags);
29998f176fbSDavid Teigland 	clear_bit(LSFL_RCOM_WAIT, &ls->ls_flags);
300e7fd4179SDavid Teigland 	wake_up(&ls->ls_wait_general);
30198f176fbSDavid Teigland  out:
30298f176fbSDavid Teigland 	spin_unlock(&ls->ls_rcom_spin);
303e7fd4179SDavid Teigland }
304e7fd4179SDavid Teigland 
305e7fd4179SDavid Teigland int dlm_rcom_names(struct dlm_ls *ls, int nodeid, char *last_name, int last_len)
306e7fd4179SDavid Teigland {
307e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
3088f2dc78dSAlexander Aring 	struct dlm_msg *msg;
3094007685cSAl Viro 	int error = 0;
310e7fd4179SDavid Teigland 
311faa0f267SDavid Teigland 	ls->ls_recover_nodeid = nodeid;
312e7fd4179SDavid Teigland 
31359661212Stsutomu.owa@toshiba.co.jp retry:
314a070a91cSAlexander Aring 	error = create_rcom_stateless(ls, nodeid, DLM_RCOM_NAMES, last_len,
3158f2dc78dSAlexander Aring 				      &rc, &msg);
316e7fd4179SDavid Teigland 	if (error)
317e7fd4179SDavid Teigland 		goto out;
318e7fd4179SDavid Teigland 	memcpy(rc->rc_buf, last_name, last_len);
31998f176fbSDavid Teigland 
32098f176fbSDavid Teigland 	allow_sync_reply(ls, &rc->rc_id);
321d10a0b88SAlexander Aring 	memset(ls->ls_recover_buf, 0, DLM_MAX_SOCKET_BUFSIZE);
322e7fd4179SDavid Teigland 
323*88aa023aSAlexander Aring 	send_rcom_stateless(msg, rc);
324e7fd4179SDavid Teigland 
325e7fd4179SDavid Teigland 	error = dlm_wait_function(ls, &rcom_response);
32698f176fbSDavid Teigland 	disallow_sync_reply(ls);
32759661212Stsutomu.owa@toshiba.co.jp 	if (error == -ETIMEDOUT)
32859661212Stsutomu.owa@toshiba.co.jp 		goto retry;
329e7fd4179SDavid Teigland  out:
330e7fd4179SDavid Teigland 	return error;
331e7fd4179SDavid Teigland }
332e7fd4179SDavid Teigland 
333e7fd4179SDavid Teigland static void receive_rcom_names(struct dlm_ls *ls, struct dlm_rcom *rc_in)
334e7fd4179SDavid Teigland {
335e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
33638aa8b0cSDavid Teigland 	int error, inlen, outlen, nodeid;
3378f2dc78dSAlexander Aring 	struct dlm_msg *msg;
338e7fd4179SDavid Teigland 
339e7fd4179SDavid Teigland 	nodeid = rc_in->rc_header.h_nodeid;
340e7fd4179SDavid Teigland 	inlen = rc_in->rc_header.h_length - sizeof(struct dlm_rcom);
341d10a0b88SAlexander Aring 	outlen = DLM_MAX_APP_BUFSIZE - sizeof(struct dlm_rcom);
342e7fd4179SDavid Teigland 
343a070a91cSAlexander Aring 	error = create_rcom_stateless(ls, nodeid, DLM_RCOM_NAMES_REPLY, outlen,
3448f2dc78dSAlexander Aring 				      &rc, &msg);
345e7fd4179SDavid Teigland 	if (error)
346e7fd4179SDavid Teigland 		return;
3474a99c3d9SDavid Teigland 	rc->rc_id = rc_in->rc_id;
34838aa8b0cSDavid Teigland 	rc->rc_seq_reply = rc_in->rc_seq;
349e7fd4179SDavid Teigland 
350e7fd4179SDavid Teigland 	dlm_copy_master_names(ls, rc_in->rc_buf, inlen, rc->rc_buf, outlen,
351e7fd4179SDavid Teigland 			      nodeid);
352*88aa023aSAlexander Aring 	send_rcom_stateless(msg, rc);
353e7fd4179SDavid Teigland }
354e7fd4179SDavid Teigland 
355e7fd4179SDavid Teigland int dlm_send_rcom_lookup(struct dlm_rsb *r, int dir_nodeid)
356e7fd4179SDavid Teigland {
357e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
358e7fd4179SDavid Teigland 	struct dlm_mhandle *mh;
359e7fd4179SDavid Teigland 	struct dlm_ls *ls = r->res_ls;
360e7fd4179SDavid Teigland 	int error;
361e7fd4179SDavid Teigland 
362e7fd4179SDavid Teigland 	error = create_rcom(ls, dir_nodeid, DLM_RCOM_LOOKUP, r->res_length,
363e7fd4179SDavid Teigland 			    &rc, &mh);
364e7fd4179SDavid Teigland 	if (error)
365e7fd4179SDavid Teigland 		goto out;
366e7fd4179SDavid Teigland 	memcpy(rc->rc_buf, r->res_name, r->res_length);
3671d7c484eSDavid Teigland 	rc->rc_id = (unsigned long) r->res_id;
368e7fd4179SDavid Teigland 
369*88aa023aSAlexander Aring 	send_rcom(mh, rc);
370e7fd4179SDavid Teigland  out:
371e7fd4179SDavid Teigland 	return error;
372e7fd4179SDavid Teigland }
373e7fd4179SDavid Teigland 
374e7fd4179SDavid Teigland static void receive_rcom_lookup(struct dlm_ls *ls, struct dlm_rcom *rc_in)
375e7fd4179SDavid Teigland {
376e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
377e7fd4179SDavid Teigland 	struct dlm_mhandle *mh;
378e7fd4179SDavid Teigland 	int error, ret_nodeid, nodeid = rc_in->rc_header.h_nodeid;
379e7fd4179SDavid Teigland 	int len = rc_in->rc_header.h_length - sizeof(struct dlm_rcom);
380e7fd4179SDavid Teigland 
3819250e523SDavid Teigland 	/* Old code would send this special id to trigger a debug dump. */
382c04fecb4SDavid Teigland 	if (rc_in->rc_id == 0xFFFFFFFF) {
383c04fecb4SDavid Teigland 		log_error(ls, "receive_rcom_lookup dump from %d", nodeid);
384c04fecb4SDavid Teigland 		dlm_dump_rsb_name(ls, rc_in->rc_buf, len);
385c04fecb4SDavid Teigland 		return;
386c04fecb4SDavid Teigland 	}
387c04fecb4SDavid Teigland 
388f6089981SColin Ian King 	error = create_rcom(ls, nodeid, DLM_RCOM_LOOKUP_REPLY, 0, &rc, &mh);
389f6089981SColin Ian King 	if (error)
390f6089981SColin Ian King 		return;
391f6089981SColin Ian King 
392c04fecb4SDavid Teigland 	error = dlm_master_lookup(ls, nodeid, rc_in->rc_buf, len,
393c04fecb4SDavid Teigland 				  DLM_LU_RECOVER_MASTER, &ret_nodeid, NULL);
394e7fd4179SDavid Teigland 	if (error)
395e7fd4179SDavid Teigland 		ret_nodeid = error;
396e7fd4179SDavid Teigland 	rc->rc_result = ret_nodeid;
397e7fd4179SDavid Teigland 	rc->rc_id = rc_in->rc_id;
39838aa8b0cSDavid Teigland 	rc->rc_seq_reply = rc_in->rc_seq;
399e7fd4179SDavid Teigland 
400*88aa023aSAlexander Aring 	send_rcom(mh, rc);
401e7fd4179SDavid Teigland }
402e7fd4179SDavid Teigland 
/* A DLM_RCOM_LOOKUP_REPLY is handed straight to dlm_recover_master_reply(). */
static void receive_rcom_lookup_reply(struct dlm_ls *ls, struct dlm_rcom *rc_in)
{
	dlm_recover_master_reply(ls, rc_in);
}
407e7fd4179SDavid Teigland 
408e7fd4179SDavid Teigland static void pack_rcom_lock(struct dlm_rsb *r, struct dlm_lkb *lkb,
409e7fd4179SDavid Teigland 			   struct rcom_lock *rl)
410e7fd4179SDavid Teigland {
411e7fd4179SDavid Teigland 	memset(rl, 0, sizeof(*rl));
412e7fd4179SDavid Teigland 
413163a1859SAl Viro 	rl->rl_ownpid = cpu_to_le32(lkb->lkb_ownpid);
414163a1859SAl Viro 	rl->rl_lkid = cpu_to_le32(lkb->lkb_id);
415163a1859SAl Viro 	rl->rl_exflags = cpu_to_le32(lkb->lkb_exflags);
416163a1859SAl Viro 	rl->rl_flags = cpu_to_le32(lkb->lkb_flags);
417163a1859SAl Viro 	rl->rl_lvbseq = cpu_to_le32(lkb->lkb_lvbseq);
418e7fd4179SDavid Teigland 	rl->rl_rqmode = lkb->lkb_rqmode;
419e7fd4179SDavid Teigland 	rl->rl_grmode = lkb->lkb_grmode;
420e7fd4179SDavid Teigland 	rl->rl_status = lkb->lkb_status;
421163a1859SAl Viro 	rl->rl_wait_type = cpu_to_le16(lkb->lkb_wait_type);
422e7fd4179SDavid Teigland 
423e5dae548SDavid Teigland 	if (lkb->lkb_bastfn)
4248304d6f2SDavid Teigland 		rl->rl_asts |= DLM_CB_BAST;
425e5dae548SDavid Teigland 	if (lkb->lkb_astfn)
4268304d6f2SDavid Teigland 		rl->rl_asts |= DLM_CB_CAST;
427e7fd4179SDavid Teigland 
428163a1859SAl Viro 	rl->rl_namelen = cpu_to_le16(r->res_length);
429e7fd4179SDavid Teigland 	memcpy(rl->rl_name, r->res_name, r->res_length);
430e7fd4179SDavid Teigland 
431e7fd4179SDavid Teigland 	/* FIXME: might we have an lvb without DLM_LKF_VALBLK set ?
432e7fd4179SDavid Teigland 	   If so, receive_rcom_lock_args() won't take this copy. */
433e7fd4179SDavid Teigland 
434e7fd4179SDavid Teigland 	if (lkb->lkb_lvbptr)
435e7fd4179SDavid Teigland 		memcpy(rl->rl_lvb, lkb->lkb_lvbptr, r->res_ls->ls_lvblen);
436e7fd4179SDavid Teigland }
437e7fd4179SDavid Teigland 
438e7fd4179SDavid Teigland int dlm_send_rcom_lock(struct dlm_rsb *r, struct dlm_lkb *lkb)
439e7fd4179SDavid Teigland {
440e7fd4179SDavid Teigland 	struct dlm_ls *ls = r->res_ls;
441e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
442e7fd4179SDavid Teigland 	struct dlm_mhandle *mh;
443e7fd4179SDavid Teigland 	struct rcom_lock *rl;
444e7fd4179SDavid Teigland 	int error, len = sizeof(struct rcom_lock);
445e7fd4179SDavid Teigland 
446e7fd4179SDavid Teigland 	if (lkb->lkb_lvbptr)
447e7fd4179SDavid Teigland 		len += ls->ls_lvblen;
448e7fd4179SDavid Teigland 
449e7fd4179SDavid Teigland 	error = create_rcom(ls, r->res_nodeid, DLM_RCOM_LOCK, len, &rc, &mh);
450e7fd4179SDavid Teigland 	if (error)
451e7fd4179SDavid Teigland 		goto out;
452e7fd4179SDavid Teigland 
453e7fd4179SDavid Teigland 	rl = (struct rcom_lock *) rc->rc_buf;
454e7fd4179SDavid Teigland 	pack_rcom_lock(r, lkb, rl);
455e7fd4179SDavid Teigland 	rc->rc_id = (unsigned long) r;
456e7fd4179SDavid Teigland 
457*88aa023aSAlexander Aring 	send_rcom(mh, rc);
458e7fd4179SDavid Teigland  out:
459e7fd4179SDavid Teigland 	return error;
460e7fd4179SDavid Teigland }
461e7fd4179SDavid Teigland 
462ae773d0bSAl Viro /* needs at least dlm_rcom + rcom_lock */
463e7fd4179SDavid Teigland static void receive_rcom_lock(struct dlm_ls *ls, struct dlm_rcom *rc_in)
464e7fd4179SDavid Teigland {
465e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
466e7fd4179SDavid Teigland 	struct dlm_mhandle *mh;
467e7fd4179SDavid Teigland 	int error, nodeid = rc_in->rc_header.h_nodeid;
468e7fd4179SDavid Teigland 
469e7fd4179SDavid Teigland 	dlm_recover_master_copy(ls, rc_in);
470e7fd4179SDavid Teigland 
471e7fd4179SDavid Teigland 	error = create_rcom(ls, nodeid, DLM_RCOM_LOCK_REPLY,
472e7fd4179SDavid Teigland 			    sizeof(struct rcom_lock), &rc, &mh);
473e7fd4179SDavid Teigland 	if (error)
474e7fd4179SDavid Teigland 		return;
475e7fd4179SDavid Teigland 
476e7fd4179SDavid Teigland 	/* We send back the same rcom_lock struct we received, but
477e7fd4179SDavid Teigland 	   dlm_recover_master_copy() has filled in rl_remid and rl_result */
478e7fd4179SDavid Teigland 
479e7fd4179SDavid Teigland 	memcpy(rc->rc_buf, rc_in->rc_buf, sizeof(struct rcom_lock));
480e7fd4179SDavid Teigland 	rc->rc_id = rc_in->rc_id;
48138aa8b0cSDavid Teigland 	rc->rc_seq_reply = rc_in->rc_seq;
482e7fd4179SDavid Teigland 
483*88aa023aSAlexander Aring 	send_rcom(mh, rc);
484e7fd4179SDavid Teigland }
485e7fd4179SDavid Teigland 
486c36258b5SDavid Teigland /* If the lockspace doesn't exist then still send a status message
487c36258b5SDavid Teigland    back; it's possible that it just doesn't have its global_id yet. */
488c36258b5SDavid Teigland 
489c36258b5SDavid Teigland int dlm_send_ls_not_ready(int nodeid, struct dlm_rcom *rc_in)
490e7fd4179SDavid Teigland {
491e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
4921babdb45SDavid Teigland 	struct rcom_config *rf;
493e7fd4179SDavid Teigland 	struct dlm_mhandle *mh;
494e7fd4179SDavid Teigland 	char *mb;
4951babdb45SDavid Teigland 	int mb_len = sizeof(struct dlm_rcom) + sizeof(struct rcom_config);
496e7fd4179SDavid Teigland 
497a070a91cSAlexander Aring 	mh = dlm_midcomms_get_mhandle(nodeid, mb_len, GFP_NOFS, &mb);
498e7fd4179SDavid Teigland 	if (!mh)
499e7fd4179SDavid Teigland 		return -ENOBUFS;
500e7fd4179SDavid Teigland 
501e7fd4179SDavid Teigland 	rc = (struct dlm_rcom *) mb;
502e7fd4179SDavid Teigland 
503e7fd4179SDavid Teigland 	rc->rc_header.h_version = (DLM_HEADER_MAJOR | DLM_HEADER_MINOR);
5048e2e4086SAlexander Aring 	rc->rc_header.u.h_lockspace = rc_in->rc_header.u.h_lockspace;
505e7fd4179SDavid Teigland 	rc->rc_header.h_nodeid = dlm_our_nodeid();
506e7fd4179SDavid Teigland 	rc->rc_header.h_length = mb_len;
507e7fd4179SDavid Teigland 	rc->rc_header.h_cmd = DLM_RCOM;
508e7fd4179SDavid Teigland 
509e7fd4179SDavid Teigland 	rc->rc_type = DLM_RCOM_STATUS_REPLY;
510f5888750SDavid Teigland 	rc->rc_id = rc_in->rc_id;
51138aa8b0cSDavid Teigland 	rc->rc_seq_reply = rc_in->rc_seq;
512e7fd4179SDavid Teigland 	rc->rc_result = -ESRCH;
513e7fd4179SDavid Teigland 
5141babdb45SDavid Teigland 	rf = (struct rcom_config *) rc->rc_buf;
51593ff2971SAl Viro 	rf->rf_lvblen = cpu_to_le32(~0U);
5161babdb45SDavid Teigland 
517e7fd4179SDavid Teigland 	dlm_rcom_out(rc);
518a070a91cSAlexander Aring 	dlm_midcomms_commit_mhandle(mh);
519e7fd4179SDavid Teigland 
520e7fd4179SDavid Teigland 	return 0;
521e7fd4179SDavid Teigland }
522e7fd4179SDavid Teigland 
/*
 * Ignore messages for stage Y before we set
 * recover_status bit for stage X:
 *
 * recover_status = 0
 *
 * dlm_recover_members()
 * - send nothing
 * - recv nothing
 * - ignore NAMES, NAMES_REPLY
 * - ignore LOOKUP, LOOKUP_REPLY
 * - ignore LOCK, LOCK_REPLY
 *
 * recover_status |= NODES
 *
 * dlm_recover_members_wait()
 *
 * dlm_recover_directory()
 * - send NAMES
 * - recv NAMES_REPLY
 * - ignore LOOKUP, LOOKUP_REPLY
 * - ignore LOCK, LOCK_REPLY
 *
 * recover_status |= DIR
 *
 * dlm_recover_directory_wait()
 *
 * dlm_recover_masters()
 * - send LOOKUP
 * - recv LOOKUP_REPLY
 *
 * dlm_recover_locks()
 * - send LOCK
 * - recv LOCK_REPLY
 *
 * recover_status |= LOCKS
 *
 * dlm_recover_locks_wait()
 *
 * recover_status |= DONE
 */
564c04fecb4SDavid Teigland 
565c36258b5SDavid Teigland /* Called by dlm_recv; corresponds to dlm_receive_message() but special
566e7fd4179SDavid Teigland    recovery-only comms are sent through here. */
567e7fd4179SDavid Teigland 
568c36258b5SDavid Teigland void dlm_receive_rcom(struct dlm_ls *ls, struct dlm_rcom *rc, int nodeid)
569e7fd4179SDavid Teigland {
570ae773d0bSAl Viro 	int lock_size = sizeof(struct dlm_rcom) + sizeof(struct rcom_lock);
571c04fecb4SDavid Teigland 	int stop, reply = 0, names = 0, lookup = 0, lock = 0;
5724875647aSDavid Teigland 	uint32_t status;
573d6e24788SDavid Teigland 	uint64_t seq;
574ae773d0bSAl Viro 
575d6e24788SDavid Teigland 	switch (rc->rc_type) {
576c04fecb4SDavid Teigland 	case DLM_RCOM_STATUS_REPLY:
577c04fecb4SDavid Teigland 		reply = 1;
578c04fecb4SDavid Teigland 		break;
579c04fecb4SDavid Teigland 	case DLM_RCOM_NAMES:
580c04fecb4SDavid Teigland 		names = 1;
581c04fecb4SDavid Teigland 		break;
582c04fecb4SDavid Teigland 	case DLM_RCOM_NAMES_REPLY:
583c04fecb4SDavid Teigland 		names = 1;
584c04fecb4SDavid Teigland 		reply = 1;
585c04fecb4SDavid Teigland 		break;
586c04fecb4SDavid Teigland 	case DLM_RCOM_LOOKUP:
587c04fecb4SDavid Teigland 		lookup = 1;
588c04fecb4SDavid Teigland 		break;
589c04fecb4SDavid Teigland 	case DLM_RCOM_LOOKUP_REPLY:
590c04fecb4SDavid Teigland 		lookup = 1;
591c04fecb4SDavid Teigland 		reply = 1;
592c04fecb4SDavid Teigland 		break;
5934875647aSDavid Teigland 	case DLM_RCOM_LOCK:
5944875647aSDavid Teigland 		lock = 1;
5954875647aSDavid Teigland 		break;
5964875647aSDavid Teigland 	case DLM_RCOM_LOCK_REPLY:
5974875647aSDavid Teigland 		lock = 1;
5984875647aSDavid Teigland 		reply = 1;
5994875647aSDavid Teigland 		break;
60090db4f8bSWu Bo 	}
601d6e24788SDavid Teigland 
602d6e24788SDavid Teigland 	spin_lock(&ls->ls_recover_lock);
6034875647aSDavid Teigland 	status = ls->ls_recover_status;
604475f230cSDavid Teigland 	stop = test_bit(LSFL_RECOVER_STOP, &ls->ls_flags);
605d6e24788SDavid Teigland 	seq = ls->ls_recover_seq;
606d6e24788SDavid Teigland 	spin_unlock(&ls->ls_recover_lock);
607d6e24788SDavid Teigland 
608c04fecb4SDavid Teigland 	if (stop && (rc->rc_type != DLM_RCOM_STATUS))
609c04fecb4SDavid Teigland 		goto ignore;
610c04fecb4SDavid Teigland 
611c04fecb4SDavid Teigland 	if (reply && (rc->rc_seq_reply != seq))
612c04fecb4SDavid Teigland 		goto ignore;
613c04fecb4SDavid Teigland 
614c04fecb4SDavid Teigland 	if (!(status & DLM_RS_NODES) && (names || lookup || lock))
615c04fecb4SDavid Teigland 		goto ignore;
616c04fecb4SDavid Teigland 
617c04fecb4SDavid Teigland 	if (!(status & DLM_RS_DIR) && (lookup || lock))
618c04fecb4SDavid Teigland 		goto ignore;
619e7fd4179SDavid Teigland 
620e7fd4179SDavid Teigland 	switch (rc->rc_type) {
621e7fd4179SDavid Teigland 	case DLM_RCOM_STATUS:
622e7fd4179SDavid Teigland 		receive_rcom_status(ls, rc);
623e7fd4179SDavid Teigland 		break;
624e7fd4179SDavid Teigland 
625e7fd4179SDavid Teigland 	case DLM_RCOM_NAMES:
626e7fd4179SDavid Teigland 		receive_rcom_names(ls, rc);
627e7fd4179SDavid Teigland 		break;
628e7fd4179SDavid Teigland 
629e7fd4179SDavid Teigland 	case DLM_RCOM_LOOKUP:
630e7fd4179SDavid Teigland 		receive_rcom_lookup(ls, rc);
631e7fd4179SDavid Teigland 		break;
632e7fd4179SDavid Teigland 
633e7fd4179SDavid Teigland 	case DLM_RCOM_LOCK:
634ae773d0bSAl Viro 		if (rc->rc_header.h_length < lock_size)
635ae773d0bSAl Viro 			goto Eshort;
636e7fd4179SDavid Teigland 		receive_rcom_lock(ls, rc);
637e7fd4179SDavid Teigland 		break;
638e7fd4179SDavid Teigland 
639e7fd4179SDavid Teigland 	case DLM_RCOM_STATUS_REPLY:
640dbcfc347SDavid Teigland 		receive_sync_reply(ls, rc);
641e7fd4179SDavid Teigland 		break;
642e7fd4179SDavid Teigland 
643e7fd4179SDavid Teigland 	case DLM_RCOM_NAMES_REPLY:
644dbcfc347SDavid Teigland 		receive_sync_reply(ls, rc);
645e7fd4179SDavid Teigland 		break;
646e7fd4179SDavid Teigland 
647e7fd4179SDavid Teigland 	case DLM_RCOM_LOOKUP_REPLY:
648e7fd4179SDavid Teigland 		receive_rcom_lookup_reply(ls, rc);
649e7fd4179SDavid Teigland 		break;
650e7fd4179SDavid Teigland 
651e7fd4179SDavid Teigland 	case DLM_RCOM_LOCK_REPLY:
652ae773d0bSAl Viro 		if (rc->rc_header.h_length < lock_size)
653ae773d0bSAl Viro 			goto Eshort;
654dbcfc347SDavid Teigland 		dlm_recover_process_copy(ls, rc);
655e7fd4179SDavid Teigland 		break;
656e7fd4179SDavid Teigland 
657e7fd4179SDavid Teigland 	default:
658dbcfc347SDavid Teigland 		log_error(ls, "receive_rcom bad type %d", rc->rc_type);
659e7fd4179SDavid Teigland 	}
660c04fecb4SDavid Teigland 	return;
661c04fecb4SDavid Teigland 
662c04fecb4SDavid Teigland ignore:
663c04fecb4SDavid Teigland 	log_limit(ls, "dlm_receive_rcom ignore msg %d "
664c04fecb4SDavid Teigland 		  "from %d %llu %llu recover seq %llu sts %x gen %u",
665c04fecb4SDavid Teigland 		   rc->rc_type,
666c04fecb4SDavid Teigland 		   nodeid,
667c04fecb4SDavid Teigland 		   (unsigned long long)rc->rc_seq,
668c04fecb4SDavid Teigland 		   (unsigned long long)rc->rc_seq_reply,
669c04fecb4SDavid Teigland 		   (unsigned long long)seq,
670c04fecb4SDavid Teigland 		   status, ls->ls_generation);
671c36258b5SDavid Teigland 	return;
672ae773d0bSAl Viro Eshort:
673c04fecb4SDavid Teigland 	log_error(ls, "recovery message %d from %d is too short",
674ae773d0bSAl Viro 		  rc->rc_type, nodeid);
675e7fd4179SDavid Teigland }
676e7fd4179SDavid Teigland 
677