xref: /openbmc/linux/fs/dlm/rcom.c (revision 8f2dc78dbc2010b497bb58e0460cb44c678a3c5b)
12522fe45SThomas Gleixner // SPDX-License-Identifier: GPL-2.0-only
2e7fd4179SDavid Teigland /******************************************************************************
3e7fd4179SDavid Teigland *******************************************************************************
4e7fd4179SDavid Teigland **
5e7fd4179SDavid Teigland **  Copyright (C) Sistina Software, Inc.  1997-2003  All rights reserved.
6dbcfc347SDavid Teigland **  Copyright (C) 2005-2008 Red Hat, Inc.  All rights reserved.
7e7fd4179SDavid Teigland **
8e7fd4179SDavid Teigland **
9e7fd4179SDavid Teigland *******************************************************************************
10e7fd4179SDavid Teigland ******************************************************************************/
11e7fd4179SDavid Teigland 
12e7fd4179SDavid Teigland #include "dlm_internal.h"
13e7fd4179SDavid Teigland #include "lockspace.h"
14e7fd4179SDavid Teigland #include "member.h"
15e7fd4179SDavid Teigland #include "lowcomms.h"
16e7fd4179SDavid Teigland #include "midcomms.h"
17e7fd4179SDavid Teigland #include "rcom.h"
18e7fd4179SDavid Teigland #include "recover.h"
19e7fd4179SDavid Teigland #include "dir.h"
20e7fd4179SDavid Teigland #include "config.h"
21e7fd4179SDavid Teigland #include "memory.h"
22e7fd4179SDavid Teigland #include "lock.h"
23e7fd4179SDavid Teigland #include "util.h"
24e7fd4179SDavid Teigland 
25e7fd4179SDavid Teigland static int rcom_response(struct dlm_ls *ls)
26e7fd4179SDavid Teigland {
27e7fd4179SDavid Teigland 	return test_bit(LSFL_RCOM_READY, &ls->ls_flags);
28e7fd4179SDavid Teigland }
29e7fd4179SDavid Teigland 
30a070a91cSAlexander Aring static void _create_rcom(struct dlm_ls *ls, int to_nodeid, int type, int len,
31a070a91cSAlexander Aring 			 struct dlm_rcom **rc_ret, char *mb, int mb_len)
32e7fd4179SDavid Teigland {
33e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
34e7fd4179SDavid Teigland 
35e7fd4179SDavid Teigland 	rc = (struct dlm_rcom *) mb;
36e7fd4179SDavid Teigland 
37e7fd4179SDavid Teigland 	rc->rc_header.h_version = (DLM_HEADER_MAJOR | DLM_HEADER_MINOR);
38e7fd4179SDavid Teigland 	rc->rc_header.h_lockspace = ls->ls_global_id;
39e7fd4179SDavid Teigland 	rc->rc_header.h_nodeid = dlm_our_nodeid();
40e7fd4179SDavid Teigland 	rc->rc_header.h_length = mb_len;
41e7fd4179SDavid Teigland 	rc->rc_header.h_cmd = DLM_RCOM;
42e7fd4179SDavid Teigland 
43e7fd4179SDavid Teigland 	rc->rc_type = type;
44e7fd4179SDavid Teigland 
4538aa8b0cSDavid Teigland 	spin_lock(&ls->ls_recover_lock);
4638aa8b0cSDavid Teigland 	rc->rc_seq = ls->ls_recover_seq;
4738aa8b0cSDavid Teigland 	spin_unlock(&ls->ls_recover_lock);
4838aa8b0cSDavid Teigland 
49e7fd4179SDavid Teigland 	*rc_ret = rc;
50a070a91cSAlexander Aring }
51a070a91cSAlexander Aring 
52a070a91cSAlexander Aring static int create_rcom(struct dlm_ls *ls, int to_nodeid, int type, int len,
53a070a91cSAlexander Aring 		       struct dlm_rcom **rc_ret, struct dlm_mhandle **mh_ret)
54a070a91cSAlexander Aring {
55a070a91cSAlexander Aring 	int mb_len = sizeof(struct dlm_rcom) + len;
56a070a91cSAlexander Aring 	struct dlm_mhandle *mh;
57a070a91cSAlexander Aring 	char *mb;
58a070a91cSAlexander Aring 
59a070a91cSAlexander Aring 	mh = dlm_midcomms_get_mhandle(to_nodeid, mb_len, GFP_NOFS, &mb);
60a070a91cSAlexander Aring 	if (!mh) {
61a070a91cSAlexander Aring 		log_print("%s to %d type %d len %d ENOBUFS",
62a070a91cSAlexander Aring 			  __func__, to_nodeid, type, len);
63a070a91cSAlexander Aring 		return -ENOBUFS;
64a070a91cSAlexander Aring 	}
65a070a91cSAlexander Aring 
66a070a91cSAlexander Aring 	_create_rcom(ls, to_nodeid, type, len, rc_ret, mb, mb_len);
67a070a91cSAlexander Aring 	*mh_ret = mh;
68e7fd4179SDavid Teigland 	return 0;
69e7fd4179SDavid Teigland }
70e7fd4179SDavid Teigland 
71a070a91cSAlexander Aring static int create_rcom_stateless(struct dlm_ls *ls, int to_nodeid, int type,
72a070a91cSAlexander Aring 				 int len, struct dlm_rcom **rc_ret,
73*8f2dc78dSAlexander Aring 				 struct dlm_msg **msg_ret)
74a070a91cSAlexander Aring {
75a070a91cSAlexander Aring 	int mb_len = sizeof(struct dlm_rcom) + len;
76*8f2dc78dSAlexander Aring 	struct dlm_msg *msg;
77a070a91cSAlexander Aring 	char *mb;
78a070a91cSAlexander Aring 
79*8f2dc78dSAlexander Aring 	msg = dlm_lowcomms_new_msg(to_nodeid, mb_len, GFP_NOFS, &mb,
80*8f2dc78dSAlexander Aring 				   NULL, NULL);
81*8f2dc78dSAlexander Aring 	if (!msg) {
82a070a91cSAlexander Aring 		log_print("create_rcom to %d type %d len %d ENOBUFS",
83a070a91cSAlexander Aring 			  to_nodeid, type, len);
84a070a91cSAlexander Aring 		return -ENOBUFS;
85a070a91cSAlexander Aring 	}
86a070a91cSAlexander Aring 
87a070a91cSAlexander Aring 	_create_rcom(ls, to_nodeid, type, len, rc_ret, mb, mb_len);
88*8f2dc78dSAlexander Aring 	*msg_ret = msg;
89a070a91cSAlexander Aring 	return 0;
90a070a91cSAlexander Aring }
91a070a91cSAlexander Aring 
/*
 * Common send-side preparation shared by send_rcom() and
 * send_rcom_stateless(): runs dlm_rcom_out() on the message.
 * @ls is currently unused.
 */
static void _send_rcom(struct dlm_ls *ls, struct dlm_rcom *rc)
{
	dlm_rcom_out(rc);
}
96a070a91cSAlexander Aring 
/*
 * Finish an rcom message obtained via create_rcom() and commit its
 * midcomms handle @mh.
 */
static void send_rcom(struct dlm_ls *ls, struct dlm_mhandle *mh,
		      struct dlm_rcom *rc)
{
	/* prepare the message first, then commit the handle */
	_send_rcom(ls, rc);

	dlm_midcomms_commit_mhandle(mh);
}
103a070a91cSAlexander Aring 
/*
 * Finish an rcom message obtained via create_rcom_stateless(), commit
 * the lowcomms message @msg and then drop it with dlm_lowcomms_put_msg().
 */
static void send_rcom_stateless(struct dlm_ls *ls, struct dlm_msg *msg,
				struct dlm_rcom *rc)
{
	_send_rcom(ls, rc);

	/* commit, then put the message */
	dlm_lowcomms_commit_msg(msg);
	dlm_lowcomms_put_msg(msg);
}
111e7fd4179SDavid Teigland 
112757a4271SDavid Teigland static void set_rcom_status(struct dlm_ls *ls, struct rcom_status *rs,
113757a4271SDavid Teigland 			    uint32_t flags)
114757a4271SDavid Teigland {
115757a4271SDavid Teigland 	rs->rs_flags = cpu_to_le32(flags);
116757a4271SDavid Teigland }
117757a4271SDavid Teigland 
118e7fd4179SDavid Teigland /* When replying to a status request, a node also sends back its
119e7fd4179SDavid Teigland    configuration values.  The requesting node then checks that the remote
120e7fd4179SDavid Teigland    node is configured the same way as itself. */
121e7fd4179SDavid Teigland 
122757a4271SDavid Teigland static void set_rcom_config(struct dlm_ls *ls, struct rcom_config *rf,
123757a4271SDavid Teigland 			    uint32_t num_slots)
124e7fd4179SDavid Teigland {
12593ff2971SAl Viro 	rf->rf_lvblen = cpu_to_le32(ls->ls_lvblen);
12693ff2971SAl Viro 	rf->rf_lsflags = cpu_to_le32(ls->ls_exflags);
127757a4271SDavid Teigland 
128757a4271SDavid Teigland 	rf->rf_our_slot = cpu_to_le16(ls->ls_slot);
129757a4271SDavid Teigland 	rf->rf_num_slots = cpu_to_le16(num_slots);
130757a4271SDavid Teigland 	rf->rf_generation =  cpu_to_le32(ls->ls_generation);
131e7fd4179SDavid Teigland }
132e7fd4179SDavid Teigland 
133757a4271SDavid Teigland static int check_rcom_config(struct dlm_ls *ls, struct dlm_rcom *rc, int nodeid)
134e7fd4179SDavid Teigland {
1359e971b71SDavid Teigland 	struct rcom_config *rf = (struct rcom_config *) rc->rc_buf;
1369e971b71SDavid Teigland 
1379e971b71SDavid Teigland 	if ((rc->rc_header.h_version & 0xFFFF0000) != DLM_HEADER_MAJOR) {
1389e971b71SDavid Teigland 		log_error(ls, "version mismatch: %x nodeid %d: %x",
1399e971b71SDavid Teigland 			  DLM_HEADER_MAJOR | DLM_HEADER_MINOR, nodeid,
1409e971b71SDavid Teigland 			  rc->rc_header.h_version);
1418b0e7b2cSDavid Teigland 		return -EPROTO;
1429e971b71SDavid Teigland 	}
1439e971b71SDavid Teigland 
14493ff2971SAl Viro 	if (le32_to_cpu(rf->rf_lvblen) != ls->ls_lvblen ||
14593ff2971SAl Viro 	    le32_to_cpu(rf->rf_lsflags) != ls->ls_exflags) {
146e7fd4179SDavid Teigland 		log_error(ls, "config mismatch: %d,%x nodeid %d: %d,%x",
14793ff2971SAl Viro 			  ls->ls_lvblen, ls->ls_exflags, nodeid,
14893ff2971SAl Viro 			  le32_to_cpu(rf->rf_lvblen),
14993ff2971SAl Viro 			  le32_to_cpu(rf->rf_lsflags));
1508b0e7b2cSDavid Teigland 		return -EPROTO;
151e7fd4179SDavid Teigland 	}
152e7fd4179SDavid Teigland 	return 0;
153e7fd4179SDavid Teigland }
154e7fd4179SDavid Teigland 
15598f176fbSDavid Teigland static void allow_sync_reply(struct dlm_ls *ls, uint64_t *new_seq)
15698f176fbSDavid Teigland {
15798f176fbSDavid Teigland 	spin_lock(&ls->ls_rcom_spin);
15898f176fbSDavid Teigland 	*new_seq = ++ls->ls_rcom_seq;
15998f176fbSDavid Teigland 	set_bit(LSFL_RCOM_WAIT, &ls->ls_flags);
16098f176fbSDavid Teigland 	spin_unlock(&ls->ls_rcom_spin);
16198f176fbSDavid Teigland }
16298f176fbSDavid Teigland 
16398f176fbSDavid Teigland static void disallow_sync_reply(struct dlm_ls *ls)
16498f176fbSDavid Teigland {
16598f176fbSDavid Teigland 	spin_lock(&ls->ls_rcom_spin);
16698f176fbSDavid Teigland 	clear_bit(LSFL_RCOM_WAIT, &ls->ls_flags);
16798f176fbSDavid Teigland 	clear_bit(LSFL_RCOM_READY, &ls->ls_flags);
16898f176fbSDavid Teigland 	spin_unlock(&ls->ls_rcom_spin);
16998f176fbSDavid Teigland }
17098f176fbSDavid Teigland 
171757a4271SDavid Teigland /*
172757a4271SDavid Teigland  * low nodeid gathers one slot value at a time from each node.
173757a4271SDavid Teigland  * it sets need_slots=0, and saves rf_our_slot returned from each
174757a4271SDavid Teigland  * rcom_config.
175757a4271SDavid Teigland  *
176757a4271SDavid Teigland  * other nodes gather all slot values at once from the low nodeid.
177757a4271SDavid Teigland  * they set need_slots=1, and ignore the rf_our_slot returned from each
178757a4271SDavid Teigland  * rcom_config.  they use the rf_num_slots returned from the low
179757a4271SDavid Teigland  * node's rcom_config.
180757a4271SDavid Teigland  */
181757a4271SDavid Teigland 
182757a4271SDavid Teigland int dlm_rcom_status(struct dlm_ls *ls, int nodeid, uint32_t status_flags)
183e7fd4179SDavid Teigland {
184e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
185*8f2dc78dSAlexander Aring 	struct dlm_msg *msg;
186e7fd4179SDavid Teigland 	int error = 0;
187e7fd4179SDavid Teigland 
188faa0f267SDavid Teigland 	ls->ls_recover_nodeid = nodeid;
189e7fd4179SDavid Teigland 
190e7fd4179SDavid Teigland 	if (nodeid == dlm_our_nodeid()) {
1914007685cSAl Viro 		rc = ls->ls_recover_buf;
192e7fd4179SDavid Teigland 		rc->rc_result = dlm_recover_status(ls);
193e7fd4179SDavid Teigland 		goto out;
194e7fd4179SDavid Teigland 	}
195e7fd4179SDavid Teigland 
19659661212Stsutomu.owa@toshiba.co.jp retry:
197a070a91cSAlexander Aring 	error = create_rcom_stateless(ls, nodeid, DLM_RCOM_STATUS,
198*8f2dc78dSAlexander Aring 				      sizeof(struct rcom_status), &rc, &msg);
199e7fd4179SDavid Teigland 	if (error)
200e7fd4179SDavid Teigland 		goto out;
20198f176fbSDavid Teigland 
202757a4271SDavid Teigland 	set_rcom_status(ls, (struct rcom_status *)rc->rc_buf, status_flags);
203757a4271SDavid Teigland 
20498f176fbSDavid Teigland 	allow_sync_reply(ls, &rc->rc_id);
2059f8f9c77SAlexander Aring 	memset(ls->ls_recover_buf, 0, LOWCOMMS_MAX_TX_BUFFER_LEN);
206e7fd4179SDavid Teigland 
207*8f2dc78dSAlexander Aring 	send_rcom_stateless(ls, msg, rc);
208e7fd4179SDavid Teigland 
209e7fd4179SDavid Teigland 	error = dlm_wait_function(ls, &rcom_response);
21098f176fbSDavid Teigland 	disallow_sync_reply(ls);
21159661212Stsutomu.owa@toshiba.co.jp 	if (error == -ETIMEDOUT)
21259661212Stsutomu.owa@toshiba.co.jp 		goto retry;
213e7fd4179SDavid Teigland 	if (error)
214e7fd4179SDavid Teigland 		goto out;
215e7fd4179SDavid Teigland 
2164007685cSAl Viro 	rc = ls->ls_recover_buf;
217e7fd4179SDavid Teigland 
218e7fd4179SDavid Teigland 	if (rc->rc_result == -ESRCH) {
219e7fd4179SDavid Teigland 		/* we pretend the remote lockspace exists with 0 status */
220e7fd4179SDavid Teigland 		log_debug(ls, "remote node %d not ready", nodeid);
221e7fd4179SDavid Teigland 		rc->rc_result = 0;
222757a4271SDavid Teigland 		error = 0;
223757a4271SDavid Teigland 	} else {
224757a4271SDavid Teigland 		error = check_rcom_config(ls, rc, nodeid);
225757a4271SDavid Teigland 	}
226757a4271SDavid Teigland 
227e7fd4179SDavid Teigland 	/* the caller looks at rc_result for the remote recovery status */
228e7fd4179SDavid Teigland  out:
229e7fd4179SDavid Teigland 	return error;
230e7fd4179SDavid Teigland }
231e7fd4179SDavid Teigland 
232e7fd4179SDavid Teigland static void receive_rcom_status(struct dlm_ls *ls, struct dlm_rcom *rc_in)
233e7fd4179SDavid Teigland {
234e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
235757a4271SDavid Teigland 	struct rcom_status *rs;
236757a4271SDavid Teigland 	uint32_t status;
237757a4271SDavid Teigland 	int nodeid = rc_in->rc_header.h_nodeid;
238757a4271SDavid Teigland 	int len = sizeof(struct rcom_config);
239*8f2dc78dSAlexander Aring 	struct dlm_msg *msg;
240757a4271SDavid Teigland 	int num_slots = 0;
241757a4271SDavid Teigland 	int error;
242e7fd4179SDavid Teigland 
243757a4271SDavid Teigland 	if (!dlm_slots_version(&rc_in->rc_header)) {
244757a4271SDavid Teigland 		status = dlm_recover_status(ls);
245757a4271SDavid Teigland 		goto do_create;
246757a4271SDavid Teigland 	}
247757a4271SDavid Teigland 
248757a4271SDavid Teigland 	rs = (struct rcom_status *)rc_in->rc_buf;
249757a4271SDavid Teigland 
250c07127b4SNeale Ferguson 	if (!(le32_to_cpu(rs->rs_flags) & DLM_RSF_NEED_SLOTS)) {
251757a4271SDavid Teigland 		status = dlm_recover_status(ls);
252757a4271SDavid Teigland 		goto do_create;
253757a4271SDavid Teigland 	}
254757a4271SDavid Teigland 
255757a4271SDavid Teigland 	spin_lock(&ls->ls_recover_lock);
256757a4271SDavid Teigland 	status = ls->ls_recover_status;
257757a4271SDavid Teigland 	num_slots = ls->ls_num_slots;
258757a4271SDavid Teigland 	spin_unlock(&ls->ls_recover_lock);
259757a4271SDavid Teigland 	len += num_slots * sizeof(struct rcom_slot);
260757a4271SDavid Teigland 
261757a4271SDavid Teigland  do_create:
262a070a91cSAlexander Aring 	error = create_rcom_stateless(ls, nodeid, DLM_RCOM_STATUS_REPLY,
263*8f2dc78dSAlexander Aring 				      len, &rc, &msg);
264e7fd4179SDavid Teigland 	if (error)
265e7fd4179SDavid Teigland 		return;
266757a4271SDavid Teigland 
2674a99c3d9SDavid Teigland 	rc->rc_id = rc_in->rc_id;
26838aa8b0cSDavid Teigland 	rc->rc_seq_reply = rc_in->rc_seq;
269757a4271SDavid Teigland 	rc->rc_result = status;
270e7fd4179SDavid Teigland 
271757a4271SDavid Teigland 	set_rcom_config(ls, (struct rcom_config *)rc->rc_buf, num_slots);
272757a4271SDavid Teigland 
273757a4271SDavid Teigland 	if (!num_slots)
274757a4271SDavid Teigland 		goto do_send;
275757a4271SDavid Teigland 
276757a4271SDavid Teigland 	spin_lock(&ls->ls_recover_lock);
277757a4271SDavid Teigland 	if (ls->ls_num_slots != num_slots) {
278757a4271SDavid Teigland 		spin_unlock(&ls->ls_recover_lock);
279757a4271SDavid Teigland 		log_debug(ls, "receive_rcom_status num_slots %d to %d",
280757a4271SDavid Teigland 			  num_slots, ls->ls_num_slots);
281757a4271SDavid Teigland 		rc->rc_result = 0;
282757a4271SDavid Teigland 		set_rcom_config(ls, (struct rcom_config *)rc->rc_buf, 0);
283757a4271SDavid Teigland 		goto do_send;
284757a4271SDavid Teigland 	}
285757a4271SDavid Teigland 
286757a4271SDavid Teigland 	dlm_slots_copy_out(ls, rc);
287757a4271SDavid Teigland 	spin_unlock(&ls->ls_recover_lock);
288757a4271SDavid Teigland 
289757a4271SDavid Teigland  do_send:
290*8f2dc78dSAlexander Aring 	send_rcom_stateless(ls, msg, rc);
291e7fd4179SDavid Teigland }
292e7fd4179SDavid Teigland 
2934a99c3d9SDavid Teigland static void receive_sync_reply(struct dlm_ls *ls, struct dlm_rcom *rc_in)
294e7fd4179SDavid Teigland {
29598f176fbSDavid Teigland 	spin_lock(&ls->ls_rcom_spin);
29698f176fbSDavid Teigland 	if (!test_bit(LSFL_RCOM_WAIT, &ls->ls_flags) ||
29798f176fbSDavid Teigland 	    rc_in->rc_id != ls->ls_rcom_seq) {
29898f176fbSDavid Teigland 		log_debug(ls, "reject reply %d from %d seq %llx expect %llx",
29998f176fbSDavid Teigland 			  rc_in->rc_type, rc_in->rc_header.h_nodeid,
30057adf7eeSRyusuke Konishi 			  (unsigned long long)rc_in->rc_id,
30157adf7eeSRyusuke Konishi 			  (unsigned long long)ls->ls_rcom_seq);
30298f176fbSDavid Teigland 		goto out;
3034a99c3d9SDavid Teigland 	}
304e7fd4179SDavid Teigland 	memcpy(ls->ls_recover_buf, rc_in, rc_in->rc_header.h_length);
305e7fd4179SDavid Teigland 	set_bit(LSFL_RCOM_READY, &ls->ls_flags);
30698f176fbSDavid Teigland 	clear_bit(LSFL_RCOM_WAIT, &ls->ls_flags);
307e7fd4179SDavid Teigland 	wake_up(&ls->ls_wait_general);
30898f176fbSDavid Teigland  out:
30998f176fbSDavid Teigland 	spin_unlock(&ls->ls_rcom_spin);
310e7fd4179SDavid Teigland }
311e7fd4179SDavid Teigland 
312e7fd4179SDavid Teigland int dlm_rcom_names(struct dlm_ls *ls, int nodeid, char *last_name, int last_len)
313e7fd4179SDavid Teigland {
314e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
315*8f2dc78dSAlexander Aring 	struct dlm_msg *msg;
3164007685cSAl Viro 	int error = 0;
317e7fd4179SDavid Teigland 
318faa0f267SDavid Teigland 	ls->ls_recover_nodeid = nodeid;
319e7fd4179SDavid Teigland 
32059661212Stsutomu.owa@toshiba.co.jp retry:
321a070a91cSAlexander Aring 	error = create_rcom_stateless(ls, nodeid, DLM_RCOM_NAMES, last_len,
322*8f2dc78dSAlexander Aring 				      &rc, &msg);
323e7fd4179SDavid Teigland 	if (error)
324e7fd4179SDavid Teigland 		goto out;
325e7fd4179SDavid Teigland 	memcpy(rc->rc_buf, last_name, last_len);
32698f176fbSDavid Teigland 
32798f176fbSDavid Teigland 	allow_sync_reply(ls, &rc->rc_id);
3289f8f9c77SAlexander Aring 	memset(ls->ls_recover_buf, 0, LOWCOMMS_MAX_TX_BUFFER_LEN);
329e7fd4179SDavid Teigland 
330*8f2dc78dSAlexander Aring 	send_rcom_stateless(ls, msg, rc);
331e7fd4179SDavid Teigland 
332e7fd4179SDavid Teigland 	error = dlm_wait_function(ls, &rcom_response);
33398f176fbSDavid Teigland 	disallow_sync_reply(ls);
33459661212Stsutomu.owa@toshiba.co.jp 	if (error == -ETIMEDOUT)
33559661212Stsutomu.owa@toshiba.co.jp 		goto retry;
336e7fd4179SDavid Teigland  out:
337e7fd4179SDavid Teigland 	return error;
338e7fd4179SDavid Teigland }
339e7fd4179SDavid Teigland 
340e7fd4179SDavid Teigland static void receive_rcom_names(struct dlm_ls *ls, struct dlm_rcom *rc_in)
341e7fd4179SDavid Teigland {
342e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
34338aa8b0cSDavid Teigland 	int error, inlen, outlen, nodeid;
344*8f2dc78dSAlexander Aring 	struct dlm_msg *msg;
345e7fd4179SDavid Teigland 
346e7fd4179SDavid Teigland 	nodeid = rc_in->rc_header.h_nodeid;
347e7fd4179SDavid Teigland 	inlen = rc_in->rc_header.h_length - sizeof(struct dlm_rcom);
3489f8f9c77SAlexander Aring 	outlen = LOWCOMMS_MAX_TX_BUFFER_LEN - sizeof(struct dlm_rcom);
349e7fd4179SDavid Teigland 
350a070a91cSAlexander Aring 	error = create_rcom_stateless(ls, nodeid, DLM_RCOM_NAMES_REPLY, outlen,
351*8f2dc78dSAlexander Aring 				      &rc, &msg);
352e7fd4179SDavid Teigland 	if (error)
353e7fd4179SDavid Teigland 		return;
3544a99c3d9SDavid Teigland 	rc->rc_id = rc_in->rc_id;
35538aa8b0cSDavid Teigland 	rc->rc_seq_reply = rc_in->rc_seq;
356e7fd4179SDavid Teigland 
357e7fd4179SDavid Teigland 	dlm_copy_master_names(ls, rc_in->rc_buf, inlen, rc->rc_buf, outlen,
358e7fd4179SDavid Teigland 			      nodeid);
359*8f2dc78dSAlexander Aring 	send_rcom_stateless(ls, msg, rc);
360e7fd4179SDavid Teigland }
361e7fd4179SDavid Teigland 
362e7fd4179SDavid Teigland int dlm_send_rcom_lookup(struct dlm_rsb *r, int dir_nodeid)
363e7fd4179SDavid Teigland {
364e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
365e7fd4179SDavid Teigland 	struct dlm_mhandle *mh;
366e7fd4179SDavid Teigland 	struct dlm_ls *ls = r->res_ls;
367e7fd4179SDavid Teigland 	int error;
368e7fd4179SDavid Teigland 
369e7fd4179SDavid Teigland 	error = create_rcom(ls, dir_nodeid, DLM_RCOM_LOOKUP, r->res_length,
370e7fd4179SDavid Teigland 			    &rc, &mh);
371e7fd4179SDavid Teigland 	if (error)
372e7fd4179SDavid Teigland 		goto out;
373e7fd4179SDavid Teigland 	memcpy(rc->rc_buf, r->res_name, r->res_length);
3741d7c484eSDavid Teigland 	rc->rc_id = (unsigned long) r->res_id;
375e7fd4179SDavid Teigland 
376e7fd4179SDavid Teigland 	send_rcom(ls, mh, rc);
377e7fd4179SDavid Teigland  out:
378e7fd4179SDavid Teigland 	return error;
379e7fd4179SDavid Teigland }
380e7fd4179SDavid Teigland 
381e7fd4179SDavid Teigland static void receive_rcom_lookup(struct dlm_ls *ls, struct dlm_rcom *rc_in)
382e7fd4179SDavid Teigland {
383e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
384e7fd4179SDavid Teigland 	struct dlm_mhandle *mh;
385e7fd4179SDavid Teigland 	int error, ret_nodeid, nodeid = rc_in->rc_header.h_nodeid;
386e7fd4179SDavid Teigland 	int len = rc_in->rc_header.h_length - sizeof(struct dlm_rcom);
387e7fd4179SDavid Teigland 
388e7fd4179SDavid Teigland 	error = create_rcom(ls, nodeid, DLM_RCOM_LOOKUP_REPLY, 0, &rc, &mh);
389e7fd4179SDavid Teigland 	if (error)
390e7fd4179SDavid Teigland 		return;
391e7fd4179SDavid Teigland 
3929250e523SDavid Teigland 	/* Old code would send this special id to trigger a debug dump. */
393c04fecb4SDavid Teigland 	if (rc_in->rc_id == 0xFFFFFFFF) {
394c04fecb4SDavid Teigland 		log_error(ls, "receive_rcom_lookup dump from %d", nodeid);
395c04fecb4SDavid Teigland 		dlm_dump_rsb_name(ls, rc_in->rc_buf, len);
396c04fecb4SDavid Teigland 		return;
397c04fecb4SDavid Teigland 	}
398c04fecb4SDavid Teigland 
399c04fecb4SDavid Teigland 	error = dlm_master_lookup(ls, nodeid, rc_in->rc_buf, len,
400c04fecb4SDavid Teigland 				  DLM_LU_RECOVER_MASTER, &ret_nodeid, NULL);
401e7fd4179SDavid Teigland 	if (error)
402e7fd4179SDavid Teigland 		ret_nodeid = error;
403e7fd4179SDavid Teigland 	rc->rc_result = ret_nodeid;
404e7fd4179SDavid Teigland 	rc->rc_id = rc_in->rc_id;
40538aa8b0cSDavid Teigland 	rc->rc_seq_reply = rc_in->rc_seq;
406e7fd4179SDavid Teigland 
407e7fd4179SDavid Teigland 	send_rcom(ls, mh, rc);
408e7fd4179SDavid Teigland }
409e7fd4179SDavid Teigland 
/*
 * Handle a DLM_RCOM_LOOKUP_REPLY by passing it on to
 * dlm_recover_master_reply().
 */
static void receive_rcom_lookup_reply(struct dlm_ls *ls, struct dlm_rcom *rc_in)
{
	dlm_recover_master_reply(ls, rc_in);
}
414e7fd4179SDavid Teigland 
415e7fd4179SDavid Teigland static void pack_rcom_lock(struct dlm_rsb *r, struct dlm_lkb *lkb,
416e7fd4179SDavid Teigland 			   struct rcom_lock *rl)
417e7fd4179SDavid Teigland {
418e7fd4179SDavid Teigland 	memset(rl, 0, sizeof(*rl));
419e7fd4179SDavid Teigland 
420163a1859SAl Viro 	rl->rl_ownpid = cpu_to_le32(lkb->lkb_ownpid);
421163a1859SAl Viro 	rl->rl_lkid = cpu_to_le32(lkb->lkb_id);
422163a1859SAl Viro 	rl->rl_exflags = cpu_to_le32(lkb->lkb_exflags);
423163a1859SAl Viro 	rl->rl_flags = cpu_to_le32(lkb->lkb_flags);
424163a1859SAl Viro 	rl->rl_lvbseq = cpu_to_le32(lkb->lkb_lvbseq);
425e7fd4179SDavid Teigland 	rl->rl_rqmode = lkb->lkb_rqmode;
426e7fd4179SDavid Teigland 	rl->rl_grmode = lkb->lkb_grmode;
427e7fd4179SDavid Teigland 	rl->rl_status = lkb->lkb_status;
428163a1859SAl Viro 	rl->rl_wait_type = cpu_to_le16(lkb->lkb_wait_type);
429e7fd4179SDavid Teigland 
430e5dae548SDavid Teigland 	if (lkb->lkb_bastfn)
4318304d6f2SDavid Teigland 		rl->rl_asts |= DLM_CB_BAST;
432e5dae548SDavid Teigland 	if (lkb->lkb_astfn)
4338304d6f2SDavid Teigland 		rl->rl_asts |= DLM_CB_CAST;
434e7fd4179SDavid Teigland 
435163a1859SAl Viro 	rl->rl_namelen = cpu_to_le16(r->res_length);
436e7fd4179SDavid Teigland 	memcpy(rl->rl_name, r->res_name, r->res_length);
437e7fd4179SDavid Teigland 
438e7fd4179SDavid Teigland 	/* FIXME: might we have an lvb without DLM_LKF_VALBLK set ?
439e7fd4179SDavid Teigland 	   If so, receive_rcom_lock_args() won't take this copy. */
440e7fd4179SDavid Teigland 
441e7fd4179SDavid Teigland 	if (lkb->lkb_lvbptr)
442e7fd4179SDavid Teigland 		memcpy(rl->rl_lvb, lkb->lkb_lvbptr, r->res_ls->ls_lvblen);
443e7fd4179SDavid Teigland }
444e7fd4179SDavid Teigland 
445e7fd4179SDavid Teigland int dlm_send_rcom_lock(struct dlm_rsb *r, struct dlm_lkb *lkb)
446e7fd4179SDavid Teigland {
447e7fd4179SDavid Teigland 	struct dlm_ls *ls = r->res_ls;
448e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
449e7fd4179SDavid Teigland 	struct dlm_mhandle *mh;
450e7fd4179SDavid Teigland 	struct rcom_lock *rl;
451e7fd4179SDavid Teigland 	int error, len = sizeof(struct rcom_lock);
452e7fd4179SDavid Teigland 
453e7fd4179SDavid Teigland 	if (lkb->lkb_lvbptr)
454e7fd4179SDavid Teigland 		len += ls->ls_lvblen;
455e7fd4179SDavid Teigland 
456e7fd4179SDavid Teigland 	error = create_rcom(ls, r->res_nodeid, DLM_RCOM_LOCK, len, &rc, &mh);
457e7fd4179SDavid Teigland 	if (error)
458e7fd4179SDavid Teigland 		goto out;
459e7fd4179SDavid Teigland 
460e7fd4179SDavid Teigland 	rl = (struct rcom_lock *) rc->rc_buf;
461e7fd4179SDavid Teigland 	pack_rcom_lock(r, lkb, rl);
462e7fd4179SDavid Teigland 	rc->rc_id = (unsigned long) r;
463e7fd4179SDavid Teigland 
464e7fd4179SDavid Teigland 	send_rcom(ls, mh, rc);
465e7fd4179SDavid Teigland  out:
466e7fd4179SDavid Teigland 	return error;
467e7fd4179SDavid Teigland }
468e7fd4179SDavid Teigland 
469ae773d0bSAl Viro /* needs at least dlm_rcom + rcom_lock */
470e7fd4179SDavid Teigland static void receive_rcom_lock(struct dlm_ls *ls, struct dlm_rcom *rc_in)
471e7fd4179SDavid Teigland {
472e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
473e7fd4179SDavid Teigland 	struct dlm_mhandle *mh;
474e7fd4179SDavid Teigland 	int error, nodeid = rc_in->rc_header.h_nodeid;
475e7fd4179SDavid Teigland 
476e7fd4179SDavid Teigland 	dlm_recover_master_copy(ls, rc_in);
477e7fd4179SDavid Teigland 
478e7fd4179SDavid Teigland 	error = create_rcom(ls, nodeid, DLM_RCOM_LOCK_REPLY,
479e7fd4179SDavid Teigland 			    sizeof(struct rcom_lock), &rc, &mh);
480e7fd4179SDavid Teigland 	if (error)
481e7fd4179SDavid Teigland 		return;
482e7fd4179SDavid Teigland 
483e7fd4179SDavid Teigland 	/* We send back the same rcom_lock struct we received, but
484e7fd4179SDavid Teigland 	   dlm_recover_master_copy() has filled in rl_remid and rl_result */
485e7fd4179SDavid Teigland 
486e7fd4179SDavid Teigland 	memcpy(rc->rc_buf, rc_in->rc_buf, sizeof(struct rcom_lock));
487e7fd4179SDavid Teigland 	rc->rc_id = rc_in->rc_id;
48838aa8b0cSDavid Teigland 	rc->rc_seq_reply = rc_in->rc_seq;
489e7fd4179SDavid Teigland 
490e7fd4179SDavid Teigland 	send_rcom(ls, mh, rc);
491e7fd4179SDavid Teigland }
492e7fd4179SDavid Teigland 
493c36258b5SDavid Teigland /* If the lockspace doesn't exist then still send a status message
494c36258b5SDavid Teigland    back; it's possible that it just doesn't have its global_id yet. */
495c36258b5SDavid Teigland 
496c36258b5SDavid Teigland int dlm_send_ls_not_ready(int nodeid, struct dlm_rcom *rc_in)
497e7fd4179SDavid Teigland {
498e7fd4179SDavid Teigland 	struct dlm_rcom *rc;
4991babdb45SDavid Teigland 	struct rcom_config *rf;
500e7fd4179SDavid Teigland 	struct dlm_mhandle *mh;
501e7fd4179SDavid Teigland 	char *mb;
5021babdb45SDavid Teigland 	int mb_len = sizeof(struct dlm_rcom) + sizeof(struct rcom_config);
503e7fd4179SDavid Teigland 
504a070a91cSAlexander Aring 	mh = dlm_midcomms_get_mhandle(nodeid, mb_len, GFP_NOFS, &mb);
505e7fd4179SDavid Teigland 	if (!mh)
506e7fd4179SDavid Teigland 		return -ENOBUFS;
507e7fd4179SDavid Teigland 
508e7fd4179SDavid Teigland 	rc = (struct dlm_rcom *) mb;
509e7fd4179SDavid Teigland 
510e7fd4179SDavid Teigland 	rc->rc_header.h_version = (DLM_HEADER_MAJOR | DLM_HEADER_MINOR);
511e7fd4179SDavid Teigland 	rc->rc_header.h_lockspace = rc_in->rc_header.h_lockspace;
512e7fd4179SDavid Teigland 	rc->rc_header.h_nodeid = dlm_our_nodeid();
513e7fd4179SDavid Teigland 	rc->rc_header.h_length = mb_len;
514e7fd4179SDavid Teigland 	rc->rc_header.h_cmd = DLM_RCOM;
515e7fd4179SDavid Teigland 
516e7fd4179SDavid Teigland 	rc->rc_type = DLM_RCOM_STATUS_REPLY;
517f5888750SDavid Teigland 	rc->rc_id = rc_in->rc_id;
51838aa8b0cSDavid Teigland 	rc->rc_seq_reply = rc_in->rc_seq;
519e7fd4179SDavid Teigland 	rc->rc_result = -ESRCH;
520e7fd4179SDavid Teigland 
5211babdb45SDavid Teigland 	rf = (struct rcom_config *) rc->rc_buf;
52293ff2971SAl Viro 	rf->rf_lvblen = cpu_to_le32(~0U);
5231babdb45SDavid Teigland 
524e7fd4179SDavid Teigland 	dlm_rcom_out(rc);
525a070a91cSAlexander Aring 	dlm_midcomms_commit_mhandle(mh);
526e7fd4179SDavid Teigland 
527e7fd4179SDavid Teigland 	return 0;
528e7fd4179SDavid Teigland }
529e7fd4179SDavid Teigland 
530c04fecb4SDavid Teigland /*
531c04fecb4SDavid Teigland  * Ignore messages for stage Y before we set
532c04fecb4SDavid Teigland  * recover_status bit for stage X:
533c04fecb4SDavid Teigland  *
534c04fecb4SDavid Teigland  * recover_status = 0
535c04fecb4SDavid Teigland  *
536c04fecb4SDavid Teigland  * dlm_recover_members()
537c04fecb4SDavid Teigland  * - send nothing
538c04fecb4SDavid Teigland  * - recv nothing
539c04fecb4SDavid Teigland  * - ignore NAMES, NAMES_REPLY
540c04fecb4SDavid Teigland  * - ignore LOOKUP, LOOKUP_REPLY
541c04fecb4SDavid Teigland  * - ignore LOCK, LOCK_REPLY
542c04fecb4SDavid Teigland  *
543c04fecb4SDavid Teigland  * recover_status |= NODES
544c04fecb4SDavid Teigland  *
545c04fecb4SDavid Teigland  * dlm_recover_members_wait()
546c04fecb4SDavid Teigland  *
547c04fecb4SDavid Teigland  * dlm_recover_directory()
548c04fecb4SDavid Teigland  * - send NAMES
549c04fecb4SDavid Teigland  * - recv NAMES_REPLY
550c04fecb4SDavid Teigland  * - ignore LOOKUP, LOOKUP_REPLY
551c04fecb4SDavid Teigland  * - ignore LOCK, LOCK_REPLY
552c04fecb4SDavid Teigland  *
553c04fecb4SDavid Teigland  * recover_status |= DIR
554c04fecb4SDavid Teigland  *
555c04fecb4SDavid Teigland  * dlm_recover_directory_wait()
556c04fecb4SDavid Teigland  *
557c04fecb4SDavid Teigland  * dlm_recover_masters()
558c04fecb4SDavid Teigland  * - send LOOKUP
559c04fecb4SDavid Teigland  * - recv LOOKUP_REPLY
560c04fecb4SDavid Teigland  *
561c04fecb4SDavid Teigland  * dlm_recover_locks()
562c04fecb4SDavid Teigland  * - send LOCKS
563c04fecb4SDavid Teigland  * - recv LOCKS_REPLY
564c04fecb4SDavid Teigland  *
565c04fecb4SDavid Teigland  * recover_status |= LOCKS
566c04fecb4SDavid Teigland  *
567c04fecb4SDavid Teigland  * dlm_recover_locks_wait()
568c04fecb4SDavid Teigland  *
569c04fecb4SDavid Teigland  * recover_status |= DONE
570c04fecb4SDavid Teigland  */
571c04fecb4SDavid Teigland 
572c36258b5SDavid Teigland /* Called by dlm_recv; corresponds to dlm_receive_message() but special
573e7fd4179SDavid Teigland    recovery-only comms are sent through here. */
574e7fd4179SDavid Teigland 
575c36258b5SDavid Teigland void dlm_receive_rcom(struct dlm_ls *ls, struct dlm_rcom *rc, int nodeid)
576e7fd4179SDavid Teigland {
577ae773d0bSAl Viro 	int lock_size = sizeof(struct dlm_rcom) + sizeof(struct rcom_lock);
578c04fecb4SDavid Teigland 	int stop, reply = 0, names = 0, lookup = 0, lock = 0;
5794875647aSDavid Teigland 	uint32_t status;
580d6e24788SDavid Teigland 	uint64_t seq;
581ae773d0bSAl Viro 
582d6e24788SDavid Teigland 	switch (rc->rc_type) {
583c04fecb4SDavid Teigland 	case DLM_RCOM_STATUS_REPLY:
584c04fecb4SDavid Teigland 		reply = 1;
585c04fecb4SDavid Teigland 		break;
586c04fecb4SDavid Teigland 	case DLM_RCOM_NAMES:
587c04fecb4SDavid Teigland 		names = 1;
588c04fecb4SDavid Teigland 		break;
589c04fecb4SDavid Teigland 	case DLM_RCOM_NAMES_REPLY:
590c04fecb4SDavid Teigland 		names = 1;
591c04fecb4SDavid Teigland 		reply = 1;
592c04fecb4SDavid Teigland 		break;
593c04fecb4SDavid Teigland 	case DLM_RCOM_LOOKUP:
594c04fecb4SDavid Teigland 		lookup = 1;
595c04fecb4SDavid Teigland 		break;
596c04fecb4SDavid Teigland 	case DLM_RCOM_LOOKUP_REPLY:
597c04fecb4SDavid Teigland 		lookup = 1;
598c04fecb4SDavid Teigland 		reply = 1;
599c04fecb4SDavid Teigland 		break;
6004875647aSDavid Teigland 	case DLM_RCOM_LOCK:
6014875647aSDavid Teigland 		lock = 1;
6024875647aSDavid Teigland 		break;
6034875647aSDavid Teigland 	case DLM_RCOM_LOCK_REPLY:
6044875647aSDavid Teigland 		lock = 1;
6054875647aSDavid Teigland 		reply = 1;
6064875647aSDavid Teigland 		break;
60790db4f8bSWu Bo 	}
608d6e24788SDavid Teigland 
609d6e24788SDavid Teigland 	spin_lock(&ls->ls_recover_lock);
6104875647aSDavid Teigland 	status = ls->ls_recover_status;
611475f230cSDavid Teigland 	stop = test_bit(LSFL_RECOVER_STOP, &ls->ls_flags);
612d6e24788SDavid Teigland 	seq = ls->ls_recover_seq;
613d6e24788SDavid Teigland 	spin_unlock(&ls->ls_recover_lock);
614d6e24788SDavid Teigland 
615c04fecb4SDavid Teigland 	if (stop && (rc->rc_type != DLM_RCOM_STATUS))
616c04fecb4SDavid Teigland 		goto ignore;
617c04fecb4SDavid Teigland 
618c04fecb4SDavid Teigland 	if (reply && (rc->rc_seq_reply != seq))
619c04fecb4SDavid Teigland 		goto ignore;
620c04fecb4SDavid Teigland 
621c04fecb4SDavid Teigland 	if (!(status & DLM_RS_NODES) && (names || lookup || lock))
622c04fecb4SDavid Teigland 		goto ignore;
623c04fecb4SDavid Teigland 
624c04fecb4SDavid Teigland 	if (!(status & DLM_RS_DIR) && (lookup || lock))
625c04fecb4SDavid Teigland 		goto ignore;
626e7fd4179SDavid Teigland 
627e7fd4179SDavid Teigland 	switch (rc->rc_type) {
628e7fd4179SDavid Teigland 	case DLM_RCOM_STATUS:
629e7fd4179SDavid Teigland 		receive_rcom_status(ls, rc);
630e7fd4179SDavid Teigland 		break;
631e7fd4179SDavid Teigland 
632e7fd4179SDavid Teigland 	case DLM_RCOM_NAMES:
633e7fd4179SDavid Teigland 		receive_rcom_names(ls, rc);
634e7fd4179SDavid Teigland 		break;
635e7fd4179SDavid Teigland 
636e7fd4179SDavid Teigland 	case DLM_RCOM_LOOKUP:
637e7fd4179SDavid Teigland 		receive_rcom_lookup(ls, rc);
638e7fd4179SDavid Teigland 		break;
639e7fd4179SDavid Teigland 
640e7fd4179SDavid Teigland 	case DLM_RCOM_LOCK:
641ae773d0bSAl Viro 		if (rc->rc_header.h_length < lock_size)
642ae773d0bSAl Viro 			goto Eshort;
643e7fd4179SDavid Teigland 		receive_rcom_lock(ls, rc);
644e7fd4179SDavid Teigland 		break;
645e7fd4179SDavid Teigland 
646e7fd4179SDavid Teigland 	case DLM_RCOM_STATUS_REPLY:
647dbcfc347SDavid Teigland 		receive_sync_reply(ls, rc);
648e7fd4179SDavid Teigland 		break;
649e7fd4179SDavid Teigland 
650e7fd4179SDavid Teigland 	case DLM_RCOM_NAMES_REPLY:
651dbcfc347SDavid Teigland 		receive_sync_reply(ls, rc);
652e7fd4179SDavid Teigland 		break;
653e7fd4179SDavid Teigland 
654e7fd4179SDavid Teigland 	case DLM_RCOM_LOOKUP_REPLY:
655e7fd4179SDavid Teigland 		receive_rcom_lookup_reply(ls, rc);
656e7fd4179SDavid Teigland 		break;
657e7fd4179SDavid Teigland 
658e7fd4179SDavid Teigland 	case DLM_RCOM_LOCK_REPLY:
659ae773d0bSAl Viro 		if (rc->rc_header.h_length < lock_size)
660ae773d0bSAl Viro 			goto Eshort;
661dbcfc347SDavid Teigland 		dlm_recover_process_copy(ls, rc);
662e7fd4179SDavid Teigland 		break;
663e7fd4179SDavid Teigland 
664e7fd4179SDavid Teigland 	default:
665dbcfc347SDavid Teigland 		log_error(ls, "receive_rcom bad type %d", rc->rc_type);
666e7fd4179SDavid Teigland 	}
667c04fecb4SDavid Teigland 	return;
668c04fecb4SDavid Teigland 
669c04fecb4SDavid Teigland ignore:
670c04fecb4SDavid Teigland 	log_limit(ls, "dlm_receive_rcom ignore msg %d "
671c04fecb4SDavid Teigland 		  "from %d %llu %llu recover seq %llu sts %x gen %u",
672c04fecb4SDavid Teigland 		   rc->rc_type,
673c04fecb4SDavid Teigland 		   nodeid,
674c04fecb4SDavid Teigland 		   (unsigned long long)rc->rc_seq,
675c04fecb4SDavid Teigland 		   (unsigned long long)rc->rc_seq_reply,
676c04fecb4SDavid Teigland 		   (unsigned long long)seq,
677c04fecb4SDavid Teigland 		   status, ls->ls_generation);
678c36258b5SDavid Teigland 	return;
679ae773d0bSAl Viro Eshort:
680c04fecb4SDavid Teigland 	log_error(ls, "recovery message %d from %d is too short",
681ae773d0bSAl Viro 		  rc->rc_type, nodeid);
682e7fd4179SDavid Teigland }
683e7fd4179SDavid Teigland 
684