1 // SPDX-License-Identifier: BSD-3-Clause OR GPL-2.0
2 /* Copyright (c) 2015-2018 Mellanox Technologies. All rights reserved */
3 
4 #include <linux/kernel.h>
5 #include <linux/module.h>
6 #include <linux/export.h>
7 #include <linux/err.h>
8 #include <linux/device.h>
9 #include <linux/pci.h>
10 #include <linux/interrupt.h>
11 #include <linux/wait.h>
12 #include <linux/types.h>
13 #include <linux/skbuff.h>
14 #include <linux/if_vlan.h>
15 #include <linux/log2.h>
16 #include <linux/string.h>
17 
18 #include "pci_hw.h"
19 #include "pci.h"
20 #include "core.h"
21 #include "cmd.h"
22 #include "port.h"
23 #include "resources.h"
24 
25 #define mlxsw_pci_write32(mlxsw_pci, reg, val) \
26 	iowrite32be(val, (mlxsw_pci)->hw_addr + (MLXSW_PCI_ ## reg))
27 #define mlxsw_pci_read32(mlxsw_pci, reg) \
28 	ioread32be((mlxsw_pci)->hw_addr + (MLXSW_PCI_ ## reg))
29 
30 enum mlxsw_pci_queue_type {
31 	MLXSW_PCI_QUEUE_TYPE_SDQ,
32 	MLXSW_PCI_QUEUE_TYPE_RDQ,
33 	MLXSW_PCI_QUEUE_TYPE_CQ,
34 	MLXSW_PCI_QUEUE_TYPE_EQ,
35 };
36 
37 #define MLXSW_PCI_QUEUE_TYPE_COUNT	4
38 
39 static const u16 mlxsw_pci_doorbell_type_offset[] = {
40 	MLXSW_PCI_DOORBELL_SDQ_OFFSET,	/* for type MLXSW_PCI_QUEUE_TYPE_SDQ */
41 	MLXSW_PCI_DOORBELL_RDQ_OFFSET,	/* for type MLXSW_PCI_QUEUE_TYPE_RDQ */
42 	MLXSW_PCI_DOORBELL_CQ_OFFSET,	/* for type MLXSW_PCI_QUEUE_TYPE_CQ */
43 	MLXSW_PCI_DOORBELL_EQ_OFFSET,	/* for type MLXSW_PCI_QUEUE_TYPE_EQ */
44 };
45 
46 static const u16 mlxsw_pci_doorbell_arm_type_offset[] = {
47 	0, /* unused */
48 	0, /* unused */
49 	MLXSW_PCI_DOORBELL_ARM_CQ_OFFSET, /* for type MLXSW_PCI_QUEUE_TYPE_CQ */
50 	MLXSW_PCI_DOORBELL_ARM_EQ_OFFSET, /* for type MLXSW_PCI_QUEUE_TYPE_EQ */
51 };
52 
53 struct mlxsw_pci_mem_item {
54 	char *buf;
55 	dma_addr_t mapaddr;
56 	size_t size;
57 };
58 
59 struct mlxsw_pci_queue_elem_info {
60 	char *elem; /* pointer to actual dma mapped element mem chunk */
61 	union {
62 		struct {
63 			struct sk_buff *skb;
64 		} sdq;
65 		struct {
66 			struct sk_buff *skb;
67 		} rdq;
68 	} u;
69 };
70 
71 struct mlxsw_pci_queue {
72 	spinlock_t lock; /* for queue accesses */
73 	struct mlxsw_pci_mem_item mem_item;
74 	struct mlxsw_pci_queue_elem_info *elem_info;
75 	u16 producer_counter;
76 	u16 consumer_counter;
77 	u16 count; /* number of elements in queue */
78 	u8 num; /* queue number */
79 	u8 elem_size; /* size of one element */
80 	enum mlxsw_pci_queue_type type;
81 	struct tasklet_struct tasklet; /* queue processing tasklet */
82 	struct mlxsw_pci *pci;
83 	union {
84 		struct {
85 			u32 comp_sdq_count;
86 			u32 comp_rdq_count;
87 			enum mlxsw_pci_cqe_v v;
88 		} cq;
89 		struct {
90 			u32 ev_cmd_count;
91 			u32 ev_comp_count;
92 			u32 ev_other_count;
93 		} eq;
94 	} u;
95 };
96 
97 struct mlxsw_pci_queue_type_group {
98 	struct mlxsw_pci_queue *q;
99 	u8 count; /* number of queues in group */
100 };
101 
102 struct mlxsw_pci {
103 	struct pci_dev *pdev;
104 	u8 __iomem *hw_addr;
105 	u64 free_running_clock_offset;
106 	struct mlxsw_pci_queue_type_group queues[MLXSW_PCI_QUEUE_TYPE_COUNT];
107 	u32 doorbell_offset;
108 	struct mlxsw_core *core;
109 	struct {
110 		struct mlxsw_pci_mem_item *items;
111 		unsigned int count;
112 	} fw_area;
113 	struct {
114 		struct mlxsw_pci_mem_item out_mbox;
115 		struct mlxsw_pci_mem_item in_mbox;
116 		struct mutex lock; /* Lock access to command registers */
117 		bool nopoll;
118 		wait_queue_head_t wait;
119 		bool wait_done;
120 		struct {
121 			u8 status;
122 			u64 out_param;
123 		} comp;
124 	} cmd;
125 	struct mlxsw_bus_info bus_info;
126 	const struct pci_device_id *id;
127 	enum mlxsw_pci_cqe_v max_cqe_ver; /* Maximal supported CQE version */
128 	u8 num_sdq_cqs; /* Number of CQs used for SDQs */
129 };
130 
131 static void mlxsw_pci_queue_tasklet_schedule(struct mlxsw_pci_queue *q)
132 {
133 	tasklet_schedule(&q->tasklet);
134 }
135 
136 static char *__mlxsw_pci_queue_elem_get(struct mlxsw_pci_queue *q,
137 					size_t elem_size, int elem_index)
138 {
139 	return q->mem_item.buf + (elem_size * elem_index);
140 }
141 
142 static struct mlxsw_pci_queue_elem_info *
143 mlxsw_pci_queue_elem_info_get(struct mlxsw_pci_queue *q, int elem_index)
144 {
145 	return &q->elem_info[elem_index];
146 }
147 
148 static struct mlxsw_pci_queue_elem_info *
149 mlxsw_pci_queue_elem_info_producer_get(struct mlxsw_pci_queue *q)
150 {
151 	int index = q->producer_counter & (q->count - 1);
152 
153 	if ((u16) (q->producer_counter - q->consumer_counter) == q->count)
154 		return NULL;
155 	return mlxsw_pci_queue_elem_info_get(q, index);
156 }
157 
158 static struct mlxsw_pci_queue_elem_info *
159 mlxsw_pci_queue_elem_info_consumer_get(struct mlxsw_pci_queue *q)
160 {
161 	int index = q->consumer_counter & (q->count - 1);
162 
163 	return mlxsw_pci_queue_elem_info_get(q, index);
164 }
165 
166 static char *mlxsw_pci_queue_elem_get(struct mlxsw_pci_queue *q, int elem_index)
167 {
168 	return mlxsw_pci_queue_elem_info_get(q, elem_index)->elem;
169 }
170 
171 static bool mlxsw_pci_elem_hw_owned(struct mlxsw_pci_queue *q, bool owner_bit)
172 {
173 	return owner_bit != !!(q->consumer_counter & q->count);
174 }
175 
176 static struct mlxsw_pci_queue_type_group *
177 mlxsw_pci_queue_type_group_get(struct mlxsw_pci *mlxsw_pci,
178 			       enum mlxsw_pci_queue_type q_type)
179 {
180 	return &mlxsw_pci->queues[q_type];
181 }
182 
183 static u8 __mlxsw_pci_queue_count(struct mlxsw_pci *mlxsw_pci,
184 				  enum mlxsw_pci_queue_type q_type)
185 {
186 	struct mlxsw_pci_queue_type_group *queue_group;
187 
188 	queue_group = mlxsw_pci_queue_type_group_get(mlxsw_pci, q_type);
189 	return queue_group->count;
190 }
191 
192 static u8 mlxsw_pci_sdq_count(struct mlxsw_pci *mlxsw_pci)
193 {
194 	return __mlxsw_pci_queue_count(mlxsw_pci, MLXSW_PCI_QUEUE_TYPE_SDQ);
195 }
196 
197 static u8 mlxsw_pci_cq_count(struct mlxsw_pci *mlxsw_pci)
198 {
199 	return __mlxsw_pci_queue_count(mlxsw_pci, MLXSW_PCI_QUEUE_TYPE_CQ);
200 }
201 
202 static struct mlxsw_pci_queue *
203 __mlxsw_pci_queue_get(struct mlxsw_pci *mlxsw_pci,
204 		      enum mlxsw_pci_queue_type q_type, u8 q_num)
205 {
206 	return &mlxsw_pci->queues[q_type].q[q_num];
207 }
208 
209 static struct mlxsw_pci_queue *mlxsw_pci_sdq_get(struct mlxsw_pci *mlxsw_pci,
210 						 u8 q_num)
211 {
212 	return __mlxsw_pci_queue_get(mlxsw_pci,
213 				     MLXSW_PCI_QUEUE_TYPE_SDQ, q_num);
214 }
215 
216 static struct mlxsw_pci_queue *mlxsw_pci_rdq_get(struct mlxsw_pci *mlxsw_pci,
217 						 u8 q_num)
218 {
219 	return __mlxsw_pci_queue_get(mlxsw_pci,
220 				     MLXSW_PCI_QUEUE_TYPE_RDQ, q_num);
221 }
222 
223 static struct mlxsw_pci_queue *mlxsw_pci_cq_get(struct mlxsw_pci *mlxsw_pci,
224 						u8 q_num)
225 {
226 	return __mlxsw_pci_queue_get(mlxsw_pci, MLXSW_PCI_QUEUE_TYPE_CQ, q_num);
227 }
228 
229 static struct mlxsw_pci_queue *mlxsw_pci_eq_get(struct mlxsw_pci *mlxsw_pci,
230 						u8 q_num)
231 {
232 	return __mlxsw_pci_queue_get(mlxsw_pci, MLXSW_PCI_QUEUE_TYPE_EQ, q_num);
233 }
234 
235 static void __mlxsw_pci_queue_doorbell_set(struct mlxsw_pci *mlxsw_pci,
236 					   struct mlxsw_pci_queue *q,
237 					   u16 val)
238 {
239 	mlxsw_pci_write32(mlxsw_pci,
240 			  DOORBELL(mlxsw_pci->doorbell_offset,
241 				   mlxsw_pci_doorbell_type_offset[q->type],
242 				   q->num), val);
243 }
244 
245 static void __mlxsw_pci_queue_doorbell_arm_set(struct mlxsw_pci *mlxsw_pci,
246 					       struct mlxsw_pci_queue *q,
247 					       u16 val)
248 {
249 	mlxsw_pci_write32(mlxsw_pci,
250 			  DOORBELL(mlxsw_pci->doorbell_offset,
251 				   mlxsw_pci_doorbell_arm_type_offset[q->type],
252 				   q->num), val);
253 }
254 
255 static void mlxsw_pci_queue_doorbell_producer_ring(struct mlxsw_pci *mlxsw_pci,
256 						   struct mlxsw_pci_queue *q)
257 {
258 	wmb(); /* ensure all writes are done before we ring a bell */
259 	__mlxsw_pci_queue_doorbell_set(mlxsw_pci, q, q->producer_counter);
260 }
261 
262 static void mlxsw_pci_queue_doorbell_consumer_ring(struct mlxsw_pci *mlxsw_pci,
263 						   struct mlxsw_pci_queue *q)
264 {
265 	wmb(); /* ensure all writes are done before we ring a bell */
266 	__mlxsw_pci_queue_doorbell_set(mlxsw_pci, q,
267 				       q->consumer_counter + q->count);
268 }
269 
270 static void
271 mlxsw_pci_queue_doorbell_arm_consumer_ring(struct mlxsw_pci *mlxsw_pci,
272 					   struct mlxsw_pci_queue *q)
273 {
274 	wmb(); /* ensure all writes are done before we ring a bell */
275 	__mlxsw_pci_queue_doorbell_arm_set(mlxsw_pci, q, q->consumer_counter);
276 }
277 
278 static dma_addr_t __mlxsw_pci_queue_page_get(struct mlxsw_pci_queue *q,
279 					     int page_index)
280 {
281 	return q->mem_item.mapaddr + MLXSW_PCI_PAGE_SIZE * page_index;
282 }
283 
284 static int mlxsw_pci_sdq_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
285 			      struct mlxsw_pci_queue *q)
286 {
287 	int i;
288 	int err;
289 
290 	q->producer_counter = 0;
291 	q->consumer_counter = 0;
292 
293 	/* Set CQ of same number of this SDQ. */
294 	mlxsw_cmd_mbox_sw2hw_dq_cq_set(mbox, q->num);
295 	mlxsw_cmd_mbox_sw2hw_dq_sdq_tclass_set(mbox, 3);
296 	mlxsw_cmd_mbox_sw2hw_dq_log2_dq_sz_set(mbox, 3); /* 8 pages */
297 	for (i = 0; i < MLXSW_PCI_AQ_PAGES; i++) {
298 		dma_addr_t mapaddr = __mlxsw_pci_queue_page_get(q, i);
299 
300 		mlxsw_cmd_mbox_sw2hw_dq_pa_set(mbox, i, mapaddr);
301 	}
302 
303 	err = mlxsw_cmd_sw2hw_sdq(mlxsw_pci->core, mbox, q->num);
304 	if (err)
305 		return err;
306 	mlxsw_pci_queue_doorbell_producer_ring(mlxsw_pci, q);
307 	return 0;
308 }
309 
310 static void mlxsw_pci_sdq_fini(struct mlxsw_pci *mlxsw_pci,
311 			       struct mlxsw_pci_queue *q)
312 {
313 	mlxsw_cmd_hw2sw_sdq(mlxsw_pci->core, q->num);
314 }
315 
316 static int mlxsw_pci_wqe_frag_map(struct mlxsw_pci *mlxsw_pci, char *wqe,
317 				  int index, char *frag_data, size_t frag_len,
318 				  int direction)
319 {
320 	struct pci_dev *pdev = mlxsw_pci->pdev;
321 	dma_addr_t mapaddr;
322 
323 	mapaddr = pci_map_single(pdev, frag_data, frag_len, direction);
324 	if (unlikely(pci_dma_mapping_error(pdev, mapaddr))) {
325 		dev_err_ratelimited(&pdev->dev, "failed to dma map tx frag\n");
326 		return -EIO;
327 	}
328 	mlxsw_pci_wqe_address_set(wqe, index, mapaddr);
329 	mlxsw_pci_wqe_byte_count_set(wqe, index, frag_len);
330 	return 0;
331 }
332 
333 static void mlxsw_pci_wqe_frag_unmap(struct mlxsw_pci *mlxsw_pci, char *wqe,
334 				     int index, int direction)
335 {
336 	struct pci_dev *pdev = mlxsw_pci->pdev;
337 	size_t frag_len = mlxsw_pci_wqe_byte_count_get(wqe, index);
338 	dma_addr_t mapaddr = mlxsw_pci_wqe_address_get(wqe, index);
339 
340 	if (!frag_len)
341 		return;
342 	pci_unmap_single(pdev, mapaddr, frag_len, direction);
343 }
344 
345 static int mlxsw_pci_rdq_skb_alloc(struct mlxsw_pci *mlxsw_pci,
346 				   struct mlxsw_pci_queue_elem_info *elem_info)
347 {
348 	size_t buf_len = MLXSW_PORT_MAX_MTU;
349 	char *wqe = elem_info->elem;
350 	struct sk_buff *skb;
351 	int err;
352 
353 	elem_info->u.rdq.skb = NULL;
354 	skb = netdev_alloc_skb_ip_align(NULL, buf_len);
355 	if (!skb)
356 		return -ENOMEM;
357 
358 	/* Assume that wqe was previously zeroed. */
359 
360 	err = mlxsw_pci_wqe_frag_map(mlxsw_pci, wqe, 0, skb->data,
361 				     buf_len, DMA_FROM_DEVICE);
362 	if (err)
363 		goto err_frag_map;
364 
365 	elem_info->u.rdq.skb = skb;
366 	return 0;
367 
368 err_frag_map:
369 	dev_kfree_skb_any(skb);
370 	return err;
371 }
372 
373 static void mlxsw_pci_rdq_skb_free(struct mlxsw_pci *mlxsw_pci,
374 				   struct mlxsw_pci_queue_elem_info *elem_info)
375 {
376 	struct sk_buff *skb;
377 	char *wqe;
378 
379 	skb = elem_info->u.rdq.skb;
380 	wqe = elem_info->elem;
381 
382 	mlxsw_pci_wqe_frag_unmap(mlxsw_pci, wqe, 0, DMA_FROM_DEVICE);
383 	dev_kfree_skb_any(skb);
384 }
385 
386 static int mlxsw_pci_rdq_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
387 			      struct mlxsw_pci_queue *q)
388 {
389 	struct mlxsw_pci_queue_elem_info *elem_info;
390 	u8 sdq_count = mlxsw_pci_sdq_count(mlxsw_pci);
391 	int i;
392 	int err;
393 
394 	q->producer_counter = 0;
395 	q->consumer_counter = 0;
396 
397 	/* Set CQ of same number of this RDQ with base
398 	 * above SDQ count as the lower ones are assigned to SDQs.
399 	 */
400 	mlxsw_cmd_mbox_sw2hw_dq_cq_set(mbox, sdq_count + q->num);
401 	mlxsw_cmd_mbox_sw2hw_dq_log2_dq_sz_set(mbox, 3); /* 8 pages */
402 	for (i = 0; i < MLXSW_PCI_AQ_PAGES; i++) {
403 		dma_addr_t mapaddr = __mlxsw_pci_queue_page_get(q, i);
404 
405 		mlxsw_cmd_mbox_sw2hw_dq_pa_set(mbox, i, mapaddr);
406 	}
407 
408 	err = mlxsw_cmd_sw2hw_rdq(mlxsw_pci->core, mbox, q->num);
409 	if (err)
410 		return err;
411 
412 	mlxsw_pci_queue_doorbell_producer_ring(mlxsw_pci, q);
413 
414 	for (i = 0; i < q->count; i++) {
415 		elem_info = mlxsw_pci_queue_elem_info_producer_get(q);
416 		BUG_ON(!elem_info);
417 		err = mlxsw_pci_rdq_skb_alloc(mlxsw_pci, elem_info);
418 		if (err)
419 			goto rollback;
420 		/* Everything is set up, ring doorbell to pass elem to HW */
421 		q->producer_counter++;
422 		mlxsw_pci_queue_doorbell_producer_ring(mlxsw_pci, q);
423 	}
424 
425 	return 0;
426 
427 rollback:
428 	for (i--; i >= 0; i--) {
429 		elem_info = mlxsw_pci_queue_elem_info_get(q, i);
430 		mlxsw_pci_rdq_skb_free(mlxsw_pci, elem_info);
431 	}
432 	mlxsw_cmd_hw2sw_rdq(mlxsw_pci->core, q->num);
433 
434 	return err;
435 }
436 
437 static void mlxsw_pci_rdq_fini(struct mlxsw_pci *mlxsw_pci,
438 			       struct mlxsw_pci_queue *q)
439 {
440 	struct mlxsw_pci_queue_elem_info *elem_info;
441 	int i;
442 
443 	mlxsw_cmd_hw2sw_rdq(mlxsw_pci->core, q->num);
444 	for (i = 0; i < q->count; i++) {
445 		elem_info = mlxsw_pci_queue_elem_info_get(q, i);
446 		mlxsw_pci_rdq_skb_free(mlxsw_pci, elem_info);
447 	}
448 }
449 
450 static void mlxsw_pci_cq_pre_init(struct mlxsw_pci *mlxsw_pci,
451 				  struct mlxsw_pci_queue *q)
452 {
453 	q->u.cq.v = mlxsw_pci->max_cqe_ver;
454 
455 	/* For SDQ it is pointless to use CQEv2, so use CQEv1 instead */
456 	if (q->u.cq.v == MLXSW_PCI_CQE_V2 &&
457 	    q->num < mlxsw_pci->num_sdq_cqs)
458 		q->u.cq.v = MLXSW_PCI_CQE_V1;
459 }
460 
461 static int mlxsw_pci_cq_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
462 			     struct mlxsw_pci_queue *q)
463 {
464 	int i;
465 	int err;
466 
467 	q->consumer_counter = 0;
468 
469 	for (i = 0; i < q->count; i++) {
470 		char *elem = mlxsw_pci_queue_elem_get(q, i);
471 
472 		mlxsw_pci_cqe_owner_set(q->u.cq.v, elem, 1);
473 	}
474 
475 	if (q->u.cq.v == MLXSW_PCI_CQE_V1)
476 		mlxsw_cmd_mbox_sw2hw_cq_cqe_ver_set(mbox,
477 				MLXSW_CMD_MBOX_SW2HW_CQ_CQE_VER_1);
478 	else if (q->u.cq.v == MLXSW_PCI_CQE_V2)
479 		mlxsw_cmd_mbox_sw2hw_cq_cqe_ver_set(mbox,
480 				MLXSW_CMD_MBOX_SW2HW_CQ_CQE_VER_2);
481 
482 	mlxsw_cmd_mbox_sw2hw_cq_c_eqn_set(mbox, MLXSW_PCI_EQ_COMP_NUM);
483 	mlxsw_cmd_mbox_sw2hw_cq_st_set(mbox, 0);
484 	mlxsw_cmd_mbox_sw2hw_cq_log_cq_size_set(mbox, ilog2(q->count));
485 	for (i = 0; i < MLXSW_PCI_AQ_PAGES; i++) {
486 		dma_addr_t mapaddr = __mlxsw_pci_queue_page_get(q, i);
487 
488 		mlxsw_cmd_mbox_sw2hw_cq_pa_set(mbox, i, mapaddr);
489 	}
490 	err = mlxsw_cmd_sw2hw_cq(mlxsw_pci->core, mbox, q->num);
491 	if (err)
492 		return err;
493 	mlxsw_pci_queue_doorbell_consumer_ring(mlxsw_pci, q);
494 	mlxsw_pci_queue_doorbell_arm_consumer_ring(mlxsw_pci, q);
495 	return 0;
496 }
497 
498 static void mlxsw_pci_cq_fini(struct mlxsw_pci *mlxsw_pci,
499 			      struct mlxsw_pci_queue *q)
500 {
501 	mlxsw_cmd_hw2sw_cq(mlxsw_pci->core, q->num);
502 }
503 
504 static void mlxsw_pci_cqe_sdq_handle(struct mlxsw_pci *mlxsw_pci,
505 				     struct mlxsw_pci_queue *q,
506 				     u16 consumer_counter_limit,
507 				     char *cqe)
508 {
509 	struct pci_dev *pdev = mlxsw_pci->pdev;
510 	struct mlxsw_pci_queue_elem_info *elem_info;
511 	struct mlxsw_tx_info tx_info;
512 	char *wqe;
513 	struct sk_buff *skb;
514 	int i;
515 
516 	spin_lock(&q->lock);
517 	elem_info = mlxsw_pci_queue_elem_info_consumer_get(q);
518 	tx_info = mlxsw_skb_cb(elem_info->u.sdq.skb)->tx_info;
519 	skb = elem_info->u.sdq.skb;
520 	wqe = elem_info->elem;
521 	for (i = 0; i < MLXSW_PCI_WQE_SG_ENTRIES; i++)
522 		mlxsw_pci_wqe_frag_unmap(mlxsw_pci, wqe, i, DMA_TO_DEVICE);
523 
524 	if (unlikely(!tx_info.is_emad &&
525 		     skb_shinfo(skb)->tx_flags & SKBTX_HW_TSTAMP)) {
526 		mlxsw_core_ptp_transmitted(mlxsw_pci->core, skb,
527 					   tx_info.local_port);
528 		skb = NULL;
529 	}
530 
531 	if (skb)
532 		dev_kfree_skb_any(skb);
533 	elem_info->u.sdq.skb = NULL;
534 
535 	if (q->consumer_counter++ != consumer_counter_limit)
536 		dev_dbg_ratelimited(&pdev->dev, "Consumer counter does not match limit in SDQ\n");
537 	spin_unlock(&q->lock);
538 }
539 
540 static void mlxsw_pci_cqe_rdq_handle(struct mlxsw_pci *mlxsw_pci,
541 				     struct mlxsw_pci_queue *q,
542 				     u16 consumer_counter_limit,
543 				     enum mlxsw_pci_cqe_v cqe_v, char *cqe)
544 {
545 	struct pci_dev *pdev = mlxsw_pci->pdev;
546 	struct mlxsw_pci_queue_elem_info *elem_info;
547 	char *wqe;
548 	struct sk_buff *skb;
549 	struct mlxsw_rx_info rx_info;
550 	u16 byte_count;
551 	int err;
552 
553 	elem_info = mlxsw_pci_queue_elem_info_consumer_get(q);
554 	skb = elem_info->u.sdq.skb;
555 	if (!skb)
556 		return;
557 	wqe = elem_info->elem;
558 	mlxsw_pci_wqe_frag_unmap(mlxsw_pci, wqe, 0, DMA_FROM_DEVICE);
559 
560 	if (q->consumer_counter++ != consumer_counter_limit)
561 		dev_dbg_ratelimited(&pdev->dev, "Consumer counter does not match limit in RDQ\n");
562 
563 	if (mlxsw_pci_cqe_lag_get(cqe_v, cqe)) {
564 		rx_info.is_lag = true;
565 		rx_info.u.lag_id = mlxsw_pci_cqe_lag_id_get(cqe_v, cqe);
566 		rx_info.lag_port_index =
567 			mlxsw_pci_cqe_lag_subport_get(cqe_v, cqe);
568 	} else {
569 		rx_info.is_lag = false;
570 		rx_info.u.sys_port = mlxsw_pci_cqe_system_port_get(cqe);
571 	}
572 
573 	rx_info.trap_id = mlxsw_pci_cqe_trap_id_get(cqe);
574 
575 	byte_count = mlxsw_pci_cqe_byte_count_get(cqe);
576 	if (mlxsw_pci_cqe_crc_get(cqe_v, cqe))
577 		byte_count -= ETH_FCS_LEN;
578 	skb_put(skb, byte_count);
579 	mlxsw_core_skb_receive(mlxsw_pci->core, skb, &rx_info);
580 
581 	memset(wqe, 0, q->elem_size);
582 	err = mlxsw_pci_rdq_skb_alloc(mlxsw_pci, elem_info);
583 	if (err)
584 		dev_dbg_ratelimited(&pdev->dev, "Failed to alloc skb for RDQ\n");
585 	/* Everything is set up, ring doorbell to pass elem to HW */
586 	q->producer_counter++;
587 	mlxsw_pci_queue_doorbell_producer_ring(mlxsw_pci, q);
588 	return;
589 }
590 
591 static char *mlxsw_pci_cq_sw_cqe_get(struct mlxsw_pci_queue *q)
592 {
593 	struct mlxsw_pci_queue_elem_info *elem_info;
594 	char *elem;
595 	bool owner_bit;
596 
597 	elem_info = mlxsw_pci_queue_elem_info_consumer_get(q);
598 	elem = elem_info->elem;
599 	owner_bit = mlxsw_pci_cqe_owner_get(q->u.cq.v, elem);
600 	if (mlxsw_pci_elem_hw_owned(q, owner_bit))
601 		return NULL;
602 	q->consumer_counter++;
603 	rmb(); /* make sure we read owned bit before the rest of elem */
604 	return elem;
605 }
606 
607 static void mlxsw_pci_cq_tasklet(unsigned long data)
608 {
609 	struct mlxsw_pci_queue *q = (struct mlxsw_pci_queue *) data;
610 	struct mlxsw_pci *mlxsw_pci = q->pci;
611 	char *cqe;
612 	int items = 0;
613 	int credits = q->count >> 1;
614 
615 	while ((cqe = mlxsw_pci_cq_sw_cqe_get(q))) {
616 		u16 wqe_counter = mlxsw_pci_cqe_wqe_counter_get(cqe);
617 		u8 sendq = mlxsw_pci_cqe_sr_get(q->u.cq.v, cqe);
618 		u8 dqn = mlxsw_pci_cqe_dqn_get(q->u.cq.v, cqe);
619 		char ncqe[MLXSW_PCI_CQE_SIZE_MAX];
620 
621 		memcpy(ncqe, cqe, q->elem_size);
622 		mlxsw_pci_queue_doorbell_consumer_ring(mlxsw_pci, q);
623 
624 		if (sendq) {
625 			struct mlxsw_pci_queue *sdq;
626 
627 			sdq = mlxsw_pci_sdq_get(mlxsw_pci, dqn);
628 			mlxsw_pci_cqe_sdq_handle(mlxsw_pci, sdq,
629 						 wqe_counter, ncqe);
630 			q->u.cq.comp_sdq_count++;
631 		} else {
632 			struct mlxsw_pci_queue *rdq;
633 
634 			rdq = mlxsw_pci_rdq_get(mlxsw_pci, dqn);
635 			mlxsw_pci_cqe_rdq_handle(mlxsw_pci, rdq,
636 						 wqe_counter, q->u.cq.v, ncqe);
637 			q->u.cq.comp_rdq_count++;
638 		}
639 		if (++items == credits)
640 			break;
641 	}
642 	if (items)
643 		mlxsw_pci_queue_doorbell_arm_consumer_ring(mlxsw_pci, q);
644 }
645 
646 static u16 mlxsw_pci_cq_elem_count(const struct mlxsw_pci_queue *q)
647 {
648 	return q->u.cq.v == MLXSW_PCI_CQE_V2 ? MLXSW_PCI_CQE2_COUNT :
649 					       MLXSW_PCI_CQE01_COUNT;
650 }
651 
652 static u8 mlxsw_pci_cq_elem_size(const struct mlxsw_pci_queue *q)
653 {
654 	return q->u.cq.v == MLXSW_PCI_CQE_V2 ? MLXSW_PCI_CQE2_SIZE :
655 					       MLXSW_PCI_CQE01_SIZE;
656 }
657 
658 static int mlxsw_pci_eq_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
659 			     struct mlxsw_pci_queue *q)
660 {
661 	int i;
662 	int err;
663 
664 	q->consumer_counter = 0;
665 
666 	for (i = 0; i < q->count; i++) {
667 		char *elem = mlxsw_pci_queue_elem_get(q, i);
668 
669 		mlxsw_pci_eqe_owner_set(elem, 1);
670 	}
671 
672 	mlxsw_cmd_mbox_sw2hw_eq_int_msix_set(mbox, 1); /* MSI-X used */
673 	mlxsw_cmd_mbox_sw2hw_eq_st_set(mbox, 1); /* armed */
674 	mlxsw_cmd_mbox_sw2hw_eq_log_eq_size_set(mbox, ilog2(q->count));
675 	for (i = 0; i < MLXSW_PCI_AQ_PAGES; i++) {
676 		dma_addr_t mapaddr = __mlxsw_pci_queue_page_get(q, i);
677 
678 		mlxsw_cmd_mbox_sw2hw_eq_pa_set(mbox, i, mapaddr);
679 	}
680 	err = mlxsw_cmd_sw2hw_eq(mlxsw_pci->core, mbox, q->num);
681 	if (err)
682 		return err;
683 	mlxsw_pci_queue_doorbell_consumer_ring(mlxsw_pci, q);
684 	mlxsw_pci_queue_doorbell_arm_consumer_ring(mlxsw_pci, q);
685 	return 0;
686 }
687 
688 static void mlxsw_pci_eq_fini(struct mlxsw_pci *mlxsw_pci,
689 			      struct mlxsw_pci_queue *q)
690 {
691 	mlxsw_cmd_hw2sw_eq(mlxsw_pci->core, q->num);
692 }
693 
694 static void mlxsw_pci_eq_cmd_event(struct mlxsw_pci *mlxsw_pci, char *eqe)
695 {
696 	mlxsw_pci->cmd.comp.status = mlxsw_pci_eqe_cmd_status_get(eqe);
697 	mlxsw_pci->cmd.comp.out_param =
698 		((u64) mlxsw_pci_eqe_cmd_out_param_h_get(eqe)) << 32 |
699 		mlxsw_pci_eqe_cmd_out_param_l_get(eqe);
700 	mlxsw_pci->cmd.wait_done = true;
701 	wake_up(&mlxsw_pci->cmd.wait);
702 }
703 
704 static char *mlxsw_pci_eq_sw_eqe_get(struct mlxsw_pci_queue *q)
705 {
706 	struct mlxsw_pci_queue_elem_info *elem_info;
707 	char *elem;
708 	bool owner_bit;
709 
710 	elem_info = mlxsw_pci_queue_elem_info_consumer_get(q);
711 	elem = elem_info->elem;
712 	owner_bit = mlxsw_pci_eqe_owner_get(elem);
713 	if (mlxsw_pci_elem_hw_owned(q, owner_bit))
714 		return NULL;
715 	q->consumer_counter++;
716 	rmb(); /* make sure we read owned bit before the rest of elem */
717 	return elem;
718 }
719 
720 static void mlxsw_pci_eq_tasklet(unsigned long data)
721 {
722 	struct mlxsw_pci_queue *q = (struct mlxsw_pci_queue *) data;
723 	struct mlxsw_pci *mlxsw_pci = q->pci;
724 	u8 cq_count = mlxsw_pci_cq_count(mlxsw_pci);
725 	unsigned long active_cqns[BITS_TO_LONGS(MLXSW_PCI_CQS_MAX)];
726 	char *eqe;
727 	u8 cqn;
728 	bool cq_handle = false;
729 	int items = 0;
730 	int credits = q->count >> 1;
731 
732 	memset(&active_cqns, 0, sizeof(active_cqns));
733 
734 	while ((eqe = mlxsw_pci_eq_sw_eqe_get(q))) {
735 
736 		/* Command interface completion events are always received on
737 		 * queue MLXSW_PCI_EQ_ASYNC_NUM (EQ0) and completion events
738 		 * are mapped to queue MLXSW_PCI_EQ_COMP_NUM (EQ1).
739 		 */
740 		switch (q->num) {
741 		case MLXSW_PCI_EQ_ASYNC_NUM:
742 			mlxsw_pci_eq_cmd_event(mlxsw_pci, eqe);
743 			q->u.eq.ev_cmd_count++;
744 			break;
745 		case MLXSW_PCI_EQ_COMP_NUM:
746 			cqn = mlxsw_pci_eqe_cqn_get(eqe);
747 			set_bit(cqn, active_cqns);
748 			cq_handle = true;
749 			q->u.eq.ev_comp_count++;
750 			break;
751 		default:
752 			q->u.eq.ev_other_count++;
753 		}
754 		if (++items == credits)
755 			break;
756 	}
757 	if (items) {
758 		mlxsw_pci_queue_doorbell_consumer_ring(mlxsw_pci, q);
759 		mlxsw_pci_queue_doorbell_arm_consumer_ring(mlxsw_pci, q);
760 	}
761 
762 	if (!cq_handle)
763 		return;
764 	for_each_set_bit(cqn, active_cqns, cq_count) {
765 		q = mlxsw_pci_cq_get(mlxsw_pci, cqn);
766 		mlxsw_pci_queue_tasklet_schedule(q);
767 	}
768 }
769 
770 struct mlxsw_pci_queue_ops {
771 	const char *name;
772 	enum mlxsw_pci_queue_type type;
773 	void (*pre_init)(struct mlxsw_pci *mlxsw_pci,
774 			 struct mlxsw_pci_queue *q);
775 	int (*init)(struct mlxsw_pci *mlxsw_pci, char *mbox,
776 		    struct mlxsw_pci_queue *q);
777 	void (*fini)(struct mlxsw_pci *mlxsw_pci,
778 		     struct mlxsw_pci_queue *q);
779 	void (*tasklet)(unsigned long data);
780 	u16 (*elem_count_f)(const struct mlxsw_pci_queue *q);
781 	u8 (*elem_size_f)(const struct mlxsw_pci_queue *q);
782 	u16 elem_count;
783 	u8 elem_size;
784 };
785 
786 static const struct mlxsw_pci_queue_ops mlxsw_pci_sdq_ops = {
787 	.type		= MLXSW_PCI_QUEUE_TYPE_SDQ,
788 	.init		= mlxsw_pci_sdq_init,
789 	.fini		= mlxsw_pci_sdq_fini,
790 	.elem_count	= MLXSW_PCI_WQE_COUNT,
791 	.elem_size	= MLXSW_PCI_WQE_SIZE,
792 };
793 
794 static const struct mlxsw_pci_queue_ops mlxsw_pci_rdq_ops = {
795 	.type		= MLXSW_PCI_QUEUE_TYPE_RDQ,
796 	.init		= mlxsw_pci_rdq_init,
797 	.fini		= mlxsw_pci_rdq_fini,
798 	.elem_count	= MLXSW_PCI_WQE_COUNT,
799 	.elem_size	= MLXSW_PCI_WQE_SIZE
800 };
801 
802 static const struct mlxsw_pci_queue_ops mlxsw_pci_cq_ops = {
803 	.type		= MLXSW_PCI_QUEUE_TYPE_CQ,
804 	.pre_init	= mlxsw_pci_cq_pre_init,
805 	.init		= mlxsw_pci_cq_init,
806 	.fini		= mlxsw_pci_cq_fini,
807 	.tasklet	= mlxsw_pci_cq_tasklet,
808 	.elem_count_f	= mlxsw_pci_cq_elem_count,
809 	.elem_size_f	= mlxsw_pci_cq_elem_size
810 };
811 
812 static const struct mlxsw_pci_queue_ops mlxsw_pci_eq_ops = {
813 	.type		= MLXSW_PCI_QUEUE_TYPE_EQ,
814 	.init		= mlxsw_pci_eq_init,
815 	.fini		= mlxsw_pci_eq_fini,
816 	.tasklet	= mlxsw_pci_eq_tasklet,
817 	.elem_count	= MLXSW_PCI_EQE_COUNT,
818 	.elem_size	= MLXSW_PCI_EQE_SIZE
819 };
820 
821 static int mlxsw_pci_queue_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
822 				const struct mlxsw_pci_queue_ops *q_ops,
823 				struct mlxsw_pci_queue *q, u8 q_num)
824 {
825 	struct mlxsw_pci_mem_item *mem_item = &q->mem_item;
826 	int i;
827 	int err;
828 
829 	q->num = q_num;
830 	if (q_ops->pre_init)
831 		q_ops->pre_init(mlxsw_pci, q);
832 
833 	spin_lock_init(&q->lock);
834 	q->count = q_ops->elem_count_f ? q_ops->elem_count_f(q) :
835 					 q_ops->elem_count;
836 	q->elem_size = q_ops->elem_size_f ? q_ops->elem_size_f(q) :
837 					    q_ops->elem_size;
838 	q->type = q_ops->type;
839 	q->pci = mlxsw_pci;
840 
841 	if (q_ops->tasklet)
842 		tasklet_init(&q->tasklet, q_ops->tasklet, (unsigned long) q);
843 
844 	mem_item->size = MLXSW_PCI_AQ_SIZE;
845 	mem_item->buf = pci_alloc_consistent(mlxsw_pci->pdev,
846 					     mem_item->size,
847 					     &mem_item->mapaddr);
848 	if (!mem_item->buf)
849 		return -ENOMEM;
850 	memset(mem_item->buf, 0, mem_item->size);
851 
852 	q->elem_info = kcalloc(q->count, sizeof(*q->elem_info), GFP_KERNEL);
853 	if (!q->elem_info) {
854 		err = -ENOMEM;
855 		goto err_elem_info_alloc;
856 	}
857 
858 	/* Initialize dma mapped elements info elem_info for
859 	 * future easy access.
860 	 */
861 	for (i = 0; i < q->count; i++) {
862 		struct mlxsw_pci_queue_elem_info *elem_info;
863 
864 		elem_info = mlxsw_pci_queue_elem_info_get(q, i);
865 		elem_info->elem =
866 			__mlxsw_pci_queue_elem_get(q, q->elem_size, i);
867 	}
868 
869 	mlxsw_cmd_mbox_zero(mbox);
870 	err = q_ops->init(mlxsw_pci, mbox, q);
871 	if (err)
872 		goto err_q_ops_init;
873 	return 0;
874 
875 err_q_ops_init:
876 	kfree(q->elem_info);
877 err_elem_info_alloc:
878 	pci_free_consistent(mlxsw_pci->pdev, mem_item->size,
879 			    mem_item->buf, mem_item->mapaddr);
880 	return err;
881 }
882 
883 static void mlxsw_pci_queue_fini(struct mlxsw_pci *mlxsw_pci,
884 				 const struct mlxsw_pci_queue_ops *q_ops,
885 				 struct mlxsw_pci_queue *q)
886 {
887 	struct mlxsw_pci_mem_item *mem_item = &q->mem_item;
888 
889 	q_ops->fini(mlxsw_pci, q);
890 	kfree(q->elem_info);
891 	pci_free_consistent(mlxsw_pci->pdev, mem_item->size,
892 			    mem_item->buf, mem_item->mapaddr);
893 }
894 
895 static int mlxsw_pci_queue_group_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
896 				      const struct mlxsw_pci_queue_ops *q_ops,
897 				      u8 num_qs)
898 {
899 	struct mlxsw_pci_queue_type_group *queue_group;
900 	int i;
901 	int err;
902 
903 	queue_group = mlxsw_pci_queue_type_group_get(mlxsw_pci, q_ops->type);
904 	queue_group->q = kcalloc(num_qs, sizeof(*queue_group->q), GFP_KERNEL);
905 	if (!queue_group->q)
906 		return -ENOMEM;
907 
908 	for (i = 0; i < num_qs; i++) {
909 		err = mlxsw_pci_queue_init(mlxsw_pci, mbox, q_ops,
910 					   &queue_group->q[i], i);
911 		if (err)
912 			goto err_queue_init;
913 	}
914 	queue_group->count = num_qs;
915 
916 	return 0;
917 
918 err_queue_init:
919 	for (i--; i >= 0; i--)
920 		mlxsw_pci_queue_fini(mlxsw_pci, q_ops, &queue_group->q[i]);
921 	kfree(queue_group->q);
922 	return err;
923 }
924 
925 static void mlxsw_pci_queue_group_fini(struct mlxsw_pci *mlxsw_pci,
926 				       const struct mlxsw_pci_queue_ops *q_ops)
927 {
928 	struct mlxsw_pci_queue_type_group *queue_group;
929 	int i;
930 
931 	queue_group = mlxsw_pci_queue_type_group_get(mlxsw_pci, q_ops->type);
932 	for (i = 0; i < queue_group->count; i++)
933 		mlxsw_pci_queue_fini(mlxsw_pci, q_ops, &queue_group->q[i]);
934 	kfree(queue_group->q);
935 }
936 
937 static int mlxsw_pci_aqs_init(struct mlxsw_pci *mlxsw_pci, char *mbox)
938 {
939 	struct pci_dev *pdev = mlxsw_pci->pdev;
940 	u8 num_sdqs;
941 	u8 sdq_log2sz;
942 	u8 num_rdqs;
943 	u8 rdq_log2sz;
944 	u8 num_cqs;
945 	u8 cq_log2sz;
946 	u8 cqv2_log2sz;
947 	u8 num_eqs;
948 	u8 eq_log2sz;
949 	int err;
950 
951 	mlxsw_cmd_mbox_zero(mbox);
952 	err = mlxsw_cmd_query_aq_cap(mlxsw_pci->core, mbox);
953 	if (err)
954 		return err;
955 
956 	num_sdqs = mlxsw_cmd_mbox_query_aq_cap_max_num_sdqs_get(mbox);
957 	sdq_log2sz = mlxsw_cmd_mbox_query_aq_cap_log_max_sdq_sz_get(mbox);
958 	num_rdqs = mlxsw_cmd_mbox_query_aq_cap_max_num_rdqs_get(mbox);
959 	rdq_log2sz = mlxsw_cmd_mbox_query_aq_cap_log_max_rdq_sz_get(mbox);
960 	num_cqs = mlxsw_cmd_mbox_query_aq_cap_max_num_cqs_get(mbox);
961 	cq_log2sz = mlxsw_cmd_mbox_query_aq_cap_log_max_cq_sz_get(mbox);
962 	cqv2_log2sz = mlxsw_cmd_mbox_query_aq_cap_log_max_cqv2_sz_get(mbox);
963 	num_eqs = mlxsw_cmd_mbox_query_aq_cap_max_num_eqs_get(mbox);
964 	eq_log2sz = mlxsw_cmd_mbox_query_aq_cap_log_max_eq_sz_get(mbox);
965 
966 	if (num_sdqs + num_rdqs > num_cqs ||
967 	    num_cqs > MLXSW_PCI_CQS_MAX || num_eqs != MLXSW_PCI_EQS_COUNT) {
968 		dev_err(&pdev->dev, "Unsupported number of queues\n");
969 		return -EINVAL;
970 	}
971 
972 	if ((1 << sdq_log2sz != MLXSW_PCI_WQE_COUNT) ||
973 	    (1 << rdq_log2sz != MLXSW_PCI_WQE_COUNT) ||
974 	    (1 << cq_log2sz != MLXSW_PCI_CQE01_COUNT) ||
975 	    (mlxsw_pci->max_cqe_ver == MLXSW_PCI_CQE_V2 &&
976 	     (1 << cqv2_log2sz != MLXSW_PCI_CQE2_COUNT)) ||
977 	    (1 << eq_log2sz != MLXSW_PCI_EQE_COUNT)) {
978 		dev_err(&pdev->dev, "Unsupported number of async queue descriptors\n");
979 		return -EINVAL;
980 	}
981 
982 	mlxsw_pci->num_sdq_cqs = num_sdqs;
983 
984 	err = mlxsw_pci_queue_group_init(mlxsw_pci, mbox, &mlxsw_pci_eq_ops,
985 					 num_eqs);
986 	if (err) {
987 		dev_err(&pdev->dev, "Failed to initialize event queues\n");
988 		return err;
989 	}
990 
991 	err = mlxsw_pci_queue_group_init(mlxsw_pci, mbox, &mlxsw_pci_cq_ops,
992 					 num_cqs);
993 	if (err) {
994 		dev_err(&pdev->dev, "Failed to initialize completion queues\n");
995 		goto err_cqs_init;
996 	}
997 
998 	err = mlxsw_pci_queue_group_init(mlxsw_pci, mbox, &mlxsw_pci_sdq_ops,
999 					 num_sdqs);
1000 	if (err) {
1001 		dev_err(&pdev->dev, "Failed to initialize send descriptor queues\n");
1002 		goto err_sdqs_init;
1003 	}
1004 
1005 	err = mlxsw_pci_queue_group_init(mlxsw_pci, mbox, &mlxsw_pci_rdq_ops,
1006 					 num_rdqs);
1007 	if (err) {
1008 		dev_err(&pdev->dev, "Failed to initialize receive descriptor queues\n");
1009 		goto err_rdqs_init;
1010 	}
1011 
1012 	/* We have to poll in command interface until queues are initialized */
1013 	mlxsw_pci->cmd.nopoll = true;
1014 	return 0;
1015 
1016 err_rdqs_init:
1017 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_sdq_ops);
1018 err_sdqs_init:
1019 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_cq_ops);
1020 err_cqs_init:
1021 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_eq_ops);
1022 	return err;
1023 }
1024 
1025 static void mlxsw_pci_aqs_fini(struct mlxsw_pci *mlxsw_pci)
1026 {
1027 	mlxsw_pci->cmd.nopoll = false;
1028 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_rdq_ops);
1029 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_sdq_ops);
1030 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_cq_ops);
1031 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_eq_ops);
1032 }
1033 
1034 static void
1035 mlxsw_pci_config_profile_swid_config(struct mlxsw_pci *mlxsw_pci,
1036 				     char *mbox, int index,
1037 				     const struct mlxsw_swid_config *swid)
1038 {
1039 	u8 mask = 0;
1040 
1041 	if (swid->used_type) {
1042 		mlxsw_cmd_mbox_config_profile_swid_config_type_set(
1043 			mbox, index, swid->type);
1044 		mask |= 1;
1045 	}
1046 	if (swid->used_properties) {
1047 		mlxsw_cmd_mbox_config_profile_swid_config_properties_set(
1048 			mbox, index, swid->properties);
1049 		mask |= 2;
1050 	}
1051 	mlxsw_cmd_mbox_config_profile_swid_config_mask_set(mbox, index, mask);
1052 }
1053 
1054 static int
1055 mlxsw_pci_profile_get_kvd_sizes(const struct mlxsw_pci *mlxsw_pci,
1056 				const struct mlxsw_config_profile *profile,
1057 				struct mlxsw_res *res)
1058 {
1059 	u64 single_size, double_size, linear_size;
1060 	int err;
1061 
1062 	err = mlxsw_core_kvd_sizes_get(mlxsw_pci->core, profile,
1063 				       &single_size, &double_size,
1064 				       &linear_size);
1065 	if (err)
1066 		return err;
1067 
1068 	MLXSW_RES_SET(res, KVD_SINGLE_SIZE, single_size);
1069 	MLXSW_RES_SET(res, KVD_DOUBLE_SIZE, double_size);
1070 	MLXSW_RES_SET(res, KVD_LINEAR_SIZE, linear_size);
1071 
1072 	return 0;
1073 }
1074 
1075 static int mlxsw_pci_config_profile(struct mlxsw_pci *mlxsw_pci, char *mbox,
1076 				    const struct mlxsw_config_profile *profile,
1077 				    struct mlxsw_res *res)
1078 {
1079 	int i;
1080 	int err;
1081 
1082 	mlxsw_cmd_mbox_zero(mbox);
1083 
1084 	if (profile->used_max_vepa_channels) {
1085 		mlxsw_cmd_mbox_config_profile_set_max_vepa_channels_set(
1086 			mbox, 1);
1087 		mlxsw_cmd_mbox_config_profile_max_vepa_channels_set(
1088 			mbox, profile->max_vepa_channels);
1089 	}
1090 	if (profile->used_max_mid) {
1091 		mlxsw_cmd_mbox_config_profile_set_max_mid_set(
1092 			mbox, 1);
1093 		mlxsw_cmd_mbox_config_profile_max_mid_set(
1094 			mbox, profile->max_mid);
1095 	}
1096 	if (profile->used_max_pgt) {
1097 		mlxsw_cmd_mbox_config_profile_set_max_pgt_set(
1098 			mbox, 1);
1099 		mlxsw_cmd_mbox_config_profile_max_pgt_set(
1100 			mbox, profile->max_pgt);
1101 	}
1102 	if (profile->used_max_system_port) {
1103 		mlxsw_cmd_mbox_config_profile_set_max_system_port_set(
1104 			mbox, 1);
1105 		mlxsw_cmd_mbox_config_profile_max_system_port_set(
1106 			mbox, profile->max_system_port);
1107 	}
1108 	if (profile->used_max_vlan_groups) {
1109 		mlxsw_cmd_mbox_config_profile_set_max_vlan_groups_set(
1110 			mbox, 1);
1111 		mlxsw_cmd_mbox_config_profile_max_vlan_groups_set(
1112 			mbox, profile->max_vlan_groups);
1113 	}
1114 	if (profile->used_max_regions) {
1115 		mlxsw_cmd_mbox_config_profile_set_max_regions_set(
1116 			mbox, 1);
1117 		mlxsw_cmd_mbox_config_profile_max_regions_set(
1118 			mbox, profile->max_regions);
1119 	}
1120 	if (profile->used_flood_tables) {
1121 		mlxsw_cmd_mbox_config_profile_set_flood_tables_set(
1122 			mbox, 1);
1123 		mlxsw_cmd_mbox_config_profile_max_flood_tables_set(
1124 			mbox, profile->max_flood_tables);
1125 		mlxsw_cmd_mbox_config_profile_max_vid_flood_tables_set(
1126 			mbox, profile->max_vid_flood_tables);
1127 		mlxsw_cmd_mbox_config_profile_max_fid_offset_flood_tables_set(
1128 			mbox, profile->max_fid_offset_flood_tables);
1129 		mlxsw_cmd_mbox_config_profile_fid_offset_flood_table_size_set(
1130 			mbox, profile->fid_offset_flood_table_size);
1131 		mlxsw_cmd_mbox_config_profile_max_fid_flood_tables_set(
1132 			mbox, profile->max_fid_flood_tables);
1133 		mlxsw_cmd_mbox_config_profile_fid_flood_table_size_set(
1134 			mbox, profile->fid_flood_table_size);
1135 	}
1136 	if (profile->used_flood_mode) {
1137 		mlxsw_cmd_mbox_config_profile_set_flood_mode_set(
1138 			mbox, 1);
1139 		mlxsw_cmd_mbox_config_profile_flood_mode_set(
1140 			mbox, profile->flood_mode);
1141 	}
1142 	if (profile->used_max_ib_mc) {
1143 		mlxsw_cmd_mbox_config_profile_set_max_ib_mc_set(
1144 			mbox, 1);
1145 		mlxsw_cmd_mbox_config_profile_max_ib_mc_set(
1146 			mbox, profile->max_ib_mc);
1147 	}
1148 	if (profile->used_max_pkey) {
1149 		mlxsw_cmd_mbox_config_profile_set_max_pkey_set(
1150 			mbox, 1);
1151 		mlxsw_cmd_mbox_config_profile_max_pkey_set(
1152 			mbox, profile->max_pkey);
1153 	}
1154 	if (profile->used_ar_sec) {
1155 		mlxsw_cmd_mbox_config_profile_set_ar_sec_set(
1156 			mbox, 1);
1157 		mlxsw_cmd_mbox_config_profile_ar_sec_set(
1158 			mbox, profile->ar_sec);
1159 	}
1160 	if (profile->used_adaptive_routing_group_cap) {
1161 		mlxsw_cmd_mbox_config_profile_set_adaptive_routing_group_cap_set(
1162 			mbox, 1);
1163 		mlxsw_cmd_mbox_config_profile_adaptive_routing_group_cap_set(
1164 			mbox, profile->adaptive_routing_group_cap);
1165 	}
1166 	if (profile->used_kvd_sizes && MLXSW_RES_VALID(res, KVD_SIZE)) {
1167 		err = mlxsw_pci_profile_get_kvd_sizes(mlxsw_pci, profile, res);
1168 		if (err)
1169 			return err;
1170 
1171 		mlxsw_cmd_mbox_config_profile_set_kvd_linear_size_set(mbox, 1);
1172 		mlxsw_cmd_mbox_config_profile_kvd_linear_size_set(mbox,
1173 					MLXSW_RES_GET(res, KVD_LINEAR_SIZE));
1174 		mlxsw_cmd_mbox_config_profile_set_kvd_hash_single_size_set(mbox,
1175 									   1);
1176 		mlxsw_cmd_mbox_config_profile_kvd_hash_single_size_set(mbox,
1177 					MLXSW_RES_GET(res, KVD_SINGLE_SIZE));
1178 		mlxsw_cmd_mbox_config_profile_set_kvd_hash_double_size_set(
1179 								mbox, 1);
1180 		mlxsw_cmd_mbox_config_profile_kvd_hash_double_size_set(mbox,
1181 					MLXSW_RES_GET(res, KVD_DOUBLE_SIZE));
1182 	}
1183 
1184 	for (i = 0; i < MLXSW_CONFIG_PROFILE_SWID_COUNT; i++)
1185 		mlxsw_pci_config_profile_swid_config(mlxsw_pci, mbox, i,
1186 						     &profile->swid_config[i]);
1187 
1188 	if (mlxsw_pci->max_cqe_ver > MLXSW_PCI_CQE_V0) {
1189 		mlxsw_cmd_mbox_config_profile_set_cqe_version_set(mbox, 1);
1190 		mlxsw_cmd_mbox_config_profile_cqe_version_set(mbox, 1);
1191 	}
1192 
1193 	return mlxsw_cmd_config_profile_set(mlxsw_pci->core, mbox);
1194 }
1195 
1196 static int mlxsw_pci_boardinfo(struct mlxsw_pci *mlxsw_pci, char *mbox)
1197 {
1198 	struct mlxsw_bus_info *bus_info = &mlxsw_pci->bus_info;
1199 	int err;
1200 
1201 	mlxsw_cmd_mbox_zero(mbox);
1202 	err = mlxsw_cmd_boardinfo(mlxsw_pci->core, mbox);
1203 	if (err)
1204 		return err;
1205 	mlxsw_cmd_mbox_boardinfo_vsd_memcpy_from(mbox, bus_info->vsd);
1206 	mlxsw_cmd_mbox_boardinfo_psid_memcpy_from(mbox, bus_info->psid);
1207 	return 0;
1208 }
1209 
1210 static int mlxsw_pci_fw_area_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
1211 				  u16 num_pages)
1212 {
1213 	struct mlxsw_pci_mem_item *mem_item;
1214 	int nent = 0;
1215 	int i;
1216 	int err;
1217 
1218 	mlxsw_pci->fw_area.items = kcalloc(num_pages, sizeof(*mem_item),
1219 					   GFP_KERNEL);
1220 	if (!mlxsw_pci->fw_area.items)
1221 		return -ENOMEM;
1222 	mlxsw_pci->fw_area.count = num_pages;
1223 
1224 	mlxsw_cmd_mbox_zero(mbox);
1225 	for (i = 0; i < num_pages; i++) {
1226 		mem_item = &mlxsw_pci->fw_area.items[i];
1227 
1228 		mem_item->size = MLXSW_PCI_PAGE_SIZE;
1229 		mem_item->buf = pci_alloc_consistent(mlxsw_pci->pdev,
1230 						     mem_item->size,
1231 						     &mem_item->mapaddr);
1232 		if (!mem_item->buf) {
1233 			err = -ENOMEM;
1234 			goto err_alloc;
1235 		}
1236 		mlxsw_cmd_mbox_map_fa_pa_set(mbox, nent, mem_item->mapaddr);
1237 		mlxsw_cmd_mbox_map_fa_log2size_set(mbox, nent, 0); /* 1 page */
1238 		if (++nent == MLXSW_CMD_MAP_FA_VPM_ENTRIES_MAX) {
1239 			err = mlxsw_cmd_map_fa(mlxsw_pci->core, mbox, nent);
1240 			if (err)
1241 				goto err_cmd_map_fa;
1242 			nent = 0;
1243 			mlxsw_cmd_mbox_zero(mbox);
1244 		}
1245 	}
1246 
1247 	if (nent) {
1248 		err = mlxsw_cmd_map_fa(mlxsw_pci->core, mbox, nent);
1249 		if (err)
1250 			goto err_cmd_map_fa;
1251 	}
1252 
1253 	return 0;
1254 
1255 err_cmd_map_fa:
1256 err_alloc:
1257 	for (i--; i >= 0; i--) {
1258 		mem_item = &mlxsw_pci->fw_area.items[i];
1259 
1260 		pci_free_consistent(mlxsw_pci->pdev, mem_item->size,
1261 				    mem_item->buf, mem_item->mapaddr);
1262 	}
1263 	kfree(mlxsw_pci->fw_area.items);
1264 	return err;
1265 }
1266 
1267 static void mlxsw_pci_fw_area_fini(struct mlxsw_pci *mlxsw_pci)
1268 {
1269 	struct mlxsw_pci_mem_item *mem_item;
1270 	int i;
1271 
1272 	mlxsw_cmd_unmap_fa(mlxsw_pci->core);
1273 
1274 	for (i = 0; i < mlxsw_pci->fw_area.count; i++) {
1275 		mem_item = &mlxsw_pci->fw_area.items[i];
1276 
1277 		pci_free_consistent(mlxsw_pci->pdev, mem_item->size,
1278 				    mem_item->buf, mem_item->mapaddr);
1279 	}
1280 	kfree(mlxsw_pci->fw_area.items);
1281 }
1282 
1283 static irqreturn_t mlxsw_pci_eq_irq_handler(int irq, void *dev_id)
1284 {
1285 	struct mlxsw_pci *mlxsw_pci = dev_id;
1286 	struct mlxsw_pci_queue *q;
1287 	int i;
1288 
1289 	for (i = 0; i < MLXSW_PCI_EQS_COUNT; i++) {
1290 		q = mlxsw_pci_eq_get(mlxsw_pci, i);
1291 		mlxsw_pci_queue_tasklet_schedule(q);
1292 	}
1293 	return IRQ_HANDLED;
1294 }
1295 
1296 static int mlxsw_pci_mbox_alloc(struct mlxsw_pci *mlxsw_pci,
1297 				struct mlxsw_pci_mem_item *mbox)
1298 {
1299 	struct pci_dev *pdev = mlxsw_pci->pdev;
1300 	int err = 0;
1301 
1302 	mbox->size = MLXSW_CMD_MBOX_SIZE;
1303 	mbox->buf = pci_alloc_consistent(pdev, MLXSW_CMD_MBOX_SIZE,
1304 					 &mbox->mapaddr);
1305 	if (!mbox->buf) {
1306 		dev_err(&pdev->dev, "Failed allocating memory for mailbox\n");
1307 		err = -ENOMEM;
1308 	}
1309 
1310 	return err;
1311 }
1312 
1313 static void mlxsw_pci_mbox_free(struct mlxsw_pci *mlxsw_pci,
1314 				struct mlxsw_pci_mem_item *mbox)
1315 {
1316 	struct pci_dev *pdev = mlxsw_pci->pdev;
1317 
1318 	pci_free_consistent(pdev, MLXSW_CMD_MBOX_SIZE, mbox->buf,
1319 			    mbox->mapaddr);
1320 }
1321 
1322 static int mlxsw_pci_sw_reset(struct mlxsw_pci *mlxsw_pci,
1323 			      const struct pci_device_id *id)
1324 {
1325 	unsigned long end;
1326 	char mrsr_pl[MLXSW_REG_MRSR_LEN];
1327 	int err;
1328 
1329 	mlxsw_reg_mrsr_pack(mrsr_pl);
1330 	err = mlxsw_reg_write(mlxsw_pci->core, MLXSW_REG(mrsr), mrsr_pl);
1331 	if (err)
1332 		return err;
1333 	if (id->device == PCI_DEVICE_ID_MELLANOX_SWITCHX2) {
1334 		msleep(MLXSW_PCI_SW_RESET_TIMEOUT_MSECS);
1335 		return 0;
1336 	}
1337 
1338 	/* We must wait for the HW to become responsive once again. */
1339 	msleep(MLXSW_PCI_SW_RESET_WAIT_MSECS);
1340 
1341 	end = jiffies + msecs_to_jiffies(MLXSW_PCI_SW_RESET_TIMEOUT_MSECS);
1342 	do {
1343 		u32 val = mlxsw_pci_read32(mlxsw_pci, FW_READY);
1344 
1345 		if ((val & MLXSW_PCI_FW_READY_MASK) == MLXSW_PCI_FW_READY_MAGIC)
1346 			return 0;
1347 		cond_resched();
1348 	} while (time_before(jiffies, end));
1349 	return -EBUSY;
1350 }
1351 
1352 static int mlxsw_pci_alloc_irq_vectors(struct mlxsw_pci *mlxsw_pci)
1353 {
1354 	int err;
1355 
1356 	err = pci_alloc_irq_vectors(mlxsw_pci->pdev, 1, 1, PCI_IRQ_MSIX);
1357 	if (err < 0)
1358 		dev_err(&mlxsw_pci->pdev->dev, "MSI-X init failed\n");
1359 	return err;
1360 }
1361 
1362 static void mlxsw_pci_free_irq_vectors(struct mlxsw_pci *mlxsw_pci)
1363 {
1364 	pci_free_irq_vectors(mlxsw_pci->pdev);
1365 }
1366 
1367 static int mlxsw_pci_init(void *bus_priv, struct mlxsw_core *mlxsw_core,
1368 			  const struct mlxsw_config_profile *profile,
1369 			  struct mlxsw_res *res)
1370 {
1371 	struct mlxsw_pci *mlxsw_pci = bus_priv;
1372 	struct pci_dev *pdev = mlxsw_pci->pdev;
1373 	char *mbox;
1374 	u16 num_pages;
1375 	int err;
1376 
1377 	mutex_init(&mlxsw_pci->cmd.lock);
1378 	init_waitqueue_head(&mlxsw_pci->cmd.wait);
1379 
1380 	mlxsw_pci->core = mlxsw_core;
1381 
1382 	mbox = mlxsw_cmd_mbox_alloc();
1383 	if (!mbox)
1384 		return -ENOMEM;
1385 
1386 	err = mlxsw_pci_mbox_alloc(mlxsw_pci, &mlxsw_pci->cmd.in_mbox);
1387 	if (err)
1388 		goto mbox_put;
1389 
1390 	err = mlxsw_pci_mbox_alloc(mlxsw_pci, &mlxsw_pci->cmd.out_mbox);
1391 	if (err)
1392 		goto err_out_mbox_alloc;
1393 
1394 	err = mlxsw_pci_sw_reset(mlxsw_pci, mlxsw_pci->id);
1395 	if (err)
1396 		goto err_sw_reset;
1397 
1398 	err = mlxsw_pci_alloc_irq_vectors(mlxsw_pci);
1399 	if (err < 0) {
1400 		dev_err(&pdev->dev, "MSI-X init failed\n");
1401 		goto err_alloc_irq;
1402 	}
1403 
1404 	err = mlxsw_cmd_query_fw(mlxsw_core, mbox);
1405 	if (err)
1406 		goto err_query_fw;
1407 
1408 	mlxsw_pci->bus_info.fw_rev.major =
1409 		mlxsw_cmd_mbox_query_fw_fw_rev_major_get(mbox);
1410 	mlxsw_pci->bus_info.fw_rev.minor =
1411 		mlxsw_cmd_mbox_query_fw_fw_rev_minor_get(mbox);
1412 	mlxsw_pci->bus_info.fw_rev.subminor =
1413 		mlxsw_cmd_mbox_query_fw_fw_rev_subminor_get(mbox);
1414 
1415 	if (mlxsw_cmd_mbox_query_fw_cmd_interface_rev_get(mbox) != 1) {
1416 		dev_err(&pdev->dev, "Unsupported cmd interface revision ID queried from hw\n");
1417 		err = -EINVAL;
1418 		goto err_iface_rev;
1419 	}
1420 	if (mlxsw_cmd_mbox_query_fw_doorbell_page_bar_get(mbox) != 0) {
1421 		dev_err(&pdev->dev, "Unsupported doorbell page bar queried from hw\n");
1422 		err = -EINVAL;
1423 		goto err_doorbell_page_bar;
1424 	}
1425 
1426 	mlxsw_pci->doorbell_offset =
1427 		mlxsw_cmd_mbox_query_fw_doorbell_page_offset_get(mbox);
1428 
1429 	if (mlxsw_cmd_mbox_query_fw_fr_rn_clk_bar_get(mbox) != 0) {
1430 		dev_err(&pdev->dev, "Unsupported free running clock BAR queried from hw\n");
1431 		err = -EINVAL;
1432 		goto err_fr_rn_clk_bar;
1433 	}
1434 
1435 	mlxsw_pci->free_running_clock_offset =
1436 		mlxsw_cmd_mbox_query_fw_free_running_clock_offset_get(mbox);
1437 
1438 	num_pages = mlxsw_cmd_mbox_query_fw_fw_pages_get(mbox);
1439 	err = mlxsw_pci_fw_area_init(mlxsw_pci, mbox, num_pages);
1440 	if (err)
1441 		goto err_fw_area_init;
1442 
1443 	err = mlxsw_pci_boardinfo(mlxsw_pci, mbox);
1444 	if (err)
1445 		goto err_boardinfo;
1446 
1447 	err = mlxsw_core_resources_query(mlxsw_core, mbox, res);
1448 	if (err)
1449 		goto err_query_resources;
1450 
1451 	if (MLXSW_CORE_RES_VALID(mlxsw_core, CQE_V2) &&
1452 	    MLXSW_CORE_RES_GET(mlxsw_core, CQE_V2))
1453 		mlxsw_pci->max_cqe_ver = MLXSW_PCI_CQE_V2;
1454 	else if (MLXSW_CORE_RES_VALID(mlxsw_core, CQE_V1) &&
1455 		 MLXSW_CORE_RES_GET(mlxsw_core, CQE_V1))
1456 		mlxsw_pci->max_cqe_ver = MLXSW_PCI_CQE_V1;
1457 	else if ((MLXSW_CORE_RES_VALID(mlxsw_core, CQE_V0) &&
1458 		  MLXSW_CORE_RES_GET(mlxsw_core, CQE_V0)) ||
1459 		 !MLXSW_CORE_RES_VALID(mlxsw_core, CQE_V0)) {
1460 		mlxsw_pci->max_cqe_ver = MLXSW_PCI_CQE_V0;
1461 	} else {
1462 		dev_err(&pdev->dev, "Invalid supported CQE version combination reported\n");
1463 		goto err_cqe_v_check;
1464 	}
1465 
1466 	err = mlxsw_pci_config_profile(mlxsw_pci, mbox, profile, res);
1467 	if (err)
1468 		goto err_config_profile;
1469 
1470 	err = mlxsw_pci_aqs_init(mlxsw_pci, mbox);
1471 	if (err)
1472 		goto err_aqs_init;
1473 
1474 	err = request_irq(pci_irq_vector(pdev, 0),
1475 			  mlxsw_pci_eq_irq_handler, 0,
1476 			  mlxsw_pci->bus_info.device_kind, mlxsw_pci);
1477 	if (err) {
1478 		dev_err(&pdev->dev, "IRQ request failed\n");
1479 		goto err_request_eq_irq;
1480 	}
1481 
1482 	goto mbox_put;
1483 
1484 err_request_eq_irq:
1485 	mlxsw_pci_aqs_fini(mlxsw_pci);
1486 err_aqs_init:
1487 err_config_profile:
1488 err_cqe_v_check:
1489 err_query_resources:
1490 err_boardinfo:
1491 	mlxsw_pci_fw_area_fini(mlxsw_pci);
1492 err_fw_area_init:
1493 err_fr_rn_clk_bar:
1494 err_doorbell_page_bar:
1495 err_iface_rev:
1496 err_query_fw:
1497 	mlxsw_pci_free_irq_vectors(mlxsw_pci);
1498 err_alloc_irq:
1499 err_sw_reset:
1500 	mlxsw_pci_mbox_free(mlxsw_pci, &mlxsw_pci->cmd.out_mbox);
1501 err_out_mbox_alloc:
1502 	mlxsw_pci_mbox_free(mlxsw_pci, &mlxsw_pci->cmd.in_mbox);
1503 mbox_put:
1504 	mlxsw_cmd_mbox_free(mbox);
1505 	return err;
1506 }
1507 
1508 static void mlxsw_pci_fini(void *bus_priv)
1509 {
1510 	struct mlxsw_pci *mlxsw_pci = bus_priv;
1511 
1512 	free_irq(pci_irq_vector(mlxsw_pci->pdev, 0), mlxsw_pci);
1513 	mlxsw_pci_aqs_fini(mlxsw_pci);
1514 	mlxsw_pci_fw_area_fini(mlxsw_pci);
1515 	mlxsw_pci_free_irq_vectors(mlxsw_pci);
1516 	mlxsw_pci_mbox_free(mlxsw_pci, &mlxsw_pci->cmd.out_mbox);
1517 	mlxsw_pci_mbox_free(mlxsw_pci, &mlxsw_pci->cmd.in_mbox);
1518 }
1519 
1520 static struct mlxsw_pci_queue *
1521 mlxsw_pci_sdq_pick(struct mlxsw_pci *mlxsw_pci,
1522 		   const struct mlxsw_tx_info *tx_info)
1523 {
1524 	u8 sdqn = tx_info->local_port % mlxsw_pci_sdq_count(mlxsw_pci);
1525 
1526 	return mlxsw_pci_sdq_get(mlxsw_pci, sdqn);
1527 }
1528 
1529 static bool mlxsw_pci_skb_transmit_busy(void *bus_priv,
1530 					const struct mlxsw_tx_info *tx_info)
1531 {
1532 	struct mlxsw_pci *mlxsw_pci = bus_priv;
1533 	struct mlxsw_pci_queue *q = mlxsw_pci_sdq_pick(mlxsw_pci, tx_info);
1534 
1535 	return !mlxsw_pci_queue_elem_info_producer_get(q);
1536 }
1537 
1538 static int mlxsw_pci_skb_transmit(void *bus_priv, struct sk_buff *skb,
1539 				  const struct mlxsw_tx_info *tx_info)
1540 {
1541 	struct mlxsw_pci *mlxsw_pci = bus_priv;
1542 	struct mlxsw_pci_queue *q;
1543 	struct mlxsw_pci_queue_elem_info *elem_info;
1544 	char *wqe;
1545 	int i;
1546 	int err;
1547 
1548 	if (skb_shinfo(skb)->nr_frags > MLXSW_PCI_WQE_SG_ENTRIES - 1) {
1549 		err = skb_linearize(skb);
1550 		if (err)
1551 			return err;
1552 	}
1553 
1554 	q = mlxsw_pci_sdq_pick(mlxsw_pci, tx_info);
1555 	spin_lock_bh(&q->lock);
1556 	elem_info = mlxsw_pci_queue_elem_info_producer_get(q);
1557 	if (!elem_info) {
1558 		/* queue is full */
1559 		err = -EAGAIN;
1560 		goto unlock;
1561 	}
1562 	mlxsw_skb_cb(skb)->tx_info = *tx_info;
1563 	elem_info->u.sdq.skb = skb;
1564 
1565 	wqe = elem_info->elem;
1566 	mlxsw_pci_wqe_c_set(wqe, 1); /* always report completion */
1567 	mlxsw_pci_wqe_lp_set(wqe, !!tx_info->is_emad);
1568 	mlxsw_pci_wqe_type_set(wqe, MLXSW_PCI_WQE_TYPE_ETHERNET);
1569 
1570 	err = mlxsw_pci_wqe_frag_map(mlxsw_pci, wqe, 0, skb->data,
1571 				     skb_headlen(skb), DMA_TO_DEVICE);
1572 	if (err)
1573 		goto unlock;
1574 
1575 	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
1576 		const skb_frag_t *frag = &skb_shinfo(skb)->frags[i];
1577 
1578 		err = mlxsw_pci_wqe_frag_map(mlxsw_pci, wqe, i + 1,
1579 					     skb_frag_address(frag),
1580 					     skb_frag_size(frag),
1581 					     DMA_TO_DEVICE);
1582 		if (err)
1583 			goto unmap_frags;
1584 	}
1585 
1586 	if (unlikely(skb_shinfo(skb)->tx_flags & SKBTX_HW_TSTAMP))
1587 		skb_shinfo(skb)->tx_flags |= SKBTX_IN_PROGRESS;
1588 
1589 	/* Set unused sq entries byte count to zero. */
1590 	for (i++; i < MLXSW_PCI_WQE_SG_ENTRIES; i++)
1591 		mlxsw_pci_wqe_byte_count_set(wqe, i, 0);
1592 
1593 	/* Everything is set up, ring producer doorbell to get HW going */
1594 	q->producer_counter++;
1595 	mlxsw_pci_queue_doorbell_producer_ring(mlxsw_pci, q);
1596 
1597 	goto unlock;
1598 
1599 unmap_frags:
1600 	for (; i >= 0; i--)
1601 		mlxsw_pci_wqe_frag_unmap(mlxsw_pci, wqe, i, DMA_TO_DEVICE);
1602 unlock:
1603 	spin_unlock_bh(&q->lock);
1604 	return err;
1605 }
1606 
1607 static int mlxsw_pci_cmd_exec(void *bus_priv, u16 opcode, u8 opcode_mod,
1608 			      u32 in_mod, bool out_mbox_direct,
1609 			      char *in_mbox, size_t in_mbox_size,
1610 			      char *out_mbox, size_t out_mbox_size,
1611 			      u8 *p_status)
1612 {
1613 	struct mlxsw_pci *mlxsw_pci = bus_priv;
1614 	dma_addr_t in_mapaddr = 0, out_mapaddr = 0;
1615 	bool evreq = mlxsw_pci->cmd.nopoll;
1616 	unsigned long timeout = msecs_to_jiffies(MLXSW_PCI_CIR_TIMEOUT_MSECS);
1617 	bool *p_wait_done = &mlxsw_pci->cmd.wait_done;
1618 	int err;
1619 
1620 	*p_status = MLXSW_CMD_STATUS_OK;
1621 
1622 	err = mutex_lock_interruptible(&mlxsw_pci->cmd.lock);
1623 	if (err)
1624 		return err;
1625 
1626 	if (in_mbox) {
1627 		memcpy(mlxsw_pci->cmd.in_mbox.buf, in_mbox, in_mbox_size);
1628 		in_mapaddr = mlxsw_pci->cmd.in_mbox.mapaddr;
1629 	}
1630 	mlxsw_pci_write32(mlxsw_pci, CIR_IN_PARAM_HI, upper_32_bits(in_mapaddr));
1631 	mlxsw_pci_write32(mlxsw_pci, CIR_IN_PARAM_LO, lower_32_bits(in_mapaddr));
1632 
1633 	if (out_mbox)
1634 		out_mapaddr = mlxsw_pci->cmd.out_mbox.mapaddr;
1635 	mlxsw_pci_write32(mlxsw_pci, CIR_OUT_PARAM_HI, upper_32_bits(out_mapaddr));
1636 	mlxsw_pci_write32(mlxsw_pci, CIR_OUT_PARAM_LO, lower_32_bits(out_mapaddr));
1637 
1638 	mlxsw_pci_write32(mlxsw_pci, CIR_IN_MODIFIER, in_mod);
1639 	mlxsw_pci_write32(mlxsw_pci, CIR_TOKEN, 0);
1640 
1641 	*p_wait_done = false;
1642 
1643 	wmb(); /* all needs to be written before we write control register */
1644 	mlxsw_pci_write32(mlxsw_pci, CIR_CTRL,
1645 			  MLXSW_PCI_CIR_CTRL_GO_BIT |
1646 			  (evreq ? MLXSW_PCI_CIR_CTRL_EVREQ_BIT : 0) |
1647 			  (opcode_mod << MLXSW_PCI_CIR_CTRL_OPCODE_MOD_SHIFT) |
1648 			  opcode);
1649 
1650 	if (!evreq) {
1651 		unsigned long end;
1652 
1653 		end = jiffies + timeout;
1654 		do {
1655 			u32 ctrl = mlxsw_pci_read32(mlxsw_pci, CIR_CTRL);
1656 
1657 			if (!(ctrl & MLXSW_PCI_CIR_CTRL_GO_BIT)) {
1658 				*p_wait_done = true;
1659 				*p_status = ctrl >> MLXSW_PCI_CIR_CTRL_STATUS_SHIFT;
1660 				break;
1661 			}
1662 			cond_resched();
1663 		} while (time_before(jiffies, end));
1664 	} else {
1665 		wait_event_timeout(mlxsw_pci->cmd.wait, *p_wait_done, timeout);
1666 		*p_status = mlxsw_pci->cmd.comp.status;
1667 	}
1668 
1669 	err = 0;
1670 	if (*p_wait_done) {
1671 		if (*p_status)
1672 			err = -EIO;
1673 	} else {
1674 		err = -ETIMEDOUT;
1675 	}
1676 
1677 	if (!err && out_mbox && out_mbox_direct) {
1678 		/* Some commands don't use output param as address to mailbox
1679 		 * but they store output directly into registers. In that case,
1680 		 * copy registers into mbox buffer.
1681 		 */
1682 		__be32 tmp;
1683 
1684 		if (!evreq) {
1685 			tmp = cpu_to_be32(mlxsw_pci_read32(mlxsw_pci,
1686 							   CIR_OUT_PARAM_HI));
1687 			memcpy(out_mbox, &tmp, sizeof(tmp));
1688 			tmp = cpu_to_be32(mlxsw_pci_read32(mlxsw_pci,
1689 							   CIR_OUT_PARAM_LO));
1690 			memcpy(out_mbox + sizeof(tmp), &tmp, sizeof(tmp));
1691 		}
1692 	} else if (!err && out_mbox) {
1693 		memcpy(out_mbox, mlxsw_pci->cmd.out_mbox.buf, out_mbox_size);
1694 	}
1695 
1696 	mutex_unlock(&mlxsw_pci->cmd.lock);
1697 
1698 	return err;
1699 }
1700 
1701 static u32 mlxsw_pci_read_frc_h(void *bus_priv)
1702 {
1703 	struct mlxsw_pci *mlxsw_pci = bus_priv;
1704 	u64 frc_offset;
1705 
1706 	frc_offset = mlxsw_pci->free_running_clock_offset;
1707 	return mlxsw_pci_read32(mlxsw_pci, FREE_RUNNING_CLOCK_H(frc_offset));
1708 }
1709 
1710 static u32 mlxsw_pci_read_frc_l(void *bus_priv)
1711 {
1712 	struct mlxsw_pci *mlxsw_pci = bus_priv;
1713 	u64 frc_offset;
1714 
1715 	frc_offset = mlxsw_pci->free_running_clock_offset;
1716 	return mlxsw_pci_read32(mlxsw_pci, FREE_RUNNING_CLOCK_L(frc_offset));
1717 }
1718 
1719 static const struct mlxsw_bus mlxsw_pci_bus = {
1720 	.kind			= "pci",
1721 	.init			= mlxsw_pci_init,
1722 	.fini			= mlxsw_pci_fini,
1723 	.skb_transmit_busy	= mlxsw_pci_skb_transmit_busy,
1724 	.skb_transmit		= mlxsw_pci_skb_transmit,
1725 	.cmd_exec		= mlxsw_pci_cmd_exec,
1726 	.read_frc_h		= mlxsw_pci_read_frc_h,
1727 	.read_frc_l		= mlxsw_pci_read_frc_l,
1728 	.features		= MLXSW_BUS_F_TXRX | MLXSW_BUS_F_RESET,
1729 };
1730 
1731 static int mlxsw_pci_probe(struct pci_dev *pdev, const struct pci_device_id *id)
1732 {
1733 	const char *driver_name = pdev->driver->name;
1734 	struct mlxsw_pci *mlxsw_pci;
1735 	int err;
1736 
1737 	mlxsw_pci = kzalloc(sizeof(*mlxsw_pci), GFP_KERNEL);
1738 	if (!mlxsw_pci)
1739 		return -ENOMEM;
1740 
1741 	err = pci_enable_device(pdev);
1742 	if (err) {
1743 		dev_err(&pdev->dev, "pci_enable_device failed\n");
1744 		goto err_pci_enable_device;
1745 	}
1746 
1747 	err = pci_request_regions(pdev, driver_name);
1748 	if (err) {
1749 		dev_err(&pdev->dev, "pci_request_regions failed\n");
1750 		goto err_pci_request_regions;
1751 	}
1752 
1753 	err = pci_set_dma_mask(pdev, DMA_BIT_MASK(64));
1754 	if (!err) {
1755 		err = pci_set_consistent_dma_mask(pdev, DMA_BIT_MASK(64));
1756 		if (err) {
1757 			dev_err(&pdev->dev, "pci_set_consistent_dma_mask failed\n");
1758 			goto err_pci_set_dma_mask;
1759 		}
1760 	} else {
1761 		err = pci_set_dma_mask(pdev, DMA_BIT_MASK(32));
1762 		if (err) {
1763 			dev_err(&pdev->dev, "pci_set_dma_mask failed\n");
1764 			goto err_pci_set_dma_mask;
1765 		}
1766 	}
1767 
1768 	if (pci_resource_len(pdev, 0) < MLXSW_PCI_BAR0_SIZE) {
1769 		dev_err(&pdev->dev, "invalid PCI region size\n");
1770 		err = -EINVAL;
1771 		goto err_pci_resource_len_check;
1772 	}
1773 
1774 	mlxsw_pci->hw_addr = ioremap(pci_resource_start(pdev, 0),
1775 				     pci_resource_len(pdev, 0));
1776 	if (!mlxsw_pci->hw_addr) {
1777 		dev_err(&pdev->dev, "ioremap failed\n");
1778 		err = -EIO;
1779 		goto err_ioremap;
1780 	}
1781 	pci_set_master(pdev);
1782 
1783 	mlxsw_pci->pdev = pdev;
1784 	pci_set_drvdata(pdev, mlxsw_pci);
1785 
1786 	mlxsw_pci->bus_info.device_kind = driver_name;
1787 	mlxsw_pci->bus_info.device_name = pci_name(mlxsw_pci->pdev);
1788 	mlxsw_pci->bus_info.dev = &pdev->dev;
1789 	mlxsw_pci->bus_info.read_frc_capable = true;
1790 	mlxsw_pci->id = id;
1791 
1792 	err = mlxsw_core_bus_device_register(&mlxsw_pci->bus_info,
1793 					     &mlxsw_pci_bus, mlxsw_pci, false,
1794 					     NULL);
1795 	if (err) {
1796 		dev_err(&pdev->dev, "cannot register bus device\n");
1797 		goto err_bus_device_register;
1798 	}
1799 
1800 	return 0;
1801 
1802 err_bus_device_register:
1803 	iounmap(mlxsw_pci->hw_addr);
1804 err_ioremap:
1805 err_pci_resource_len_check:
1806 err_pci_set_dma_mask:
1807 	pci_release_regions(pdev);
1808 err_pci_request_regions:
1809 	pci_disable_device(pdev);
1810 err_pci_enable_device:
1811 	kfree(mlxsw_pci);
1812 	return err;
1813 }
1814 
1815 static void mlxsw_pci_remove(struct pci_dev *pdev)
1816 {
1817 	struct mlxsw_pci *mlxsw_pci = pci_get_drvdata(pdev);
1818 
1819 	mlxsw_core_bus_device_unregister(mlxsw_pci->core, false);
1820 	iounmap(mlxsw_pci->hw_addr);
1821 	pci_release_regions(mlxsw_pci->pdev);
1822 	pci_disable_device(mlxsw_pci->pdev);
1823 	kfree(mlxsw_pci);
1824 }
1825 
1826 int mlxsw_pci_driver_register(struct pci_driver *pci_driver)
1827 {
1828 	pci_driver->probe = mlxsw_pci_probe;
1829 	pci_driver->remove = mlxsw_pci_remove;
1830 	return pci_register_driver(pci_driver);
1831 }
1832 EXPORT_SYMBOL(mlxsw_pci_driver_register);
1833 
1834 void mlxsw_pci_driver_unregister(struct pci_driver *pci_driver)
1835 {
1836 	pci_unregister_driver(pci_driver);
1837 }
1838 EXPORT_SYMBOL(mlxsw_pci_driver_unregister);
1839 
1840 static int __init mlxsw_pci_module_init(void)
1841 {
1842 	return 0;
1843 }
1844 
1845 static void __exit mlxsw_pci_module_exit(void)
1846 {
1847 }
1848 
1849 module_init(mlxsw_pci_module_init);
1850 module_exit(mlxsw_pci_module_exit);
1851 
1852 MODULE_LICENSE("Dual BSD/GPL");
1853 MODULE_AUTHOR("Jiri Pirko <jiri@mellanox.com>");
1854 MODULE_DESCRIPTION("Mellanox switch PCI interface driver");
1855