1 /*
2  * drivers/net/ethernet/mellanox/mlxsw/pci.c
3  * Copyright (c) 2015 Mellanox Technologies. All rights reserved.
4  * Copyright (c) 2015 Jiri Pirko <jiri@mellanox.com>
5  *
6  * Redistribution and use in source and binary forms, with or without
7  * modification, are permitted provided that the following conditions are met:
8  *
9  * 1. Redistributions of source code must retain the above copyright
10  *    notice, this list of conditions and the following disclaimer.
11  * 2. Redistributions in binary form must reproduce the above copyright
12  *    notice, this list of conditions and the following disclaimer in the
13  *    documentation and/or other materials provided with the distribution.
14  * 3. Neither the names of the copyright holders nor the names of its
15  *    contributors may be used to endorse or promote products derived from
16  *    this software without specific prior written permission.
17  *
18  * Alternatively, this software may be distributed under the terms of the
19  * GNU General Public License ("GPL") version 2 as published by the Free
20  * Software Foundation.
21  *
22  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
23  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
26  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
27  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
28  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
29  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
30  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
31  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
32  * POSSIBILITY OF SUCH DAMAGE.
33  */
34 
35 #include <linux/kernel.h>
36 #include <linux/module.h>
37 #include <linux/export.h>
38 #include <linux/err.h>
39 #include <linux/device.h>
40 #include <linux/pci.h>
41 #include <linux/interrupt.h>
42 #include <linux/wait.h>
43 #include <linux/types.h>
44 #include <linux/skbuff.h>
45 #include <linux/if_vlan.h>
46 #include <linux/log2.h>
47 #include <linux/debugfs.h>
48 #include <linux/seq_file.h>
49 #include <linux/string.h>
50 
51 #include "pci.h"
52 #include "core.h"
53 #include "cmd.h"
54 #include "port.h"
55 
56 static const char mlxsw_pci_driver_name[] = "mlxsw_pci";
57 
58 static const struct pci_device_id mlxsw_pci_id_table[] = {
59 	{PCI_VDEVICE(MELLANOX, PCI_DEVICE_ID_MELLANOX_SWITCHX2), 0},
60 	{PCI_VDEVICE(MELLANOX, PCI_DEVICE_ID_MELLANOX_SPECTRUM), 0},
61 	{0, }
62 };
63 
64 static struct dentry *mlxsw_pci_dbg_root;
65 
66 static const char *mlxsw_pci_device_kind_get(const struct pci_device_id *id)
67 {
68 	switch (id->device) {
69 	case PCI_DEVICE_ID_MELLANOX_SWITCHX2:
70 		return MLXSW_DEVICE_KIND_SWITCHX2;
71 	case PCI_DEVICE_ID_MELLANOX_SPECTRUM:
72 		return MLXSW_DEVICE_KIND_SPECTRUM;
73 	default:
74 		BUG();
75 	}
76 }
77 
78 #define mlxsw_pci_write32(mlxsw_pci, reg, val) \
79 	iowrite32be(val, (mlxsw_pci)->hw_addr + (MLXSW_PCI_ ## reg))
80 #define mlxsw_pci_read32(mlxsw_pci, reg) \
81 	ioread32be((mlxsw_pci)->hw_addr + (MLXSW_PCI_ ## reg))
82 
83 enum mlxsw_pci_queue_type {
84 	MLXSW_PCI_QUEUE_TYPE_SDQ,
85 	MLXSW_PCI_QUEUE_TYPE_RDQ,
86 	MLXSW_PCI_QUEUE_TYPE_CQ,
87 	MLXSW_PCI_QUEUE_TYPE_EQ,
88 };
89 
90 static const char *mlxsw_pci_queue_type_str(enum mlxsw_pci_queue_type q_type)
91 {
92 	switch (q_type) {
93 	case MLXSW_PCI_QUEUE_TYPE_SDQ:
94 		return "sdq";
95 	case MLXSW_PCI_QUEUE_TYPE_RDQ:
96 		return "rdq";
97 	case MLXSW_PCI_QUEUE_TYPE_CQ:
98 		return "cq";
99 	case MLXSW_PCI_QUEUE_TYPE_EQ:
100 		return "eq";
101 	}
102 	BUG();
103 }
104 
105 #define MLXSW_PCI_QUEUE_TYPE_COUNT	4
106 
107 static const u16 mlxsw_pci_doorbell_type_offset[] = {
108 	MLXSW_PCI_DOORBELL_SDQ_OFFSET,	/* for type MLXSW_PCI_QUEUE_TYPE_SDQ */
109 	MLXSW_PCI_DOORBELL_RDQ_OFFSET,	/* for type MLXSW_PCI_QUEUE_TYPE_RDQ */
110 	MLXSW_PCI_DOORBELL_CQ_OFFSET,	/* for type MLXSW_PCI_QUEUE_TYPE_CQ */
111 	MLXSW_PCI_DOORBELL_EQ_OFFSET,	/* for type MLXSW_PCI_QUEUE_TYPE_EQ */
112 };
113 
114 static const u16 mlxsw_pci_doorbell_arm_type_offset[] = {
115 	0, /* unused */
116 	0, /* unused */
117 	MLXSW_PCI_DOORBELL_ARM_CQ_OFFSET, /* for type MLXSW_PCI_QUEUE_TYPE_CQ */
118 	MLXSW_PCI_DOORBELL_ARM_EQ_OFFSET, /* for type MLXSW_PCI_QUEUE_TYPE_EQ */
119 };
120 
121 struct mlxsw_pci_mem_item {
122 	char *buf;
123 	dma_addr_t mapaddr;
124 	size_t size;
125 };
126 
127 struct mlxsw_pci_queue_elem_info {
128 	char *elem; /* pointer to actual dma mapped element mem chunk */
129 	union {
130 		struct {
131 			struct sk_buff *skb;
132 		} sdq;
133 		struct {
134 			struct sk_buff *skb;
135 		} rdq;
136 	} u;
137 };
138 
139 struct mlxsw_pci_queue {
140 	spinlock_t lock; /* for queue accesses */
141 	struct mlxsw_pci_mem_item mem_item;
142 	struct mlxsw_pci_queue_elem_info *elem_info;
143 	u16 producer_counter;
144 	u16 consumer_counter;
145 	u16 count; /* number of elements in queue */
146 	u8 num; /* queue number */
147 	u8 elem_size; /* size of one element */
148 	enum mlxsw_pci_queue_type type;
149 	struct tasklet_struct tasklet; /* queue processing tasklet */
150 	struct mlxsw_pci *pci;
151 	union {
152 		struct {
153 			u32 comp_sdq_count;
154 			u32 comp_rdq_count;
155 		} cq;
156 		struct {
157 			u32 ev_cmd_count;
158 			u32 ev_comp_count;
159 			u32 ev_other_count;
160 		} eq;
161 	} u;
162 };
163 
164 struct mlxsw_pci_queue_type_group {
165 	struct mlxsw_pci_queue *q;
166 	u8 count; /* number of queues in group */
167 };
168 
169 struct mlxsw_pci {
170 	struct pci_dev *pdev;
171 	u8 __iomem *hw_addr;
172 	struct mlxsw_pci_queue_type_group queues[MLXSW_PCI_QUEUE_TYPE_COUNT];
173 	u32 doorbell_offset;
174 	struct msix_entry msix_entry;
175 	struct mlxsw_core *core;
176 	struct {
177 		struct mlxsw_pci_mem_item *items;
178 		unsigned int count;
179 	} fw_area;
180 	struct {
181 		struct mlxsw_pci_mem_item out_mbox;
182 		struct mlxsw_pci_mem_item in_mbox;
183 		struct mutex lock; /* Lock access to command registers */
184 		bool nopoll;
185 		wait_queue_head_t wait;
186 		bool wait_done;
187 		struct {
188 			u8 status;
189 			u64 out_param;
190 		} comp;
191 	} cmd;
192 	struct mlxsw_bus_info bus_info;
193 	struct dentry *dbg_dir;
194 };
195 
196 static void mlxsw_pci_queue_tasklet_schedule(struct mlxsw_pci_queue *q)
197 {
198 	tasklet_schedule(&q->tasklet);
199 }
200 
201 static char *__mlxsw_pci_queue_elem_get(struct mlxsw_pci_queue *q,
202 					size_t elem_size, int elem_index)
203 {
204 	return q->mem_item.buf + (elem_size * elem_index);
205 }
206 
207 static struct mlxsw_pci_queue_elem_info *
208 mlxsw_pci_queue_elem_info_get(struct mlxsw_pci_queue *q, int elem_index)
209 {
210 	return &q->elem_info[elem_index];
211 }
212 
213 static struct mlxsw_pci_queue_elem_info *
214 mlxsw_pci_queue_elem_info_producer_get(struct mlxsw_pci_queue *q)
215 {
216 	int index = q->producer_counter & (q->count - 1);
217 
218 	if ((u16) (q->producer_counter - q->consumer_counter) == q->count)
219 		return NULL;
220 	return mlxsw_pci_queue_elem_info_get(q, index);
221 }
222 
223 static struct mlxsw_pci_queue_elem_info *
224 mlxsw_pci_queue_elem_info_consumer_get(struct mlxsw_pci_queue *q)
225 {
226 	int index = q->consumer_counter & (q->count - 1);
227 
228 	return mlxsw_pci_queue_elem_info_get(q, index);
229 }
230 
231 static char *mlxsw_pci_queue_elem_get(struct mlxsw_pci_queue *q, int elem_index)
232 {
233 	return mlxsw_pci_queue_elem_info_get(q, elem_index)->elem;
234 }
235 
236 static bool mlxsw_pci_elem_hw_owned(struct mlxsw_pci_queue *q, bool owner_bit)
237 {
238 	return owner_bit != !!(q->consumer_counter & q->count);
239 }
240 
241 static char *mlxsw_pci_queue_sw_elem_get(struct mlxsw_pci_queue *q,
242 					 u32 (*get_elem_owner_func)(char *))
243 {
244 	struct mlxsw_pci_queue_elem_info *elem_info;
245 	char *elem;
246 	bool owner_bit;
247 
248 	elem_info = mlxsw_pci_queue_elem_info_consumer_get(q);
249 	elem = elem_info->elem;
250 	owner_bit = get_elem_owner_func(elem);
251 	if (mlxsw_pci_elem_hw_owned(q, owner_bit))
252 		return NULL;
253 	q->consumer_counter++;
254 	rmb(); /* make sure we read owned bit before the rest of elem */
255 	return elem;
256 }
257 
258 static struct mlxsw_pci_queue_type_group *
259 mlxsw_pci_queue_type_group_get(struct mlxsw_pci *mlxsw_pci,
260 			       enum mlxsw_pci_queue_type q_type)
261 {
262 	return &mlxsw_pci->queues[q_type];
263 }
264 
265 static u8 __mlxsw_pci_queue_count(struct mlxsw_pci *mlxsw_pci,
266 				  enum mlxsw_pci_queue_type q_type)
267 {
268 	struct mlxsw_pci_queue_type_group *queue_group;
269 
270 	queue_group = mlxsw_pci_queue_type_group_get(mlxsw_pci, q_type);
271 	return queue_group->count;
272 }
273 
274 static u8 mlxsw_pci_sdq_count(struct mlxsw_pci *mlxsw_pci)
275 {
276 	return __mlxsw_pci_queue_count(mlxsw_pci, MLXSW_PCI_QUEUE_TYPE_SDQ);
277 }
278 
279 static u8 mlxsw_pci_rdq_count(struct mlxsw_pci *mlxsw_pci)
280 {
281 	return __mlxsw_pci_queue_count(mlxsw_pci, MLXSW_PCI_QUEUE_TYPE_RDQ);
282 }
283 
284 static u8 mlxsw_pci_cq_count(struct mlxsw_pci *mlxsw_pci)
285 {
286 	return __mlxsw_pci_queue_count(mlxsw_pci, MLXSW_PCI_QUEUE_TYPE_CQ);
287 }
288 
289 static u8 mlxsw_pci_eq_count(struct mlxsw_pci *mlxsw_pci)
290 {
291 	return __mlxsw_pci_queue_count(mlxsw_pci, MLXSW_PCI_QUEUE_TYPE_EQ);
292 }
293 
294 static struct mlxsw_pci_queue *
295 __mlxsw_pci_queue_get(struct mlxsw_pci *mlxsw_pci,
296 		      enum mlxsw_pci_queue_type q_type, u8 q_num)
297 {
298 	return &mlxsw_pci->queues[q_type].q[q_num];
299 }
300 
301 static struct mlxsw_pci_queue *mlxsw_pci_sdq_get(struct mlxsw_pci *mlxsw_pci,
302 						 u8 q_num)
303 {
304 	return __mlxsw_pci_queue_get(mlxsw_pci,
305 				     MLXSW_PCI_QUEUE_TYPE_SDQ, q_num);
306 }
307 
308 static struct mlxsw_pci_queue *mlxsw_pci_rdq_get(struct mlxsw_pci *mlxsw_pci,
309 						 u8 q_num)
310 {
311 	return __mlxsw_pci_queue_get(mlxsw_pci,
312 				     MLXSW_PCI_QUEUE_TYPE_RDQ, q_num);
313 }
314 
315 static struct mlxsw_pci_queue *mlxsw_pci_cq_get(struct mlxsw_pci *mlxsw_pci,
316 						u8 q_num)
317 {
318 	return __mlxsw_pci_queue_get(mlxsw_pci, MLXSW_PCI_QUEUE_TYPE_CQ, q_num);
319 }
320 
321 static struct mlxsw_pci_queue *mlxsw_pci_eq_get(struct mlxsw_pci *mlxsw_pci,
322 						u8 q_num)
323 {
324 	return __mlxsw_pci_queue_get(mlxsw_pci, MLXSW_PCI_QUEUE_TYPE_EQ, q_num);
325 }
326 
327 static void __mlxsw_pci_queue_doorbell_set(struct mlxsw_pci *mlxsw_pci,
328 					   struct mlxsw_pci_queue *q,
329 					   u16 val)
330 {
331 	mlxsw_pci_write32(mlxsw_pci,
332 			  DOORBELL(mlxsw_pci->doorbell_offset,
333 				   mlxsw_pci_doorbell_type_offset[q->type],
334 				   q->num), val);
335 }
336 
337 static void __mlxsw_pci_queue_doorbell_arm_set(struct mlxsw_pci *mlxsw_pci,
338 					       struct mlxsw_pci_queue *q,
339 					       u16 val)
340 {
341 	mlxsw_pci_write32(mlxsw_pci,
342 			  DOORBELL(mlxsw_pci->doorbell_offset,
343 				   mlxsw_pci_doorbell_arm_type_offset[q->type],
344 				   q->num), val);
345 }
346 
347 static void mlxsw_pci_queue_doorbell_producer_ring(struct mlxsw_pci *mlxsw_pci,
348 						   struct mlxsw_pci_queue *q)
349 {
350 	wmb(); /* ensure all writes are done before we ring a bell */
351 	__mlxsw_pci_queue_doorbell_set(mlxsw_pci, q, q->producer_counter);
352 }
353 
354 static void mlxsw_pci_queue_doorbell_consumer_ring(struct mlxsw_pci *mlxsw_pci,
355 						   struct mlxsw_pci_queue *q)
356 {
357 	wmb(); /* ensure all writes are done before we ring a bell */
358 	__mlxsw_pci_queue_doorbell_set(mlxsw_pci, q,
359 				       q->consumer_counter + q->count);
360 }
361 
362 static void
363 mlxsw_pci_queue_doorbell_arm_consumer_ring(struct mlxsw_pci *mlxsw_pci,
364 					   struct mlxsw_pci_queue *q)
365 {
366 	wmb(); /* ensure all writes are done before we ring a bell */
367 	__mlxsw_pci_queue_doorbell_arm_set(mlxsw_pci, q, q->consumer_counter);
368 }
369 
370 static dma_addr_t __mlxsw_pci_queue_page_get(struct mlxsw_pci_queue *q,
371 					     int page_index)
372 {
373 	return q->mem_item.mapaddr + MLXSW_PCI_PAGE_SIZE * page_index;
374 }
375 
376 static int mlxsw_pci_sdq_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
377 			      struct mlxsw_pci_queue *q)
378 {
379 	int i;
380 	int err;
381 
382 	q->producer_counter = 0;
383 	q->consumer_counter = 0;
384 
385 	/* Set CQ of same number of this SDQ. */
386 	mlxsw_cmd_mbox_sw2hw_dq_cq_set(mbox, q->num);
387 	mlxsw_cmd_mbox_sw2hw_dq_sdq_tclass_set(mbox, 3);
388 	mlxsw_cmd_mbox_sw2hw_dq_log2_dq_sz_set(mbox, 3); /* 8 pages */
389 	for (i = 0; i < MLXSW_PCI_AQ_PAGES; i++) {
390 		dma_addr_t mapaddr = __mlxsw_pci_queue_page_get(q, i);
391 
392 		mlxsw_cmd_mbox_sw2hw_dq_pa_set(mbox, i, mapaddr);
393 	}
394 
395 	err = mlxsw_cmd_sw2hw_sdq(mlxsw_pci->core, mbox, q->num);
396 	if (err)
397 		return err;
398 	mlxsw_pci_queue_doorbell_producer_ring(mlxsw_pci, q);
399 	return 0;
400 }
401 
402 static void mlxsw_pci_sdq_fini(struct mlxsw_pci *mlxsw_pci,
403 			       struct mlxsw_pci_queue *q)
404 {
405 	mlxsw_cmd_hw2sw_sdq(mlxsw_pci->core, q->num);
406 }
407 
408 static int mlxsw_pci_sdq_dbg_read(struct seq_file *file, void *data)
409 {
410 	struct mlxsw_pci *mlxsw_pci = dev_get_drvdata(file->private);
411 	struct mlxsw_pci_queue *q;
412 	int i;
413 	static const char hdr[] =
414 		"NUM PROD_COUNT CONS_COUNT COUNT\n";
415 
416 	seq_printf(file, hdr);
417 	for (i = 0; i < mlxsw_pci_sdq_count(mlxsw_pci); i++) {
418 		q = mlxsw_pci_sdq_get(mlxsw_pci, i);
419 		spin_lock_bh(&q->lock);
420 		seq_printf(file, "%3d %10d %10d %5d\n",
421 			   i, q->producer_counter, q->consumer_counter,
422 			   q->count);
423 		spin_unlock_bh(&q->lock);
424 	}
425 	return 0;
426 }
427 
428 static int mlxsw_pci_wqe_frag_map(struct mlxsw_pci *mlxsw_pci, char *wqe,
429 				  int index, char *frag_data, size_t frag_len,
430 				  int direction)
431 {
432 	struct pci_dev *pdev = mlxsw_pci->pdev;
433 	dma_addr_t mapaddr;
434 
435 	mapaddr = pci_map_single(pdev, frag_data, frag_len, direction);
436 	if (unlikely(pci_dma_mapping_error(pdev, mapaddr))) {
437 		dev_err_ratelimited(&pdev->dev, "failed to dma map tx frag\n");
438 		return -EIO;
439 	}
440 	mlxsw_pci_wqe_address_set(wqe, index, mapaddr);
441 	mlxsw_pci_wqe_byte_count_set(wqe, index, frag_len);
442 	return 0;
443 }
444 
445 static void mlxsw_pci_wqe_frag_unmap(struct mlxsw_pci *mlxsw_pci, char *wqe,
446 				     int index, int direction)
447 {
448 	struct pci_dev *pdev = mlxsw_pci->pdev;
449 	size_t frag_len = mlxsw_pci_wqe_byte_count_get(wqe, index);
450 	dma_addr_t mapaddr = mlxsw_pci_wqe_address_get(wqe, index);
451 
452 	if (!frag_len)
453 		return;
454 	pci_unmap_single(pdev, mapaddr, frag_len, direction);
455 }
456 
457 static int mlxsw_pci_rdq_skb_alloc(struct mlxsw_pci *mlxsw_pci,
458 				   struct mlxsw_pci_queue_elem_info *elem_info)
459 {
460 	size_t buf_len = MLXSW_PORT_MAX_MTU;
461 	char *wqe = elem_info->elem;
462 	struct sk_buff *skb;
463 	int err;
464 
465 	elem_info->u.rdq.skb = NULL;
466 	skb = netdev_alloc_skb_ip_align(NULL, buf_len);
467 	if (!skb)
468 		return -ENOMEM;
469 
470 	/* Assume that wqe was previously zeroed. */
471 
472 	err = mlxsw_pci_wqe_frag_map(mlxsw_pci, wqe, 0, skb->data,
473 				     buf_len, DMA_FROM_DEVICE);
474 	if (err)
475 		goto err_frag_map;
476 
477 	elem_info->u.rdq.skb = skb;
478 	return 0;
479 
480 err_frag_map:
481 	dev_kfree_skb_any(skb);
482 	return err;
483 }
484 
485 static void mlxsw_pci_rdq_skb_free(struct mlxsw_pci *mlxsw_pci,
486 				   struct mlxsw_pci_queue_elem_info *elem_info)
487 {
488 	struct sk_buff *skb;
489 	char *wqe;
490 
491 	skb = elem_info->u.rdq.skb;
492 	wqe = elem_info->elem;
493 
494 	mlxsw_pci_wqe_frag_unmap(mlxsw_pci, wqe, 0, DMA_FROM_DEVICE);
495 	dev_kfree_skb_any(skb);
496 }
497 
498 static int mlxsw_pci_rdq_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
499 			      struct mlxsw_pci_queue *q)
500 {
501 	struct mlxsw_pci_queue_elem_info *elem_info;
502 	u8 sdq_count = mlxsw_pci_sdq_count(mlxsw_pci);
503 	int i;
504 	int err;
505 
506 	q->producer_counter = 0;
507 	q->consumer_counter = 0;
508 
509 	/* Set CQ of same number of this RDQ with base
510 	 * above SDQ count as the lower ones are assigned to SDQs.
511 	 */
512 	mlxsw_cmd_mbox_sw2hw_dq_cq_set(mbox, sdq_count + q->num);
513 	mlxsw_cmd_mbox_sw2hw_dq_log2_dq_sz_set(mbox, 3); /* 8 pages */
514 	for (i = 0; i < MLXSW_PCI_AQ_PAGES; i++) {
515 		dma_addr_t mapaddr = __mlxsw_pci_queue_page_get(q, i);
516 
517 		mlxsw_cmd_mbox_sw2hw_dq_pa_set(mbox, i, mapaddr);
518 	}
519 
520 	err = mlxsw_cmd_sw2hw_rdq(mlxsw_pci->core, mbox, q->num);
521 	if (err)
522 		return err;
523 
524 	mlxsw_pci_queue_doorbell_producer_ring(mlxsw_pci, q);
525 
526 	for (i = 0; i < q->count; i++) {
527 		elem_info = mlxsw_pci_queue_elem_info_producer_get(q);
528 		BUG_ON(!elem_info);
529 		err = mlxsw_pci_rdq_skb_alloc(mlxsw_pci, elem_info);
530 		if (err)
531 			goto rollback;
532 		/* Everything is set up, ring doorbell to pass elem to HW */
533 		q->producer_counter++;
534 		mlxsw_pci_queue_doorbell_producer_ring(mlxsw_pci, q);
535 	}
536 
537 	return 0;
538 
539 rollback:
540 	for (i--; i >= 0; i--) {
541 		elem_info = mlxsw_pci_queue_elem_info_get(q, i);
542 		mlxsw_pci_rdq_skb_free(mlxsw_pci, elem_info);
543 	}
544 	mlxsw_cmd_hw2sw_rdq(mlxsw_pci->core, q->num);
545 
546 	return err;
547 }
548 
549 static void mlxsw_pci_rdq_fini(struct mlxsw_pci *mlxsw_pci,
550 			       struct mlxsw_pci_queue *q)
551 {
552 	struct mlxsw_pci_queue_elem_info *elem_info;
553 	int i;
554 
555 	mlxsw_cmd_hw2sw_rdq(mlxsw_pci->core, q->num);
556 	for (i = 0; i < q->count; i++) {
557 		elem_info = mlxsw_pci_queue_elem_info_get(q, i);
558 		mlxsw_pci_rdq_skb_free(mlxsw_pci, elem_info);
559 	}
560 }
561 
562 static int mlxsw_pci_rdq_dbg_read(struct seq_file *file, void *data)
563 {
564 	struct mlxsw_pci *mlxsw_pci = dev_get_drvdata(file->private);
565 	struct mlxsw_pci_queue *q;
566 	int i;
567 	static const char hdr[] =
568 		"NUM PROD_COUNT CONS_COUNT COUNT\n";
569 
570 	seq_printf(file, hdr);
571 	for (i = 0; i < mlxsw_pci_rdq_count(mlxsw_pci); i++) {
572 		q = mlxsw_pci_rdq_get(mlxsw_pci, i);
573 		spin_lock_bh(&q->lock);
574 		seq_printf(file, "%3d %10d %10d %5d\n",
575 			   i, q->producer_counter, q->consumer_counter,
576 			   q->count);
577 		spin_unlock_bh(&q->lock);
578 	}
579 	return 0;
580 }
581 
582 static int mlxsw_pci_cq_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
583 			     struct mlxsw_pci_queue *q)
584 {
585 	int i;
586 	int err;
587 
588 	q->consumer_counter = 0;
589 
590 	for (i = 0; i < q->count; i++) {
591 		char *elem = mlxsw_pci_queue_elem_get(q, i);
592 
593 		mlxsw_pci_cqe_owner_set(elem, 1);
594 	}
595 
596 	mlxsw_cmd_mbox_sw2hw_cq_cv_set(mbox, 0); /* CQE ver 0 */
597 	mlxsw_cmd_mbox_sw2hw_cq_c_eqn_set(mbox, MLXSW_PCI_EQ_COMP_NUM);
598 	mlxsw_cmd_mbox_sw2hw_cq_oi_set(mbox, 0);
599 	mlxsw_cmd_mbox_sw2hw_cq_st_set(mbox, 0);
600 	mlxsw_cmd_mbox_sw2hw_cq_log_cq_size_set(mbox, ilog2(q->count));
601 	for (i = 0; i < MLXSW_PCI_AQ_PAGES; i++) {
602 		dma_addr_t mapaddr = __mlxsw_pci_queue_page_get(q, i);
603 
604 		mlxsw_cmd_mbox_sw2hw_cq_pa_set(mbox, i, mapaddr);
605 	}
606 	err = mlxsw_cmd_sw2hw_cq(mlxsw_pci->core, mbox, q->num);
607 	if (err)
608 		return err;
609 	mlxsw_pci_queue_doorbell_consumer_ring(mlxsw_pci, q);
610 	mlxsw_pci_queue_doorbell_arm_consumer_ring(mlxsw_pci, q);
611 	return 0;
612 }
613 
614 static void mlxsw_pci_cq_fini(struct mlxsw_pci *mlxsw_pci,
615 			      struct mlxsw_pci_queue *q)
616 {
617 	mlxsw_cmd_hw2sw_cq(mlxsw_pci->core, q->num);
618 }
619 
620 static int mlxsw_pci_cq_dbg_read(struct seq_file *file, void *data)
621 {
622 	struct mlxsw_pci *mlxsw_pci = dev_get_drvdata(file->private);
623 
624 	struct mlxsw_pci_queue *q;
625 	int i;
626 	static const char hdr[] =
627 		"NUM CONS_INDEX  SDQ_COUNT  RDQ_COUNT COUNT\n";
628 
629 	seq_printf(file, hdr);
630 	for (i = 0; i < mlxsw_pci_cq_count(mlxsw_pci); i++) {
631 		q = mlxsw_pci_cq_get(mlxsw_pci, i);
632 		spin_lock_bh(&q->lock);
633 		seq_printf(file, "%3d %10d %10d %10d %5d\n",
634 			   i, q->consumer_counter, q->u.cq.comp_sdq_count,
635 			   q->u.cq.comp_rdq_count, q->count);
636 		spin_unlock_bh(&q->lock);
637 	}
638 	return 0;
639 }
640 
641 static void mlxsw_pci_cqe_sdq_handle(struct mlxsw_pci *mlxsw_pci,
642 				     struct mlxsw_pci_queue *q,
643 				     u16 consumer_counter_limit,
644 				     char *cqe)
645 {
646 	struct pci_dev *pdev = mlxsw_pci->pdev;
647 	struct mlxsw_pci_queue_elem_info *elem_info;
648 	char *wqe;
649 	struct sk_buff *skb;
650 	int i;
651 
652 	spin_lock(&q->lock);
653 	elem_info = mlxsw_pci_queue_elem_info_consumer_get(q);
654 	skb = elem_info->u.sdq.skb;
655 	wqe = elem_info->elem;
656 	for (i = 0; i < MLXSW_PCI_WQE_SG_ENTRIES; i++)
657 		mlxsw_pci_wqe_frag_unmap(mlxsw_pci, wqe, i, DMA_TO_DEVICE);
658 	dev_kfree_skb_any(skb);
659 	elem_info->u.sdq.skb = NULL;
660 
661 	if (q->consumer_counter++ != consumer_counter_limit)
662 		dev_dbg_ratelimited(&pdev->dev, "Consumer counter does not match limit in SDQ\n");
663 	spin_unlock(&q->lock);
664 }
665 
666 static void mlxsw_pci_cqe_rdq_handle(struct mlxsw_pci *mlxsw_pci,
667 				     struct mlxsw_pci_queue *q,
668 				     u16 consumer_counter_limit,
669 				     char *cqe)
670 {
671 	struct pci_dev *pdev = mlxsw_pci->pdev;
672 	struct mlxsw_pci_queue_elem_info *elem_info;
673 	char *wqe;
674 	struct sk_buff *skb;
675 	struct mlxsw_rx_info rx_info;
676 	u16 byte_count;
677 	int err;
678 
679 	elem_info = mlxsw_pci_queue_elem_info_consumer_get(q);
680 	skb = elem_info->u.sdq.skb;
681 	if (!skb)
682 		return;
683 	wqe = elem_info->elem;
684 	mlxsw_pci_wqe_frag_unmap(mlxsw_pci, wqe, 0, DMA_FROM_DEVICE);
685 
686 	if (q->consumer_counter++ != consumer_counter_limit)
687 		dev_dbg_ratelimited(&pdev->dev, "Consumer counter does not match limit in RDQ\n");
688 
689 	if (mlxsw_pci_cqe_lag_get(cqe)) {
690 		rx_info.is_lag = true;
691 		rx_info.u.lag_id = mlxsw_pci_cqe_lag_id_get(cqe);
692 		rx_info.lag_port_index = mlxsw_pci_cqe_lag_port_index_get(cqe);
693 	} else {
694 		rx_info.is_lag = false;
695 		rx_info.u.sys_port = mlxsw_pci_cqe_system_port_get(cqe);
696 	}
697 
698 	rx_info.trap_id = mlxsw_pci_cqe_trap_id_get(cqe);
699 
700 	byte_count = mlxsw_pci_cqe_byte_count_get(cqe);
701 	if (mlxsw_pci_cqe_crc_get(cqe))
702 		byte_count -= ETH_FCS_LEN;
703 	skb_put(skb, byte_count);
704 	mlxsw_core_skb_receive(mlxsw_pci->core, skb, &rx_info);
705 
706 	memset(wqe, 0, q->elem_size);
707 	err = mlxsw_pci_rdq_skb_alloc(mlxsw_pci, elem_info);
708 	if (err)
709 		dev_dbg_ratelimited(&pdev->dev, "Failed to alloc skb for RDQ\n");
710 	/* Everything is set up, ring doorbell to pass elem to HW */
711 	q->producer_counter++;
712 	mlxsw_pci_queue_doorbell_producer_ring(mlxsw_pci, q);
713 	return;
714 }
715 
716 static char *mlxsw_pci_cq_sw_cqe_get(struct mlxsw_pci_queue *q)
717 {
718 	return mlxsw_pci_queue_sw_elem_get(q, mlxsw_pci_cqe_owner_get);
719 }
720 
721 static void mlxsw_pci_cq_tasklet(unsigned long data)
722 {
723 	struct mlxsw_pci_queue *q = (struct mlxsw_pci_queue *) data;
724 	struct mlxsw_pci *mlxsw_pci = q->pci;
725 	char *cqe;
726 	int items = 0;
727 	int credits = q->count >> 1;
728 
729 	while ((cqe = mlxsw_pci_cq_sw_cqe_get(q))) {
730 		u16 wqe_counter = mlxsw_pci_cqe_wqe_counter_get(cqe);
731 		u8 sendq = mlxsw_pci_cqe_sr_get(cqe);
732 		u8 dqn = mlxsw_pci_cqe_dqn_get(cqe);
733 
734 		if (sendq) {
735 			struct mlxsw_pci_queue *sdq;
736 
737 			sdq = mlxsw_pci_sdq_get(mlxsw_pci, dqn);
738 			mlxsw_pci_cqe_sdq_handle(mlxsw_pci, sdq,
739 						 wqe_counter, cqe);
740 			q->u.cq.comp_sdq_count++;
741 		} else {
742 			struct mlxsw_pci_queue *rdq;
743 
744 			rdq = mlxsw_pci_rdq_get(mlxsw_pci, dqn);
745 			mlxsw_pci_cqe_rdq_handle(mlxsw_pci, rdq,
746 						 wqe_counter, cqe);
747 			q->u.cq.comp_rdq_count++;
748 		}
749 		if (++items == credits)
750 			break;
751 	}
752 	if (items) {
753 		mlxsw_pci_queue_doorbell_consumer_ring(mlxsw_pci, q);
754 		mlxsw_pci_queue_doorbell_arm_consumer_ring(mlxsw_pci, q);
755 	}
756 }
757 
758 static int mlxsw_pci_eq_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
759 			     struct mlxsw_pci_queue *q)
760 {
761 	int i;
762 	int err;
763 
764 	q->consumer_counter = 0;
765 
766 	for (i = 0; i < q->count; i++) {
767 		char *elem = mlxsw_pci_queue_elem_get(q, i);
768 
769 		mlxsw_pci_eqe_owner_set(elem, 1);
770 	}
771 
772 	mlxsw_cmd_mbox_sw2hw_eq_int_msix_set(mbox, 1); /* MSI-X used */
773 	mlxsw_cmd_mbox_sw2hw_eq_oi_set(mbox, 0);
774 	mlxsw_cmd_mbox_sw2hw_eq_st_set(mbox, 1); /* armed */
775 	mlxsw_cmd_mbox_sw2hw_eq_log_eq_size_set(mbox, ilog2(q->count));
776 	for (i = 0; i < MLXSW_PCI_AQ_PAGES; i++) {
777 		dma_addr_t mapaddr = __mlxsw_pci_queue_page_get(q, i);
778 
779 		mlxsw_cmd_mbox_sw2hw_eq_pa_set(mbox, i, mapaddr);
780 	}
781 	err = mlxsw_cmd_sw2hw_eq(mlxsw_pci->core, mbox, q->num);
782 	if (err)
783 		return err;
784 	mlxsw_pci_queue_doorbell_consumer_ring(mlxsw_pci, q);
785 	mlxsw_pci_queue_doorbell_arm_consumer_ring(mlxsw_pci, q);
786 	return 0;
787 }
788 
789 static void mlxsw_pci_eq_fini(struct mlxsw_pci *mlxsw_pci,
790 			      struct mlxsw_pci_queue *q)
791 {
792 	mlxsw_cmd_hw2sw_eq(mlxsw_pci->core, q->num);
793 }
794 
795 static int mlxsw_pci_eq_dbg_read(struct seq_file *file, void *data)
796 {
797 	struct mlxsw_pci *mlxsw_pci = dev_get_drvdata(file->private);
798 	struct mlxsw_pci_queue *q;
799 	int i;
800 	static const char hdr[] =
801 		"NUM CONS_COUNT     EV_CMD    EV_COMP   EV_OTHER COUNT\n";
802 
803 	seq_printf(file, hdr);
804 	for (i = 0; i < mlxsw_pci_eq_count(mlxsw_pci); i++) {
805 		q = mlxsw_pci_eq_get(mlxsw_pci, i);
806 		spin_lock_bh(&q->lock);
807 		seq_printf(file, "%3d %10d %10d %10d %10d %5d\n",
808 			   i, q->consumer_counter, q->u.eq.ev_cmd_count,
809 			   q->u.eq.ev_comp_count, q->u.eq.ev_other_count,
810 			   q->count);
811 		spin_unlock_bh(&q->lock);
812 	}
813 	return 0;
814 }
815 
816 static void mlxsw_pci_eq_cmd_event(struct mlxsw_pci *mlxsw_pci, char *eqe)
817 {
818 	mlxsw_pci->cmd.comp.status = mlxsw_pci_eqe_cmd_status_get(eqe);
819 	mlxsw_pci->cmd.comp.out_param =
820 		((u64) mlxsw_pci_eqe_cmd_out_param_h_get(eqe)) << 32 |
821 		mlxsw_pci_eqe_cmd_out_param_l_get(eqe);
822 	mlxsw_pci->cmd.wait_done = true;
823 	wake_up(&mlxsw_pci->cmd.wait);
824 }
825 
826 static char *mlxsw_pci_eq_sw_eqe_get(struct mlxsw_pci_queue *q)
827 {
828 	return mlxsw_pci_queue_sw_elem_get(q, mlxsw_pci_eqe_owner_get);
829 }
830 
831 static void mlxsw_pci_eq_tasklet(unsigned long data)
832 {
833 	struct mlxsw_pci_queue *q = (struct mlxsw_pci_queue *) data;
834 	struct mlxsw_pci *mlxsw_pci = q->pci;
835 	u8 cq_count = mlxsw_pci_cq_count(mlxsw_pci);
836 	unsigned long active_cqns[BITS_TO_LONGS(MLXSW_PCI_CQS_MAX)];
837 	char *eqe;
838 	u8 cqn;
839 	bool cq_handle = false;
840 	int items = 0;
841 	int credits = q->count >> 1;
842 
843 	memset(&active_cqns, 0, sizeof(active_cqns));
844 
845 	while ((eqe = mlxsw_pci_eq_sw_eqe_get(q))) {
846 		u8 event_type = mlxsw_pci_eqe_event_type_get(eqe);
847 
848 		switch (event_type) {
849 		case MLXSW_PCI_EQE_EVENT_TYPE_CMD:
850 			mlxsw_pci_eq_cmd_event(mlxsw_pci, eqe);
851 			q->u.eq.ev_cmd_count++;
852 			break;
853 		case MLXSW_PCI_EQE_EVENT_TYPE_COMP:
854 			cqn = mlxsw_pci_eqe_cqn_get(eqe);
855 			set_bit(cqn, active_cqns);
856 			cq_handle = true;
857 			q->u.eq.ev_comp_count++;
858 			break;
859 		default:
860 			q->u.eq.ev_other_count++;
861 		}
862 		if (++items == credits)
863 			break;
864 	}
865 	if (items) {
866 		mlxsw_pci_queue_doorbell_consumer_ring(mlxsw_pci, q);
867 		mlxsw_pci_queue_doorbell_arm_consumer_ring(mlxsw_pci, q);
868 	}
869 
870 	if (!cq_handle)
871 		return;
872 	for_each_set_bit(cqn, active_cqns, cq_count) {
873 		q = mlxsw_pci_cq_get(mlxsw_pci, cqn);
874 		mlxsw_pci_queue_tasklet_schedule(q);
875 	}
876 }
877 
878 struct mlxsw_pci_queue_ops {
879 	const char *name;
880 	enum mlxsw_pci_queue_type type;
881 	int (*init)(struct mlxsw_pci *mlxsw_pci, char *mbox,
882 		    struct mlxsw_pci_queue *q);
883 	void (*fini)(struct mlxsw_pci *mlxsw_pci,
884 		     struct mlxsw_pci_queue *q);
885 	void (*tasklet)(unsigned long data);
886 	int (*dbg_read)(struct seq_file *s, void *data);
887 	u16 elem_count;
888 	u8 elem_size;
889 };
890 
891 static const struct mlxsw_pci_queue_ops mlxsw_pci_sdq_ops = {
892 	.type		= MLXSW_PCI_QUEUE_TYPE_SDQ,
893 	.init		= mlxsw_pci_sdq_init,
894 	.fini		= mlxsw_pci_sdq_fini,
895 	.dbg_read	= mlxsw_pci_sdq_dbg_read,
896 	.elem_count	= MLXSW_PCI_WQE_COUNT,
897 	.elem_size	= MLXSW_PCI_WQE_SIZE,
898 };
899 
900 static const struct mlxsw_pci_queue_ops mlxsw_pci_rdq_ops = {
901 	.type		= MLXSW_PCI_QUEUE_TYPE_RDQ,
902 	.init		= mlxsw_pci_rdq_init,
903 	.fini		= mlxsw_pci_rdq_fini,
904 	.dbg_read	= mlxsw_pci_rdq_dbg_read,
905 	.elem_count	= MLXSW_PCI_WQE_COUNT,
906 	.elem_size	= MLXSW_PCI_WQE_SIZE
907 };
908 
909 static const struct mlxsw_pci_queue_ops mlxsw_pci_cq_ops = {
910 	.type		= MLXSW_PCI_QUEUE_TYPE_CQ,
911 	.init		= mlxsw_pci_cq_init,
912 	.fini		= mlxsw_pci_cq_fini,
913 	.tasklet	= mlxsw_pci_cq_tasklet,
914 	.dbg_read	= mlxsw_pci_cq_dbg_read,
915 	.elem_count	= MLXSW_PCI_CQE_COUNT,
916 	.elem_size	= MLXSW_PCI_CQE_SIZE
917 };
918 
919 static const struct mlxsw_pci_queue_ops mlxsw_pci_eq_ops = {
920 	.type		= MLXSW_PCI_QUEUE_TYPE_EQ,
921 	.init		= mlxsw_pci_eq_init,
922 	.fini		= mlxsw_pci_eq_fini,
923 	.tasklet	= mlxsw_pci_eq_tasklet,
924 	.dbg_read	= mlxsw_pci_eq_dbg_read,
925 	.elem_count	= MLXSW_PCI_EQE_COUNT,
926 	.elem_size	= MLXSW_PCI_EQE_SIZE
927 };
928 
929 static int mlxsw_pci_queue_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
930 				const struct mlxsw_pci_queue_ops *q_ops,
931 				struct mlxsw_pci_queue *q, u8 q_num)
932 {
933 	struct mlxsw_pci_mem_item *mem_item = &q->mem_item;
934 	int i;
935 	int err;
936 
937 	spin_lock_init(&q->lock);
938 	q->num = q_num;
939 	q->count = q_ops->elem_count;
940 	q->elem_size = q_ops->elem_size;
941 	q->type = q_ops->type;
942 	q->pci = mlxsw_pci;
943 
944 	if (q_ops->tasklet)
945 		tasklet_init(&q->tasklet, q_ops->tasklet, (unsigned long) q);
946 
947 	mem_item->size = MLXSW_PCI_AQ_SIZE;
948 	mem_item->buf = pci_alloc_consistent(mlxsw_pci->pdev,
949 					     mem_item->size,
950 					     &mem_item->mapaddr);
951 	if (!mem_item->buf)
952 		return -ENOMEM;
953 	memset(mem_item->buf, 0, mem_item->size);
954 
955 	q->elem_info = kcalloc(q->count, sizeof(*q->elem_info), GFP_KERNEL);
956 	if (!q->elem_info) {
957 		err = -ENOMEM;
958 		goto err_elem_info_alloc;
959 	}
960 
961 	/* Initialize dma mapped elements info elem_info for
962 	 * future easy access.
963 	 */
964 	for (i = 0; i < q->count; i++) {
965 		struct mlxsw_pci_queue_elem_info *elem_info;
966 
967 		elem_info = mlxsw_pci_queue_elem_info_get(q, i);
968 		elem_info->elem =
969 			__mlxsw_pci_queue_elem_get(q, q_ops->elem_size, i);
970 	}
971 
972 	mlxsw_cmd_mbox_zero(mbox);
973 	err = q_ops->init(mlxsw_pci, mbox, q);
974 	if (err)
975 		goto err_q_ops_init;
976 	return 0;
977 
978 err_q_ops_init:
979 	kfree(q->elem_info);
980 err_elem_info_alloc:
981 	pci_free_consistent(mlxsw_pci->pdev, mem_item->size,
982 			    mem_item->buf, mem_item->mapaddr);
983 	return err;
984 }
985 
986 static void mlxsw_pci_queue_fini(struct mlxsw_pci *mlxsw_pci,
987 				 const struct mlxsw_pci_queue_ops *q_ops,
988 				 struct mlxsw_pci_queue *q)
989 {
990 	struct mlxsw_pci_mem_item *mem_item = &q->mem_item;
991 
992 	q_ops->fini(mlxsw_pci, q);
993 	kfree(q->elem_info);
994 	pci_free_consistent(mlxsw_pci->pdev, mem_item->size,
995 			    mem_item->buf, mem_item->mapaddr);
996 }
997 
998 static int mlxsw_pci_queue_group_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
999 				      const struct mlxsw_pci_queue_ops *q_ops,
1000 				      u8 num_qs)
1001 {
1002 	struct pci_dev *pdev = mlxsw_pci->pdev;
1003 	struct mlxsw_pci_queue_type_group *queue_group;
1004 	char tmp[16];
1005 	int i;
1006 	int err;
1007 
1008 	queue_group = mlxsw_pci_queue_type_group_get(mlxsw_pci, q_ops->type);
1009 	queue_group->q = kcalloc(num_qs, sizeof(*queue_group->q), GFP_KERNEL);
1010 	if (!queue_group->q)
1011 		return -ENOMEM;
1012 
1013 	for (i = 0; i < num_qs; i++) {
1014 		err = mlxsw_pci_queue_init(mlxsw_pci, mbox, q_ops,
1015 					   &queue_group->q[i], i);
1016 		if (err)
1017 			goto err_queue_init;
1018 	}
1019 	queue_group->count = num_qs;
1020 
1021 	sprintf(tmp, "%s_stats", mlxsw_pci_queue_type_str(q_ops->type));
1022 	debugfs_create_devm_seqfile(&pdev->dev, tmp, mlxsw_pci->dbg_dir,
1023 				    q_ops->dbg_read);
1024 
1025 	return 0;
1026 
1027 err_queue_init:
1028 	for (i--; i >= 0; i--)
1029 		mlxsw_pci_queue_fini(mlxsw_pci, q_ops, &queue_group->q[i]);
1030 	kfree(queue_group->q);
1031 	return err;
1032 }
1033 
1034 static void mlxsw_pci_queue_group_fini(struct mlxsw_pci *mlxsw_pci,
1035 				       const struct mlxsw_pci_queue_ops *q_ops)
1036 {
1037 	struct mlxsw_pci_queue_type_group *queue_group;
1038 	int i;
1039 
1040 	queue_group = mlxsw_pci_queue_type_group_get(mlxsw_pci, q_ops->type);
1041 	for (i = 0; i < queue_group->count; i++)
1042 		mlxsw_pci_queue_fini(mlxsw_pci, q_ops, &queue_group->q[i]);
1043 	kfree(queue_group->q);
1044 }
1045 
1046 static int mlxsw_pci_aqs_init(struct mlxsw_pci *mlxsw_pci, char *mbox)
1047 {
1048 	struct pci_dev *pdev = mlxsw_pci->pdev;
1049 	u8 num_sdqs;
1050 	u8 sdq_log2sz;
1051 	u8 num_rdqs;
1052 	u8 rdq_log2sz;
1053 	u8 num_cqs;
1054 	u8 cq_log2sz;
1055 	u8 num_eqs;
1056 	u8 eq_log2sz;
1057 	int err;
1058 
1059 	mlxsw_cmd_mbox_zero(mbox);
1060 	err = mlxsw_cmd_query_aq_cap(mlxsw_pci->core, mbox);
1061 	if (err)
1062 		return err;
1063 
1064 	num_sdqs = mlxsw_cmd_mbox_query_aq_cap_max_num_sdqs_get(mbox);
1065 	sdq_log2sz = mlxsw_cmd_mbox_query_aq_cap_log_max_sdq_sz_get(mbox);
1066 	num_rdqs = mlxsw_cmd_mbox_query_aq_cap_max_num_rdqs_get(mbox);
1067 	rdq_log2sz = mlxsw_cmd_mbox_query_aq_cap_log_max_rdq_sz_get(mbox);
1068 	num_cqs = mlxsw_cmd_mbox_query_aq_cap_max_num_cqs_get(mbox);
1069 	cq_log2sz = mlxsw_cmd_mbox_query_aq_cap_log_max_cq_sz_get(mbox);
1070 	num_eqs = mlxsw_cmd_mbox_query_aq_cap_max_num_eqs_get(mbox);
1071 	eq_log2sz = mlxsw_cmd_mbox_query_aq_cap_log_max_eq_sz_get(mbox);
1072 
1073 	if (num_sdqs + num_rdqs > num_cqs ||
1074 	    num_cqs > MLXSW_PCI_CQS_MAX || num_eqs != MLXSW_PCI_EQS_COUNT) {
1075 		dev_err(&pdev->dev, "Unsupported number of queues\n");
1076 		return -EINVAL;
1077 	}
1078 
1079 	if ((1 << sdq_log2sz != MLXSW_PCI_WQE_COUNT) ||
1080 	    (1 << rdq_log2sz != MLXSW_PCI_WQE_COUNT) ||
1081 	    (1 << cq_log2sz != MLXSW_PCI_CQE_COUNT) ||
1082 	    (1 << eq_log2sz != MLXSW_PCI_EQE_COUNT)) {
1083 		dev_err(&pdev->dev, "Unsupported number of async queue descriptors\n");
1084 		return -EINVAL;
1085 	}
1086 
1087 	err = mlxsw_pci_queue_group_init(mlxsw_pci, mbox, &mlxsw_pci_eq_ops,
1088 					 num_eqs);
1089 	if (err) {
1090 		dev_err(&pdev->dev, "Failed to initialize event queues\n");
1091 		return err;
1092 	}
1093 
1094 	err = mlxsw_pci_queue_group_init(mlxsw_pci, mbox, &mlxsw_pci_cq_ops,
1095 					 num_cqs);
1096 	if (err) {
1097 		dev_err(&pdev->dev, "Failed to initialize completion queues\n");
1098 		goto err_cqs_init;
1099 	}
1100 
1101 	err = mlxsw_pci_queue_group_init(mlxsw_pci, mbox, &mlxsw_pci_sdq_ops,
1102 					 num_sdqs);
1103 	if (err) {
1104 		dev_err(&pdev->dev, "Failed to initialize send descriptor queues\n");
1105 		goto err_sdqs_init;
1106 	}
1107 
1108 	err = mlxsw_pci_queue_group_init(mlxsw_pci, mbox, &mlxsw_pci_rdq_ops,
1109 					 num_rdqs);
1110 	if (err) {
1111 		dev_err(&pdev->dev, "Failed to initialize receive descriptor queues\n");
1112 		goto err_rdqs_init;
1113 	}
1114 
1115 	/* We have to poll in command interface until queues are initialized */
1116 	mlxsw_pci->cmd.nopoll = true;
1117 	return 0;
1118 
1119 err_rdqs_init:
1120 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_sdq_ops);
1121 err_sdqs_init:
1122 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_cq_ops);
1123 err_cqs_init:
1124 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_eq_ops);
1125 	return err;
1126 }
1127 
1128 static void mlxsw_pci_aqs_fini(struct mlxsw_pci *mlxsw_pci)
1129 {
1130 	mlxsw_pci->cmd.nopoll = false;
1131 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_rdq_ops);
1132 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_sdq_ops);
1133 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_cq_ops);
1134 	mlxsw_pci_queue_group_fini(mlxsw_pci, &mlxsw_pci_eq_ops);
1135 }
1136 
1137 static void
1138 mlxsw_pci_config_profile_swid_config(struct mlxsw_pci *mlxsw_pci,
1139 				     char *mbox, int index,
1140 				     const struct mlxsw_swid_config *swid)
1141 {
1142 	u8 mask = 0;
1143 
1144 	if (swid->used_type) {
1145 		mlxsw_cmd_mbox_config_profile_swid_config_type_set(
1146 			mbox, index, swid->type);
1147 		mask |= 1;
1148 	}
1149 	if (swid->used_properties) {
1150 		mlxsw_cmd_mbox_config_profile_swid_config_properties_set(
1151 			mbox, index, swid->properties);
1152 		mask |= 2;
1153 	}
1154 	mlxsw_cmd_mbox_config_profile_swid_config_mask_set(mbox, index, mask);
1155 }
1156 
1157 #define MLXSW_RESOURCES_TABLE_END_ID 0xffff
1158 #define MLXSW_MAX_SPAN_ID 0x2420
1159 #define MLXSW_MAX_LAG_ID 0x2520
1160 #define MLXSW_MAX_PORTS_IN_LAG_ID 0x2521
1161 #define MLXSW_KVD_SIZE_ID 0x1001
1162 #define MLXSW_KVD_SINGLE_MIN_SIZE_ID 0x1002
1163 #define MLXSW_KVD_DOUBLE_MIN_SIZE_ID 0x1003
1164 #define MLXSW_MAX_VIRTUAL_ROUTERS_ID 0x2C01
1165 #define MLXSW_MAX_SYSTEM_PORT_ID 0x2502
1166 #define MLXSW_MAX_VLAN_GROUPS_ID 0x2906
1167 #define MLXSW_MAX_REGIONS_ID 0x2901
1168 #define MLXSW_MAX_RIF_ID 0x2C02
1169 #define MLXSW_RESOURCES_QUERY_MAX_QUERIES 100
1170 #define MLXSW_RESOURCES_PER_QUERY 32
1171 
1172 static void mlxsw_pci_resources_query_parse(int id, u64 val,
1173 					    struct mlxsw_resources *resources)
1174 {
1175 	switch (id) {
1176 	case MLXSW_MAX_SPAN_ID:
1177 		resources->max_span = val;
1178 		resources->max_span_valid = 1;
1179 		break;
1180 	case MLXSW_MAX_LAG_ID:
1181 		resources->max_lag = val;
1182 		resources->max_lag_valid = 1;
1183 		break;
1184 	case MLXSW_MAX_PORTS_IN_LAG_ID:
1185 		resources->max_ports_in_lag = val;
1186 		resources->max_ports_in_lag_valid = 1;
1187 		break;
1188 	case MLXSW_KVD_SIZE_ID:
1189 		resources->kvd_size = val;
1190 		resources->kvd_size_valid = 1;
1191 		break;
1192 	case MLXSW_KVD_SINGLE_MIN_SIZE_ID:
1193 		resources->kvd_single_min_size = val;
1194 		resources->kvd_single_min_size_valid = 1;
1195 		break;
1196 	case MLXSW_KVD_DOUBLE_MIN_SIZE_ID:
1197 		resources->kvd_double_min_size = val;
1198 		resources->kvd_double_min_size_valid = 1;
1199 		break;
1200 	case MLXSW_MAX_VIRTUAL_ROUTERS_ID:
1201 		resources->max_virtual_routers = val;
1202 		resources->max_virtual_routers_valid = 1;
1203 		break;
1204 	case MLXSW_MAX_SYSTEM_PORT_ID:
1205 		resources->max_system_ports = val;
1206 		resources->max_system_ports_valid = 1;
1207 		break;
1208 	case MLXSW_MAX_VLAN_GROUPS_ID:
1209 		resources->max_vlan_groups = val;
1210 		resources->max_vlan_groups_valid = 1;
1211 		break;
1212 	case MLXSW_MAX_REGIONS_ID:
1213 		resources->max_regions = val;
1214 		resources->max_regions_valid = 1;
1215 		break;
1216 	case MLXSW_MAX_RIF_ID:
1217 		resources->max_rif = val;
1218 		resources->max_rif_valid = 1;
1219 		break;
1220 	default:
1221 		break;
1222 	}
1223 }
1224 
1225 static int mlxsw_pci_resources_query(struct mlxsw_pci *mlxsw_pci, char *mbox,
1226 				     struct mlxsw_resources *resources,
1227 				     u8 query_enabled)
1228 {
1229 	int index, i;
1230 	u64 data;
1231 	u16 id;
1232 	int err;
1233 
1234 	/* Not all the versions support resources query */
1235 	if (!query_enabled)
1236 		return 0;
1237 
1238 	mlxsw_cmd_mbox_zero(mbox);
1239 
1240 	for (index = 0; index < MLXSW_RESOURCES_QUERY_MAX_QUERIES; index++) {
1241 		err = mlxsw_cmd_query_resources(mlxsw_pci->core, mbox, index);
1242 		if (err)
1243 			return err;
1244 
1245 		for (i = 0; i < MLXSW_RESOURCES_PER_QUERY; i++) {
1246 			id = mlxsw_cmd_mbox_query_resource_id_get(mbox, i);
1247 			data = mlxsw_cmd_mbox_query_resource_data_get(mbox, i);
1248 
1249 			if (id == MLXSW_RESOURCES_TABLE_END_ID)
1250 				return 0;
1251 
1252 			mlxsw_pci_resources_query_parse(id, data, resources);
1253 		}
1254 	}
1255 
1256 	/* If after MLXSW_RESOURCES_QUERY_MAX_QUERIES we still didn't get
1257 	 * MLXSW_RESOURCES_TABLE_END_ID, something went bad in the FW.
1258 	 */
1259 	return -EIO;
1260 }
1261 
1262 static int mlxsw_pci_profile_get_kvd_sizes(const struct mlxsw_config_profile *profile,
1263 					   struct mlxsw_resources *resources)
1264 {
1265 	u32 singles_size, doubles_size, linear_size;
1266 
1267 	if (!resources->kvd_single_min_size_valid ||
1268 	    !resources->kvd_double_min_size_valid ||
1269 	    !profile->used_kvd_split_data)
1270 		return -EIO;
1271 
1272 	linear_size = profile->kvd_linear_size;
1273 
1274 	/* The hash part is what left of the kvd without the
1275 	 * linear part. It is split to the single size and
1276 	 * double size by the parts ratio from the profile.
1277 	 * Both sizes must be a multiplications of the
1278 	 * granularity from the profile.
1279 	 */
1280 	doubles_size = (resources->kvd_size - linear_size);
1281 	doubles_size *= profile->kvd_hash_double_parts;
1282 	doubles_size /= (profile->kvd_hash_double_parts +
1283 			 profile->kvd_hash_single_parts);
1284 	doubles_size /= profile->kvd_hash_granularity;
1285 	doubles_size *= profile->kvd_hash_granularity;
1286 	singles_size = resources->kvd_size - doubles_size -
1287 		       linear_size;
1288 
1289 	/* Check results are legal. */
1290 	if (singles_size < resources->kvd_single_min_size ||
1291 	    doubles_size < resources->kvd_double_min_size ||
1292 	    resources->kvd_size < linear_size)
1293 		return -EIO;
1294 
1295 	resources->kvd_single_size = singles_size;
1296 	resources->kvd_double_size = doubles_size;
1297 	resources->kvd_linear_size = linear_size;
1298 
1299 	return 0;
1300 }
1301 
1302 static int mlxsw_pci_config_profile(struct mlxsw_pci *mlxsw_pci, char *mbox,
1303 				    const struct mlxsw_config_profile *profile,
1304 				    struct mlxsw_resources *resources)
1305 {
1306 	int i;
1307 	int err;
1308 
1309 	mlxsw_cmd_mbox_zero(mbox);
1310 
1311 	if (profile->used_max_vepa_channels) {
1312 		mlxsw_cmd_mbox_config_profile_set_max_vepa_channels_set(
1313 			mbox, 1);
1314 		mlxsw_cmd_mbox_config_profile_max_vepa_channels_set(
1315 			mbox, profile->max_vepa_channels);
1316 	}
1317 	if (profile->used_max_mid) {
1318 		mlxsw_cmd_mbox_config_profile_set_max_mid_set(
1319 			mbox, 1);
1320 		mlxsw_cmd_mbox_config_profile_max_mid_set(
1321 			mbox, profile->max_mid);
1322 	}
1323 	if (profile->used_max_pgt) {
1324 		mlxsw_cmd_mbox_config_profile_set_max_pgt_set(
1325 			mbox, 1);
1326 		mlxsw_cmd_mbox_config_profile_max_pgt_set(
1327 			mbox, profile->max_pgt);
1328 	}
1329 	if (profile->used_max_system_port) {
1330 		mlxsw_cmd_mbox_config_profile_set_max_system_port_set(
1331 			mbox, 1);
1332 		mlxsw_cmd_mbox_config_profile_max_system_port_set(
1333 			mbox, profile->max_system_port);
1334 	}
1335 	if (profile->used_max_vlan_groups) {
1336 		mlxsw_cmd_mbox_config_profile_set_max_vlan_groups_set(
1337 			mbox, 1);
1338 		mlxsw_cmd_mbox_config_profile_max_vlan_groups_set(
1339 			mbox, profile->max_vlan_groups);
1340 	}
1341 	if (profile->used_max_regions) {
1342 		mlxsw_cmd_mbox_config_profile_set_max_regions_set(
1343 			mbox, 1);
1344 		mlxsw_cmd_mbox_config_profile_max_regions_set(
1345 			mbox, profile->max_regions);
1346 	}
1347 	if (profile->used_flood_tables) {
1348 		mlxsw_cmd_mbox_config_profile_set_flood_tables_set(
1349 			mbox, 1);
1350 		mlxsw_cmd_mbox_config_profile_max_flood_tables_set(
1351 			mbox, profile->max_flood_tables);
1352 		mlxsw_cmd_mbox_config_profile_max_vid_flood_tables_set(
1353 			mbox, profile->max_vid_flood_tables);
1354 		mlxsw_cmd_mbox_config_profile_max_fid_offset_flood_tables_set(
1355 			mbox, profile->max_fid_offset_flood_tables);
1356 		mlxsw_cmd_mbox_config_profile_fid_offset_flood_table_size_set(
1357 			mbox, profile->fid_offset_flood_table_size);
1358 		mlxsw_cmd_mbox_config_profile_max_fid_flood_tables_set(
1359 			mbox, profile->max_fid_flood_tables);
1360 		mlxsw_cmd_mbox_config_profile_fid_flood_table_size_set(
1361 			mbox, profile->fid_flood_table_size);
1362 	}
1363 	if (profile->used_flood_mode) {
1364 		mlxsw_cmd_mbox_config_profile_set_flood_mode_set(
1365 			mbox, 1);
1366 		mlxsw_cmd_mbox_config_profile_flood_mode_set(
1367 			mbox, profile->flood_mode);
1368 	}
1369 	if (profile->used_max_ib_mc) {
1370 		mlxsw_cmd_mbox_config_profile_set_max_ib_mc_set(
1371 			mbox, 1);
1372 		mlxsw_cmd_mbox_config_profile_max_ib_mc_set(
1373 			mbox, profile->max_ib_mc);
1374 	}
1375 	if (profile->used_max_pkey) {
1376 		mlxsw_cmd_mbox_config_profile_set_max_pkey_set(
1377 			mbox, 1);
1378 		mlxsw_cmd_mbox_config_profile_max_pkey_set(
1379 			mbox, profile->max_pkey);
1380 	}
1381 	if (profile->used_ar_sec) {
1382 		mlxsw_cmd_mbox_config_profile_set_ar_sec_set(
1383 			mbox, 1);
1384 		mlxsw_cmd_mbox_config_profile_ar_sec_set(
1385 			mbox, profile->ar_sec);
1386 	}
1387 	if (profile->used_adaptive_routing_group_cap) {
1388 		mlxsw_cmd_mbox_config_profile_set_adaptive_routing_group_cap_set(
1389 			mbox, 1);
1390 		mlxsw_cmd_mbox_config_profile_adaptive_routing_group_cap_set(
1391 			mbox, profile->adaptive_routing_group_cap);
1392 	}
1393 	if (resources->kvd_size_valid) {
1394 		err = mlxsw_pci_profile_get_kvd_sizes(profile, resources);
1395 		if (err)
1396 			return err;
1397 
1398 		mlxsw_cmd_mbox_config_profile_set_kvd_linear_size_set(mbox, 1);
1399 		mlxsw_cmd_mbox_config_profile_kvd_linear_size_set(mbox,
1400 						resources->kvd_linear_size);
1401 		mlxsw_cmd_mbox_config_profile_set_kvd_hash_single_size_set(mbox,
1402 									   1);
1403 		mlxsw_cmd_mbox_config_profile_kvd_hash_single_size_set(mbox,
1404 						resources->kvd_single_size);
1405 		mlxsw_cmd_mbox_config_profile_set_kvd_hash_double_size_set(
1406 								mbox, 1);
1407 		mlxsw_cmd_mbox_config_profile_kvd_hash_double_size_set(mbox,
1408 						resources->kvd_double_size);
1409 	}
1410 
1411 	for (i = 0; i < MLXSW_CONFIG_PROFILE_SWID_COUNT; i++)
1412 		mlxsw_pci_config_profile_swid_config(mlxsw_pci, mbox, i,
1413 						     &profile->swid_config[i]);
1414 
1415 	return mlxsw_cmd_config_profile_set(mlxsw_pci->core, mbox);
1416 }
1417 
1418 static int mlxsw_pci_boardinfo(struct mlxsw_pci *mlxsw_pci, char *mbox)
1419 {
1420 	struct mlxsw_bus_info *bus_info = &mlxsw_pci->bus_info;
1421 	int err;
1422 
1423 	mlxsw_cmd_mbox_zero(mbox);
1424 	err = mlxsw_cmd_boardinfo(mlxsw_pci->core, mbox);
1425 	if (err)
1426 		return err;
1427 	mlxsw_cmd_mbox_boardinfo_vsd_memcpy_from(mbox, bus_info->vsd);
1428 	mlxsw_cmd_mbox_boardinfo_psid_memcpy_from(mbox, bus_info->psid);
1429 	return 0;
1430 }
1431 
1432 static int mlxsw_pci_fw_area_init(struct mlxsw_pci *mlxsw_pci, char *mbox,
1433 				  u16 num_pages)
1434 {
1435 	struct mlxsw_pci_mem_item *mem_item;
1436 	int nent = 0;
1437 	int i;
1438 	int err;
1439 
1440 	mlxsw_pci->fw_area.items = kcalloc(num_pages, sizeof(*mem_item),
1441 					   GFP_KERNEL);
1442 	if (!mlxsw_pci->fw_area.items)
1443 		return -ENOMEM;
1444 	mlxsw_pci->fw_area.count = num_pages;
1445 
1446 	mlxsw_cmd_mbox_zero(mbox);
1447 	for (i = 0; i < num_pages; i++) {
1448 		mem_item = &mlxsw_pci->fw_area.items[i];
1449 
1450 		mem_item->size = MLXSW_PCI_PAGE_SIZE;
1451 		mem_item->buf = pci_alloc_consistent(mlxsw_pci->pdev,
1452 						     mem_item->size,
1453 						     &mem_item->mapaddr);
1454 		if (!mem_item->buf) {
1455 			err = -ENOMEM;
1456 			goto err_alloc;
1457 		}
1458 		mlxsw_cmd_mbox_map_fa_pa_set(mbox, nent, mem_item->mapaddr);
1459 		mlxsw_cmd_mbox_map_fa_log2size_set(mbox, nent, 0); /* 1 page */
1460 		if (++nent == MLXSW_CMD_MAP_FA_VPM_ENTRIES_MAX) {
1461 			err = mlxsw_cmd_map_fa(mlxsw_pci->core, mbox, nent);
1462 			if (err)
1463 				goto err_cmd_map_fa;
1464 			nent = 0;
1465 			mlxsw_cmd_mbox_zero(mbox);
1466 		}
1467 	}
1468 
1469 	if (nent) {
1470 		err = mlxsw_cmd_map_fa(mlxsw_pci->core, mbox, nent);
1471 		if (err)
1472 			goto err_cmd_map_fa;
1473 	}
1474 
1475 	return 0;
1476 
1477 err_cmd_map_fa:
1478 err_alloc:
1479 	for (i--; i >= 0; i--) {
1480 		mem_item = &mlxsw_pci->fw_area.items[i];
1481 
1482 		pci_free_consistent(mlxsw_pci->pdev, mem_item->size,
1483 				    mem_item->buf, mem_item->mapaddr);
1484 	}
1485 	kfree(mlxsw_pci->fw_area.items);
1486 	return err;
1487 }
1488 
1489 static void mlxsw_pci_fw_area_fini(struct mlxsw_pci *mlxsw_pci)
1490 {
1491 	struct mlxsw_pci_mem_item *mem_item;
1492 	int i;
1493 
1494 	mlxsw_cmd_unmap_fa(mlxsw_pci->core);
1495 
1496 	for (i = 0; i < mlxsw_pci->fw_area.count; i++) {
1497 		mem_item = &mlxsw_pci->fw_area.items[i];
1498 
1499 		pci_free_consistent(mlxsw_pci->pdev, mem_item->size,
1500 				    mem_item->buf, mem_item->mapaddr);
1501 	}
1502 	kfree(mlxsw_pci->fw_area.items);
1503 }
1504 
1505 static irqreturn_t mlxsw_pci_eq_irq_handler(int irq, void *dev_id)
1506 {
1507 	struct mlxsw_pci *mlxsw_pci = dev_id;
1508 	struct mlxsw_pci_queue *q;
1509 	int i;
1510 
1511 	for (i = 0; i < MLXSW_PCI_EQS_COUNT; i++) {
1512 		q = mlxsw_pci_eq_get(mlxsw_pci, i);
1513 		mlxsw_pci_queue_tasklet_schedule(q);
1514 	}
1515 	return IRQ_HANDLED;
1516 }
1517 
1518 static int mlxsw_pci_mbox_alloc(struct mlxsw_pci *mlxsw_pci,
1519 				struct mlxsw_pci_mem_item *mbox)
1520 {
1521 	struct pci_dev *pdev = mlxsw_pci->pdev;
1522 	int err = 0;
1523 
1524 	mbox->size = MLXSW_CMD_MBOX_SIZE;
1525 	mbox->buf = pci_alloc_consistent(pdev, MLXSW_CMD_MBOX_SIZE,
1526 					 &mbox->mapaddr);
1527 	if (!mbox->buf) {
1528 		dev_err(&pdev->dev, "Failed allocating memory for mailbox\n");
1529 		err = -ENOMEM;
1530 	}
1531 
1532 	return err;
1533 }
1534 
1535 static void mlxsw_pci_mbox_free(struct mlxsw_pci *mlxsw_pci,
1536 				struct mlxsw_pci_mem_item *mbox)
1537 {
1538 	struct pci_dev *pdev = mlxsw_pci->pdev;
1539 
1540 	pci_free_consistent(pdev, MLXSW_CMD_MBOX_SIZE, mbox->buf,
1541 			    mbox->mapaddr);
1542 }
1543 
1544 static int mlxsw_pci_init(void *bus_priv, struct mlxsw_core *mlxsw_core,
1545 			  const struct mlxsw_config_profile *profile,
1546 			  struct mlxsw_resources *resources)
1547 {
1548 	struct mlxsw_pci *mlxsw_pci = bus_priv;
1549 	struct pci_dev *pdev = mlxsw_pci->pdev;
1550 	char *mbox;
1551 	u16 num_pages;
1552 	int err;
1553 
1554 	mutex_init(&mlxsw_pci->cmd.lock);
1555 	init_waitqueue_head(&mlxsw_pci->cmd.wait);
1556 
1557 	mlxsw_pci->core = mlxsw_core;
1558 
1559 	mbox = mlxsw_cmd_mbox_alloc();
1560 	if (!mbox)
1561 		return -ENOMEM;
1562 
1563 	err = mlxsw_pci_mbox_alloc(mlxsw_pci, &mlxsw_pci->cmd.in_mbox);
1564 	if (err)
1565 		goto mbox_put;
1566 
1567 	err = mlxsw_pci_mbox_alloc(mlxsw_pci, &mlxsw_pci->cmd.out_mbox);
1568 	if (err)
1569 		goto err_out_mbox_alloc;
1570 
1571 	err = mlxsw_cmd_query_fw(mlxsw_core, mbox);
1572 	if (err)
1573 		goto err_query_fw;
1574 
1575 	mlxsw_pci->bus_info.fw_rev.major =
1576 		mlxsw_cmd_mbox_query_fw_fw_rev_major_get(mbox);
1577 	mlxsw_pci->bus_info.fw_rev.minor =
1578 		mlxsw_cmd_mbox_query_fw_fw_rev_minor_get(mbox);
1579 	mlxsw_pci->bus_info.fw_rev.subminor =
1580 		mlxsw_cmd_mbox_query_fw_fw_rev_subminor_get(mbox);
1581 
1582 	if (mlxsw_cmd_mbox_query_fw_cmd_interface_rev_get(mbox) != 1) {
1583 		dev_err(&pdev->dev, "Unsupported cmd interface revision ID queried from hw\n");
1584 		err = -EINVAL;
1585 		goto err_iface_rev;
1586 	}
1587 	if (mlxsw_cmd_mbox_query_fw_doorbell_page_bar_get(mbox) != 0) {
1588 		dev_err(&pdev->dev, "Unsupported doorbell page bar queried from hw\n");
1589 		err = -EINVAL;
1590 		goto err_doorbell_page_bar;
1591 	}
1592 
1593 	mlxsw_pci->doorbell_offset =
1594 		mlxsw_cmd_mbox_query_fw_doorbell_page_offset_get(mbox);
1595 
1596 	num_pages = mlxsw_cmd_mbox_query_fw_fw_pages_get(mbox);
1597 	err = mlxsw_pci_fw_area_init(mlxsw_pci, mbox, num_pages);
1598 	if (err)
1599 		goto err_fw_area_init;
1600 
1601 	err = mlxsw_pci_boardinfo(mlxsw_pci, mbox);
1602 	if (err)
1603 		goto err_boardinfo;
1604 
1605 	err = mlxsw_pci_resources_query(mlxsw_pci, mbox, resources,
1606 					profile->resource_query_enable);
1607 	if (err)
1608 		goto err_query_resources;
1609 
1610 	err = mlxsw_pci_config_profile(mlxsw_pci, mbox, profile, resources);
1611 	if (err)
1612 		goto err_config_profile;
1613 
1614 	err = mlxsw_pci_aqs_init(mlxsw_pci, mbox);
1615 	if (err)
1616 		goto err_aqs_init;
1617 
1618 	err = request_irq(mlxsw_pci->msix_entry.vector,
1619 			  mlxsw_pci_eq_irq_handler, 0,
1620 			  mlxsw_pci_driver_name, mlxsw_pci);
1621 	if (err) {
1622 		dev_err(&pdev->dev, "IRQ request failed\n");
1623 		goto err_request_eq_irq;
1624 	}
1625 
1626 	goto mbox_put;
1627 
1628 err_request_eq_irq:
1629 	mlxsw_pci_aqs_fini(mlxsw_pci);
1630 err_aqs_init:
1631 err_config_profile:
1632 err_query_resources:
1633 err_boardinfo:
1634 	mlxsw_pci_fw_area_fini(mlxsw_pci);
1635 err_fw_area_init:
1636 err_doorbell_page_bar:
1637 err_iface_rev:
1638 err_query_fw:
1639 	mlxsw_pci_mbox_free(mlxsw_pci, &mlxsw_pci->cmd.out_mbox);
1640 err_out_mbox_alloc:
1641 	mlxsw_pci_mbox_free(mlxsw_pci, &mlxsw_pci->cmd.in_mbox);
1642 mbox_put:
1643 	mlxsw_cmd_mbox_free(mbox);
1644 	return err;
1645 }
1646 
1647 static void mlxsw_pci_fini(void *bus_priv)
1648 {
1649 	struct mlxsw_pci *mlxsw_pci = bus_priv;
1650 
1651 	free_irq(mlxsw_pci->msix_entry.vector, mlxsw_pci);
1652 	mlxsw_pci_aqs_fini(mlxsw_pci);
1653 	mlxsw_pci_fw_area_fini(mlxsw_pci);
1654 	mlxsw_pci_mbox_free(mlxsw_pci, &mlxsw_pci->cmd.out_mbox);
1655 	mlxsw_pci_mbox_free(mlxsw_pci, &mlxsw_pci->cmd.in_mbox);
1656 }
1657 
1658 static struct mlxsw_pci_queue *
1659 mlxsw_pci_sdq_pick(struct mlxsw_pci *mlxsw_pci,
1660 		   const struct mlxsw_tx_info *tx_info)
1661 {
1662 	u8 sdqn = tx_info->local_port % mlxsw_pci_sdq_count(mlxsw_pci);
1663 
1664 	return mlxsw_pci_sdq_get(mlxsw_pci, sdqn);
1665 }
1666 
1667 static bool mlxsw_pci_skb_transmit_busy(void *bus_priv,
1668 					const struct mlxsw_tx_info *tx_info)
1669 {
1670 	struct mlxsw_pci *mlxsw_pci = bus_priv;
1671 	struct mlxsw_pci_queue *q = mlxsw_pci_sdq_pick(mlxsw_pci, tx_info);
1672 
1673 	return !mlxsw_pci_queue_elem_info_producer_get(q);
1674 }
1675 
1676 static int mlxsw_pci_skb_transmit(void *bus_priv, struct sk_buff *skb,
1677 				  const struct mlxsw_tx_info *tx_info)
1678 {
1679 	struct mlxsw_pci *mlxsw_pci = bus_priv;
1680 	struct mlxsw_pci_queue *q;
1681 	struct mlxsw_pci_queue_elem_info *elem_info;
1682 	char *wqe;
1683 	int i;
1684 	int err;
1685 
1686 	if (skb_shinfo(skb)->nr_frags > MLXSW_PCI_WQE_SG_ENTRIES - 1) {
1687 		err = skb_linearize(skb);
1688 		if (err)
1689 			return err;
1690 	}
1691 
1692 	q = mlxsw_pci_sdq_pick(mlxsw_pci, tx_info);
1693 	spin_lock_bh(&q->lock);
1694 	elem_info = mlxsw_pci_queue_elem_info_producer_get(q);
1695 	if (!elem_info) {
1696 		/* queue is full */
1697 		err = -EAGAIN;
1698 		goto unlock;
1699 	}
1700 	elem_info->u.sdq.skb = skb;
1701 
1702 	wqe = elem_info->elem;
1703 	mlxsw_pci_wqe_c_set(wqe, 1); /* always report completion */
1704 	mlxsw_pci_wqe_lp_set(wqe, !!tx_info->is_emad);
1705 	mlxsw_pci_wqe_type_set(wqe, MLXSW_PCI_WQE_TYPE_ETHERNET);
1706 
1707 	err = mlxsw_pci_wqe_frag_map(mlxsw_pci, wqe, 0, skb->data,
1708 				     skb_headlen(skb), DMA_TO_DEVICE);
1709 	if (err)
1710 		goto unlock;
1711 
1712 	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
1713 		const skb_frag_t *frag = &skb_shinfo(skb)->frags[i];
1714 
1715 		err = mlxsw_pci_wqe_frag_map(mlxsw_pci, wqe, i + 1,
1716 					     skb_frag_address(frag),
1717 					     skb_frag_size(frag),
1718 					     DMA_TO_DEVICE);
1719 		if (err)
1720 			goto unmap_frags;
1721 	}
1722 
1723 	/* Set unused sq entries byte count to zero. */
1724 	for (i++; i < MLXSW_PCI_WQE_SG_ENTRIES; i++)
1725 		mlxsw_pci_wqe_byte_count_set(wqe, i, 0);
1726 
1727 	/* Everything is set up, ring producer doorbell to get HW going */
1728 	q->producer_counter++;
1729 	mlxsw_pci_queue_doorbell_producer_ring(mlxsw_pci, q);
1730 
1731 	goto unlock;
1732 
1733 unmap_frags:
1734 	for (; i >= 0; i--)
1735 		mlxsw_pci_wqe_frag_unmap(mlxsw_pci, wqe, i, DMA_TO_DEVICE);
1736 unlock:
1737 	spin_unlock_bh(&q->lock);
1738 	return err;
1739 }
1740 
1741 static int mlxsw_pci_cmd_exec(void *bus_priv, u16 opcode, u8 opcode_mod,
1742 			      u32 in_mod, bool out_mbox_direct,
1743 			      char *in_mbox, size_t in_mbox_size,
1744 			      char *out_mbox, size_t out_mbox_size,
1745 			      u8 *p_status)
1746 {
1747 	struct mlxsw_pci *mlxsw_pci = bus_priv;
1748 	dma_addr_t in_mapaddr = mlxsw_pci->cmd.in_mbox.mapaddr;
1749 	dma_addr_t out_mapaddr = mlxsw_pci->cmd.out_mbox.mapaddr;
1750 	bool evreq = mlxsw_pci->cmd.nopoll;
1751 	unsigned long timeout = msecs_to_jiffies(MLXSW_PCI_CIR_TIMEOUT_MSECS);
1752 	bool *p_wait_done = &mlxsw_pci->cmd.wait_done;
1753 	int err;
1754 
1755 	*p_status = MLXSW_CMD_STATUS_OK;
1756 
1757 	err = mutex_lock_interruptible(&mlxsw_pci->cmd.lock);
1758 	if (err)
1759 		return err;
1760 
1761 	if (in_mbox)
1762 		memcpy(mlxsw_pci->cmd.in_mbox.buf, in_mbox, in_mbox_size);
1763 	mlxsw_pci_write32(mlxsw_pci, CIR_IN_PARAM_HI, upper_32_bits(in_mapaddr));
1764 	mlxsw_pci_write32(mlxsw_pci, CIR_IN_PARAM_LO, lower_32_bits(in_mapaddr));
1765 
1766 	mlxsw_pci_write32(mlxsw_pci, CIR_OUT_PARAM_HI, upper_32_bits(out_mapaddr));
1767 	mlxsw_pci_write32(mlxsw_pci, CIR_OUT_PARAM_LO, lower_32_bits(out_mapaddr));
1768 
1769 	mlxsw_pci_write32(mlxsw_pci, CIR_IN_MODIFIER, in_mod);
1770 	mlxsw_pci_write32(mlxsw_pci, CIR_TOKEN, 0);
1771 
1772 	*p_wait_done = false;
1773 
1774 	wmb(); /* all needs to be written before we write control register */
1775 	mlxsw_pci_write32(mlxsw_pci, CIR_CTRL,
1776 			  MLXSW_PCI_CIR_CTRL_GO_BIT |
1777 			  (evreq ? MLXSW_PCI_CIR_CTRL_EVREQ_BIT : 0) |
1778 			  (opcode_mod << MLXSW_PCI_CIR_CTRL_OPCODE_MOD_SHIFT) |
1779 			  opcode);
1780 
1781 	if (!evreq) {
1782 		unsigned long end;
1783 
1784 		end = jiffies + timeout;
1785 		do {
1786 			u32 ctrl = mlxsw_pci_read32(mlxsw_pci, CIR_CTRL);
1787 
1788 			if (!(ctrl & MLXSW_PCI_CIR_CTRL_GO_BIT)) {
1789 				*p_wait_done = true;
1790 				*p_status = ctrl >> MLXSW_PCI_CIR_CTRL_STATUS_SHIFT;
1791 				break;
1792 			}
1793 			cond_resched();
1794 		} while (time_before(jiffies, end));
1795 	} else {
1796 		wait_event_timeout(mlxsw_pci->cmd.wait, *p_wait_done, timeout);
1797 		*p_status = mlxsw_pci->cmd.comp.status;
1798 	}
1799 
1800 	err = 0;
1801 	if (*p_wait_done) {
1802 		if (*p_status)
1803 			err = -EIO;
1804 	} else {
1805 		err = -ETIMEDOUT;
1806 	}
1807 
1808 	if (!err && out_mbox && out_mbox_direct) {
1809 		/* Some commands don't use output param as address to mailbox
1810 		 * but they store output directly into registers. In that case,
1811 		 * copy registers into mbox buffer.
1812 		 */
1813 		__be32 tmp;
1814 
1815 		if (!evreq) {
1816 			tmp = cpu_to_be32(mlxsw_pci_read32(mlxsw_pci,
1817 							   CIR_OUT_PARAM_HI));
1818 			memcpy(out_mbox, &tmp, sizeof(tmp));
1819 			tmp = cpu_to_be32(mlxsw_pci_read32(mlxsw_pci,
1820 							   CIR_OUT_PARAM_LO));
1821 			memcpy(out_mbox + sizeof(tmp), &tmp, sizeof(tmp));
1822 		}
1823 	} else if (!err && out_mbox) {
1824 		memcpy(out_mbox, mlxsw_pci->cmd.out_mbox.buf, out_mbox_size);
1825 	}
1826 
1827 	mutex_unlock(&mlxsw_pci->cmd.lock);
1828 
1829 	return err;
1830 }
1831 
1832 static const struct mlxsw_bus mlxsw_pci_bus = {
1833 	.kind			= "pci",
1834 	.init			= mlxsw_pci_init,
1835 	.fini			= mlxsw_pci_fini,
1836 	.skb_transmit_busy	= mlxsw_pci_skb_transmit_busy,
1837 	.skb_transmit		= mlxsw_pci_skb_transmit,
1838 	.cmd_exec		= mlxsw_pci_cmd_exec,
1839 };
1840 
1841 static int mlxsw_pci_sw_reset(struct mlxsw_pci *mlxsw_pci,
1842 			      const struct pci_device_id *id)
1843 {
1844 	unsigned long end;
1845 
1846 	mlxsw_pci_write32(mlxsw_pci, SW_RESET, MLXSW_PCI_SW_RESET_RST_BIT);
1847 	if (id->device == PCI_DEVICE_ID_MELLANOX_SWITCHX2) {
1848 		msleep(MLXSW_PCI_SW_RESET_TIMEOUT_MSECS);
1849 		return 0;
1850 	}
1851 
1852 	wmb(); /* reset needs to be written before we read control register */
1853 	end = jiffies + msecs_to_jiffies(MLXSW_PCI_SW_RESET_TIMEOUT_MSECS);
1854 	do {
1855 		u32 val = mlxsw_pci_read32(mlxsw_pci, FW_READY);
1856 
1857 		if ((val & MLXSW_PCI_FW_READY_MASK) == MLXSW_PCI_FW_READY_MAGIC)
1858 			break;
1859 		cond_resched();
1860 	} while (time_before(jiffies, end));
1861 	return 0;
1862 }
1863 
1864 static int mlxsw_pci_probe(struct pci_dev *pdev, const struct pci_device_id *id)
1865 {
1866 	struct mlxsw_pci *mlxsw_pci;
1867 	int err;
1868 
1869 	mlxsw_pci = kzalloc(sizeof(*mlxsw_pci), GFP_KERNEL);
1870 	if (!mlxsw_pci)
1871 		return -ENOMEM;
1872 
1873 	err = pci_enable_device(pdev);
1874 	if (err) {
1875 		dev_err(&pdev->dev, "pci_enable_device failed\n");
1876 		goto err_pci_enable_device;
1877 	}
1878 
1879 	err = pci_request_regions(pdev, mlxsw_pci_driver_name);
1880 	if (err) {
1881 		dev_err(&pdev->dev, "pci_request_regions failed\n");
1882 		goto err_pci_request_regions;
1883 	}
1884 
1885 	err = pci_set_dma_mask(pdev, DMA_BIT_MASK(64));
1886 	if (!err) {
1887 		err = pci_set_consistent_dma_mask(pdev, DMA_BIT_MASK(64));
1888 		if (err) {
1889 			dev_err(&pdev->dev, "pci_set_consistent_dma_mask failed\n");
1890 			goto err_pci_set_dma_mask;
1891 		}
1892 	} else {
1893 		err = pci_set_dma_mask(pdev, DMA_BIT_MASK(32));
1894 		if (err) {
1895 			dev_err(&pdev->dev, "pci_set_dma_mask failed\n");
1896 			goto err_pci_set_dma_mask;
1897 		}
1898 	}
1899 
1900 	if (pci_resource_len(pdev, 0) < MLXSW_PCI_BAR0_SIZE) {
1901 		dev_err(&pdev->dev, "invalid PCI region size\n");
1902 		err = -EINVAL;
1903 		goto err_pci_resource_len_check;
1904 	}
1905 
1906 	mlxsw_pci->hw_addr = ioremap(pci_resource_start(pdev, 0),
1907 				     pci_resource_len(pdev, 0));
1908 	if (!mlxsw_pci->hw_addr) {
1909 		dev_err(&pdev->dev, "ioremap failed\n");
1910 		err = -EIO;
1911 		goto err_ioremap;
1912 	}
1913 	pci_set_master(pdev);
1914 
1915 	mlxsw_pci->pdev = pdev;
1916 	pci_set_drvdata(pdev, mlxsw_pci);
1917 
1918 	err = mlxsw_pci_sw_reset(mlxsw_pci, id);
1919 	if (err) {
1920 		dev_err(&pdev->dev, "Software reset failed\n");
1921 		goto err_sw_reset;
1922 	}
1923 
1924 	err = pci_enable_msix_exact(pdev, &mlxsw_pci->msix_entry, 1);
1925 	if (err) {
1926 		dev_err(&pdev->dev, "MSI-X init failed\n");
1927 		goto err_msix_init;
1928 	}
1929 
1930 	mlxsw_pci->bus_info.device_kind = mlxsw_pci_device_kind_get(id);
1931 	mlxsw_pci->bus_info.device_name = pci_name(mlxsw_pci->pdev);
1932 	mlxsw_pci->bus_info.dev = &pdev->dev;
1933 
1934 	mlxsw_pci->dbg_dir = debugfs_create_dir(mlxsw_pci->bus_info.device_name,
1935 						mlxsw_pci_dbg_root);
1936 	if (!mlxsw_pci->dbg_dir) {
1937 		dev_err(&pdev->dev, "Failed to create debugfs dir\n");
1938 		err = -ENOMEM;
1939 		goto err_dbg_create_dir;
1940 	}
1941 
1942 	err = mlxsw_core_bus_device_register(&mlxsw_pci->bus_info,
1943 					     &mlxsw_pci_bus, mlxsw_pci);
1944 	if (err) {
1945 		dev_err(&pdev->dev, "cannot register bus device\n");
1946 		goto err_bus_device_register;
1947 	}
1948 
1949 	return 0;
1950 
1951 err_bus_device_register:
1952 	debugfs_remove_recursive(mlxsw_pci->dbg_dir);
1953 err_dbg_create_dir:
1954 	pci_disable_msix(mlxsw_pci->pdev);
1955 err_msix_init:
1956 err_sw_reset:
1957 	iounmap(mlxsw_pci->hw_addr);
1958 err_ioremap:
1959 err_pci_resource_len_check:
1960 err_pci_set_dma_mask:
1961 	pci_release_regions(pdev);
1962 err_pci_request_regions:
1963 	pci_disable_device(pdev);
1964 err_pci_enable_device:
1965 	kfree(mlxsw_pci);
1966 	return err;
1967 }
1968 
1969 static void mlxsw_pci_remove(struct pci_dev *pdev)
1970 {
1971 	struct mlxsw_pci *mlxsw_pci = pci_get_drvdata(pdev);
1972 
1973 	mlxsw_core_bus_device_unregister(mlxsw_pci->core);
1974 	debugfs_remove_recursive(mlxsw_pci->dbg_dir);
1975 	pci_disable_msix(mlxsw_pci->pdev);
1976 	iounmap(mlxsw_pci->hw_addr);
1977 	pci_release_regions(mlxsw_pci->pdev);
1978 	pci_disable_device(mlxsw_pci->pdev);
1979 	kfree(mlxsw_pci);
1980 }
1981 
1982 static struct pci_driver mlxsw_pci_driver = {
1983 	.name		= mlxsw_pci_driver_name,
1984 	.id_table	= mlxsw_pci_id_table,
1985 	.probe		= mlxsw_pci_probe,
1986 	.remove		= mlxsw_pci_remove,
1987 };
1988 
1989 static int __init mlxsw_pci_module_init(void)
1990 {
1991 	int err;
1992 
1993 	mlxsw_pci_dbg_root = debugfs_create_dir(mlxsw_pci_driver_name, NULL);
1994 	if (!mlxsw_pci_dbg_root)
1995 		return -ENOMEM;
1996 	err = pci_register_driver(&mlxsw_pci_driver);
1997 	if (err)
1998 		goto err_register_driver;
1999 	return 0;
2000 
2001 err_register_driver:
2002 	debugfs_remove_recursive(mlxsw_pci_dbg_root);
2003 	return err;
2004 }
2005 
2006 static void __exit mlxsw_pci_module_exit(void)
2007 {
2008 	pci_unregister_driver(&mlxsw_pci_driver);
2009 	debugfs_remove_recursive(mlxsw_pci_dbg_root);
2010 }
2011 
2012 module_init(mlxsw_pci_module_init);
2013 module_exit(mlxsw_pci_module_exit);
2014 
2015 MODULE_LICENSE("Dual BSD/GPL");
2016 MODULE_AUTHOR("Jiri Pirko <jiri@mellanox.com>");
2017 MODULE_DESCRIPTION("Mellanox switch PCI interface driver");
2018 MODULE_DEVICE_TABLE(pci, mlxsw_pci_id_table);
2019