xref: /openbmc/linux/drivers/net/ethernet/chelsio/cxgb4/cudbg_lib.c (revision 4f727ecefefbd180de10e25b3e74c03dce3f1e75)
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  *  Copyright (C) 2017 Chelsio Communications.  All rights reserved.
4  */
5 
6 #include <linux/sort.h>
7 
8 #include "t4_regs.h"
9 #include "cxgb4.h"
10 #include "cxgb4_cudbg.h"
11 #include "cudbg_if.h"
12 #include "cudbg_lib_common.h"
13 #include "cudbg_entity.h"
14 #include "cudbg_lib.h"
15 #include "cudbg_zlib.h"
16 
17 static int cudbg_do_compression(struct cudbg_init *pdbg_init,
18 				struct cudbg_buffer *pin_buff,
19 				struct cudbg_buffer *dbg_buff)
20 {
21 	struct cudbg_buffer temp_in_buff = { 0 };
22 	int bytes_left, bytes_read, bytes;
23 	u32 offset = dbg_buff->offset;
24 	int rc;
25 
26 	temp_in_buff.offset = pin_buff->offset;
27 	temp_in_buff.data = pin_buff->data;
28 	temp_in_buff.size = pin_buff->size;
29 
30 	bytes_left = pin_buff->size;
31 	bytes_read = 0;
32 	while (bytes_left > 0) {
33 		/* Do compression in smaller chunks */
34 		bytes = min_t(unsigned long, bytes_left,
35 			      (unsigned long)CUDBG_CHUNK_SIZE);
36 		temp_in_buff.data = (char *)pin_buff->data + bytes_read;
37 		temp_in_buff.size = bytes;
38 		rc = cudbg_compress_buff(pdbg_init, &temp_in_buff, dbg_buff);
39 		if (rc)
40 			return rc;
41 		bytes_left -= bytes;
42 		bytes_read += bytes;
43 	}
44 
45 	pin_buff->size = dbg_buff->offset - offset;
46 	return 0;
47 }
48 
49 static int cudbg_write_and_release_buff(struct cudbg_init *pdbg_init,
50 					struct cudbg_buffer *pin_buff,
51 					struct cudbg_buffer *dbg_buff)
52 {
53 	int rc = 0;
54 
55 	if (pdbg_init->compress_type == CUDBG_COMPRESSION_NONE) {
56 		cudbg_update_buff(pin_buff, dbg_buff);
57 	} else {
58 		rc = cudbg_do_compression(pdbg_init, pin_buff, dbg_buff);
59 		if (rc)
60 			goto out;
61 	}
62 
63 out:
64 	cudbg_put_buff(pdbg_init, pin_buff);
65 	return rc;
66 }
67 
68 static int is_fw_attached(struct cudbg_init *pdbg_init)
69 {
70 	struct adapter *padap = pdbg_init->adap;
71 
72 	if (!(padap->flags & CXGB4_FW_OK) || padap->use_bd)
73 		return 0;
74 
75 	return 1;
76 }
77 
78 /* This function will add additional padding bytes into debug_buffer to make it
79  * 4 byte aligned.
80  */
81 void cudbg_align_debug_buffer(struct cudbg_buffer *dbg_buff,
82 			      struct cudbg_entity_hdr *entity_hdr)
83 {
84 	u8 zero_buf[4] = {0};
85 	u8 padding, remain;
86 
87 	remain = (dbg_buff->offset - entity_hdr->start_offset) % 4;
88 	padding = 4 - remain;
89 	if (remain) {
90 		memcpy(((u8 *)dbg_buff->data) + dbg_buff->offset, &zero_buf,
91 		       padding);
92 		dbg_buff->offset += padding;
93 		entity_hdr->num_pad = padding;
94 	}
95 	entity_hdr->size = dbg_buff->offset - entity_hdr->start_offset;
96 }
97 
98 struct cudbg_entity_hdr *cudbg_get_entity_hdr(void *outbuf, int i)
99 {
100 	struct cudbg_hdr *cudbg_hdr = (struct cudbg_hdr *)outbuf;
101 
102 	return (struct cudbg_entity_hdr *)
103 	       ((char *)outbuf + cudbg_hdr->hdr_len +
104 		(sizeof(struct cudbg_entity_hdr) * (i - 1)));
105 }
106 
107 static int cudbg_read_vpd_reg(struct adapter *padap, u32 addr, u32 len,
108 			      void *dest)
109 {
110 	int vaddr, rc;
111 
112 	vaddr = t4_eeprom_ptov(addr, padap->pf, EEPROMPFSIZE);
113 	if (vaddr < 0)
114 		return vaddr;
115 
116 	rc = pci_read_vpd(padap->pdev, vaddr, len, dest);
117 	if (rc < 0)
118 		return rc;
119 
120 	return 0;
121 }
122 
123 static int cudbg_mem_desc_cmp(const void *a, const void *b)
124 {
125 	return ((const struct cudbg_mem_desc *)a)->base -
126 	       ((const struct cudbg_mem_desc *)b)->base;
127 }
128 
129 int cudbg_fill_meminfo(struct adapter *padap,
130 		       struct cudbg_meminfo *meminfo_buff)
131 {
132 	struct cudbg_mem_desc *md;
133 	u32 lo, hi, used, alloc;
134 	int n, i;
135 
136 	memset(meminfo_buff->avail, 0,
137 	       ARRAY_SIZE(meminfo_buff->avail) *
138 	       sizeof(struct cudbg_mem_desc));
139 	memset(meminfo_buff->mem, 0,
140 	       (ARRAY_SIZE(cudbg_region) + 3) * sizeof(struct cudbg_mem_desc));
141 	md  = meminfo_buff->mem;
142 
143 	for (i = 0; i < ARRAY_SIZE(meminfo_buff->mem); i++) {
144 		meminfo_buff->mem[i].limit = 0;
145 		meminfo_buff->mem[i].idx = i;
146 	}
147 
148 	/* Find and sort the populated memory ranges */
149 	i = 0;
150 	lo = t4_read_reg(padap, MA_TARGET_MEM_ENABLE_A);
151 	if (lo & EDRAM0_ENABLE_F) {
152 		hi = t4_read_reg(padap, MA_EDRAM0_BAR_A);
153 		meminfo_buff->avail[i].base =
154 			cudbg_mbytes_to_bytes(EDRAM0_BASE_G(hi));
155 		meminfo_buff->avail[i].limit =
156 			meminfo_buff->avail[i].base +
157 			cudbg_mbytes_to_bytes(EDRAM0_SIZE_G(hi));
158 		meminfo_buff->avail[i].idx = 0;
159 		i++;
160 	}
161 
162 	if (lo & EDRAM1_ENABLE_F) {
163 		hi =  t4_read_reg(padap, MA_EDRAM1_BAR_A);
164 		meminfo_buff->avail[i].base =
165 			cudbg_mbytes_to_bytes(EDRAM1_BASE_G(hi));
166 		meminfo_buff->avail[i].limit =
167 			meminfo_buff->avail[i].base +
168 			cudbg_mbytes_to_bytes(EDRAM1_SIZE_G(hi));
169 		meminfo_buff->avail[i].idx = 1;
170 		i++;
171 	}
172 
173 	if (is_t5(padap->params.chip)) {
174 		if (lo & EXT_MEM0_ENABLE_F) {
175 			hi = t4_read_reg(padap, MA_EXT_MEMORY0_BAR_A);
176 			meminfo_buff->avail[i].base =
177 				cudbg_mbytes_to_bytes(EXT_MEM_BASE_G(hi));
178 			meminfo_buff->avail[i].limit =
179 				meminfo_buff->avail[i].base +
180 				cudbg_mbytes_to_bytes(EXT_MEM_SIZE_G(hi));
181 			meminfo_buff->avail[i].idx = 3;
182 			i++;
183 		}
184 
185 		if (lo & EXT_MEM1_ENABLE_F) {
186 			hi = t4_read_reg(padap, MA_EXT_MEMORY1_BAR_A);
187 			meminfo_buff->avail[i].base =
188 				cudbg_mbytes_to_bytes(EXT_MEM1_BASE_G(hi));
189 			meminfo_buff->avail[i].limit =
190 				meminfo_buff->avail[i].base +
191 				cudbg_mbytes_to_bytes(EXT_MEM1_SIZE_G(hi));
192 			meminfo_buff->avail[i].idx = 4;
193 			i++;
194 		}
195 	} else {
196 		if (lo & EXT_MEM_ENABLE_F) {
197 			hi = t4_read_reg(padap, MA_EXT_MEMORY_BAR_A);
198 			meminfo_buff->avail[i].base =
199 				cudbg_mbytes_to_bytes(EXT_MEM_BASE_G(hi));
200 			meminfo_buff->avail[i].limit =
201 				meminfo_buff->avail[i].base +
202 				cudbg_mbytes_to_bytes(EXT_MEM_SIZE_G(hi));
203 			meminfo_buff->avail[i].idx = 2;
204 			i++;
205 		}
206 
207 		if (lo & HMA_MUX_F) {
208 			hi = t4_read_reg(padap, MA_EXT_MEMORY1_BAR_A);
209 			meminfo_buff->avail[i].base =
210 				cudbg_mbytes_to_bytes(EXT_MEM1_BASE_G(hi));
211 			meminfo_buff->avail[i].limit =
212 				meminfo_buff->avail[i].base +
213 				cudbg_mbytes_to_bytes(EXT_MEM1_SIZE_G(hi));
214 			meminfo_buff->avail[i].idx = 5;
215 			i++;
216 		}
217 	}
218 
219 	if (!i) /* no memory available */
220 		return CUDBG_STATUS_ENTITY_NOT_FOUND;
221 
222 	meminfo_buff->avail_c = i;
223 	sort(meminfo_buff->avail, i, sizeof(struct cudbg_mem_desc),
224 	     cudbg_mem_desc_cmp, NULL);
225 	(md++)->base = t4_read_reg(padap, SGE_DBQ_CTXT_BADDR_A);
226 	(md++)->base = t4_read_reg(padap, SGE_IMSG_CTXT_BADDR_A);
227 	(md++)->base = t4_read_reg(padap, SGE_FLM_CACHE_BADDR_A);
228 	(md++)->base = t4_read_reg(padap, TP_CMM_TCB_BASE_A);
229 	(md++)->base = t4_read_reg(padap, TP_CMM_MM_BASE_A);
230 	(md++)->base = t4_read_reg(padap, TP_CMM_TIMER_BASE_A);
231 	(md++)->base = t4_read_reg(padap, TP_CMM_MM_RX_FLST_BASE_A);
232 	(md++)->base = t4_read_reg(padap, TP_CMM_MM_TX_FLST_BASE_A);
233 	(md++)->base = t4_read_reg(padap, TP_CMM_MM_PS_FLST_BASE_A);
234 
235 	/* the next few have explicit upper bounds */
236 	md->base = t4_read_reg(padap, TP_PMM_TX_BASE_A);
237 	md->limit = md->base - 1 +
238 		    t4_read_reg(padap, TP_PMM_TX_PAGE_SIZE_A) *
239 		    PMTXMAXPAGE_G(t4_read_reg(padap, TP_PMM_TX_MAX_PAGE_A));
240 	md++;
241 
242 	md->base = t4_read_reg(padap, TP_PMM_RX_BASE_A);
243 	md->limit = md->base - 1 +
244 		    t4_read_reg(padap, TP_PMM_RX_PAGE_SIZE_A) *
245 		    PMRXMAXPAGE_G(t4_read_reg(padap, TP_PMM_RX_MAX_PAGE_A));
246 	md++;
247 
248 	if (t4_read_reg(padap, LE_DB_CONFIG_A) & HASHEN_F) {
249 		if (CHELSIO_CHIP_VERSION(padap->params.chip) <= CHELSIO_T5) {
250 			hi = t4_read_reg(padap, LE_DB_TID_HASHBASE_A) / 4;
251 			md->base = t4_read_reg(padap, LE_DB_HASH_TID_BASE_A);
252 		} else {
253 			hi = t4_read_reg(padap, LE_DB_HASH_TID_BASE_A);
254 			md->base = t4_read_reg(padap,
255 					       LE_DB_HASH_TBL_BASE_ADDR_A);
256 		}
257 		md->limit = 0;
258 	} else {
259 		md->base = 0;
260 		md->idx = ARRAY_SIZE(cudbg_region);  /* hide it */
261 	}
262 	md++;
263 
264 #define ulp_region(reg) do { \
265 	md->base = t4_read_reg(padap, ULP_ ## reg ## _LLIMIT_A);\
266 	(md++)->limit = t4_read_reg(padap, ULP_ ## reg ## _ULIMIT_A);\
267 } while (0)
268 
269 	ulp_region(RX_ISCSI);
270 	ulp_region(RX_TDDP);
271 	ulp_region(TX_TPT);
272 	ulp_region(RX_STAG);
273 	ulp_region(RX_RQ);
274 	ulp_region(RX_RQUDP);
275 	ulp_region(RX_PBL);
276 	ulp_region(TX_PBL);
277 #undef ulp_region
278 	md->base = 0;
279 	md->idx = ARRAY_SIZE(cudbg_region);
280 	if (!is_t4(padap->params.chip)) {
281 		u32 fifo_size = t4_read_reg(padap, SGE_DBVFIFO_SIZE_A);
282 		u32 sge_ctrl = t4_read_reg(padap, SGE_CONTROL2_A);
283 		u32 size = 0;
284 
285 		if (is_t5(padap->params.chip)) {
286 			if (sge_ctrl & VFIFO_ENABLE_F)
287 				size = DBVFIFO_SIZE_G(fifo_size);
288 		} else {
289 			size = T6_DBVFIFO_SIZE_G(fifo_size);
290 		}
291 
292 		if (size) {
293 			md->base = BASEADDR_G(t4_read_reg(padap,
294 							  SGE_DBVFIFO_BADDR_A));
295 			md->limit = md->base + (size << 2) - 1;
296 		}
297 	}
298 
299 	md++;
300 
301 	md->base = t4_read_reg(padap, ULP_RX_CTX_BASE_A);
302 	md->limit = 0;
303 	md++;
304 	md->base = t4_read_reg(padap, ULP_TX_ERR_TABLE_BASE_A);
305 	md->limit = 0;
306 	md++;
307 
308 	md->base = padap->vres.ocq.start;
309 	if (padap->vres.ocq.size)
310 		md->limit = md->base + padap->vres.ocq.size - 1;
311 	else
312 		md->idx = ARRAY_SIZE(cudbg_region);  /* hide it */
313 	md++;
314 
315 	/* add any address-space holes, there can be up to 3 */
316 	for (n = 0; n < i - 1; n++)
317 		if (meminfo_buff->avail[n].limit <
318 		    meminfo_buff->avail[n + 1].base)
319 			(md++)->base = meminfo_buff->avail[n].limit;
320 
321 	if (meminfo_buff->avail[n].limit)
322 		(md++)->base = meminfo_buff->avail[n].limit;
323 
324 	n = md - meminfo_buff->mem;
325 	meminfo_buff->mem_c = n;
326 
327 	sort(meminfo_buff->mem, n, sizeof(struct cudbg_mem_desc),
328 	     cudbg_mem_desc_cmp, NULL);
329 
330 	lo = t4_read_reg(padap, CIM_SDRAM_BASE_ADDR_A);
331 	hi = t4_read_reg(padap, CIM_SDRAM_ADDR_SIZE_A) + lo - 1;
332 	meminfo_buff->up_ram_lo = lo;
333 	meminfo_buff->up_ram_hi = hi;
334 
335 	lo = t4_read_reg(padap, CIM_EXTMEM2_BASE_ADDR_A);
336 	hi = t4_read_reg(padap, CIM_EXTMEM2_ADDR_SIZE_A) + lo - 1;
337 	meminfo_buff->up_extmem2_lo = lo;
338 	meminfo_buff->up_extmem2_hi = hi;
339 
340 	lo = t4_read_reg(padap, TP_PMM_RX_MAX_PAGE_A);
341 	for (i = 0, meminfo_buff->free_rx_cnt = 0; i < 2; i++)
342 		meminfo_buff->free_rx_cnt +=
343 			FREERXPAGECOUNT_G(t4_read_reg(padap,
344 						      TP_FLM_FREE_RX_CNT_A));
345 
346 	meminfo_buff->rx_pages_data[0] =  PMRXMAXPAGE_G(lo);
347 	meminfo_buff->rx_pages_data[1] =
348 		t4_read_reg(padap, TP_PMM_RX_PAGE_SIZE_A) >> 10;
349 	meminfo_buff->rx_pages_data[2] = (lo & PMRXNUMCHN_F) ? 2 : 1;
350 
351 	lo = t4_read_reg(padap, TP_PMM_TX_MAX_PAGE_A);
352 	hi = t4_read_reg(padap, TP_PMM_TX_PAGE_SIZE_A);
353 	for (i = 0, meminfo_buff->free_tx_cnt = 0; i < 4; i++)
354 		meminfo_buff->free_tx_cnt +=
355 			FREETXPAGECOUNT_G(t4_read_reg(padap,
356 						      TP_FLM_FREE_TX_CNT_A));
357 
358 	meminfo_buff->tx_pages_data[0] = PMTXMAXPAGE_G(lo);
359 	meminfo_buff->tx_pages_data[1] =
360 		hi >= (1 << 20) ? (hi >> 20) : (hi >> 10);
361 	meminfo_buff->tx_pages_data[2] =
362 		hi >= (1 << 20) ? 'M' : 'K';
363 	meminfo_buff->tx_pages_data[3] = 1 << PMTXNUMCHN_G(lo);
364 
365 	meminfo_buff->p_structs = t4_read_reg(padap, TP_CMM_MM_MAX_PSTRUCT_A);
366 	meminfo_buff->p_structs_free_cnt =
367 		FREEPSTRUCTCOUNT_G(t4_read_reg(padap, TP_FLM_FREE_PS_CNT_A));
368 
369 	for (i = 0; i < 4; i++) {
370 		if (CHELSIO_CHIP_VERSION(padap->params.chip) > CHELSIO_T5)
371 			lo = t4_read_reg(padap,
372 					 MPS_RX_MAC_BG_PG_CNT0_A + i * 4);
373 		else
374 			lo = t4_read_reg(padap, MPS_RX_PG_RSV0_A + i * 4);
375 		if (is_t5(padap->params.chip)) {
376 			used = T5_USED_G(lo);
377 			alloc = T5_ALLOC_G(lo);
378 		} else {
379 			used = USED_G(lo);
380 			alloc = ALLOC_G(lo);
381 		}
382 		meminfo_buff->port_used[i] = used;
383 		meminfo_buff->port_alloc[i] = alloc;
384 	}
385 
386 	for (i = 0; i < padap->params.arch.nchan; i++) {
387 		if (CHELSIO_CHIP_VERSION(padap->params.chip) > CHELSIO_T5)
388 			lo = t4_read_reg(padap,
389 					 MPS_RX_LPBK_BG_PG_CNT0_A + i * 4);
390 		else
391 			lo = t4_read_reg(padap, MPS_RX_PG_RSV4_A + i * 4);
392 		if (is_t5(padap->params.chip)) {
393 			used = T5_USED_G(lo);
394 			alloc = T5_ALLOC_G(lo);
395 		} else {
396 			used = USED_G(lo);
397 			alloc = ALLOC_G(lo);
398 		}
399 		meminfo_buff->loopback_used[i] = used;
400 		meminfo_buff->loopback_alloc[i] = alloc;
401 	}
402 
403 	return 0;
404 }
405 
406 int cudbg_collect_reg_dump(struct cudbg_init *pdbg_init,
407 			   struct cudbg_buffer *dbg_buff,
408 			   struct cudbg_error *cudbg_err)
409 {
410 	struct adapter *padap = pdbg_init->adap;
411 	struct cudbg_buffer temp_buff = { 0 };
412 	u32 buf_size = 0;
413 	int rc = 0;
414 
415 	if (is_t4(padap->params.chip))
416 		buf_size = T4_REGMAP_SIZE;
417 	else if (is_t5(padap->params.chip) || is_t6(padap->params.chip))
418 		buf_size = T5_REGMAP_SIZE;
419 
420 	rc = cudbg_get_buff(pdbg_init, dbg_buff, buf_size, &temp_buff);
421 	if (rc)
422 		return rc;
423 	t4_get_regs(padap, (void *)temp_buff.data, temp_buff.size);
424 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
425 }
426 
427 int cudbg_collect_fw_devlog(struct cudbg_init *pdbg_init,
428 			    struct cudbg_buffer *dbg_buff,
429 			    struct cudbg_error *cudbg_err)
430 {
431 	struct adapter *padap = pdbg_init->adap;
432 	struct cudbg_buffer temp_buff = { 0 };
433 	struct devlog_params *dparams;
434 	int rc = 0;
435 
436 	rc = t4_init_devlog_params(padap);
437 	if (rc < 0) {
438 		cudbg_err->sys_err = rc;
439 		return rc;
440 	}
441 
442 	dparams = &padap->params.devlog;
443 	rc = cudbg_get_buff(pdbg_init, dbg_buff, dparams->size, &temp_buff);
444 	if (rc)
445 		return rc;
446 
447 	/* Collect FW devlog */
448 	if (dparams->start != 0) {
449 		spin_lock(&padap->win0_lock);
450 		rc = t4_memory_rw(padap, padap->params.drv_memwin,
451 				  dparams->memtype, dparams->start,
452 				  dparams->size,
453 				  (__be32 *)(char *)temp_buff.data,
454 				  1);
455 		spin_unlock(&padap->win0_lock);
456 		if (rc) {
457 			cudbg_err->sys_err = rc;
458 			cudbg_put_buff(pdbg_init, &temp_buff);
459 			return rc;
460 		}
461 	}
462 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
463 }
464 
465 int cudbg_collect_cim_la(struct cudbg_init *pdbg_init,
466 			 struct cudbg_buffer *dbg_buff,
467 			 struct cudbg_error *cudbg_err)
468 {
469 	struct adapter *padap = pdbg_init->adap;
470 	struct cudbg_buffer temp_buff = { 0 };
471 	int size, rc;
472 	u32 cfg = 0;
473 
474 	if (is_t6(padap->params.chip)) {
475 		size = padap->params.cim_la_size / 10 + 1;
476 		size *= 10 * sizeof(u32);
477 	} else {
478 		size = padap->params.cim_la_size / 8;
479 		size *= 8 * sizeof(u32);
480 	}
481 
482 	size += sizeof(cfg);
483 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
484 	if (rc)
485 		return rc;
486 
487 	rc = t4_cim_read(padap, UP_UP_DBG_LA_CFG_A, 1, &cfg);
488 	if (rc) {
489 		cudbg_err->sys_err = rc;
490 		cudbg_put_buff(pdbg_init, &temp_buff);
491 		return rc;
492 	}
493 
494 	memcpy((char *)temp_buff.data, &cfg, sizeof(cfg));
495 	rc = t4_cim_read_la(padap,
496 			    (u32 *)((char *)temp_buff.data + sizeof(cfg)),
497 			    NULL);
498 	if (rc < 0) {
499 		cudbg_err->sys_err = rc;
500 		cudbg_put_buff(pdbg_init, &temp_buff);
501 		return rc;
502 	}
503 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
504 }
505 
506 int cudbg_collect_cim_ma_la(struct cudbg_init *pdbg_init,
507 			    struct cudbg_buffer *dbg_buff,
508 			    struct cudbg_error *cudbg_err)
509 {
510 	struct adapter *padap = pdbg_init->adap;
511 	struct cudbg_buffer temp_buff = { 0 };
512 	int size, rc;
513 
514 	size = 2 * CIM_MALA_SIZE * 5 * sizeof(u32);
515 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
516 	if (rc)
517 		return rc;
518 
519 	t4_cim_read_ma_la(padap,
520 			  (u32 *)temp_buff.data,
521 			  (u32 *)((char *)temp_buff.data +
522 				  5 * CIM_MALA_SIZE));
523 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
524 }
525 
526 int cudbg_collect_cim_qcfg(struct cudbg_init *pdbg_init,
527 			   struct cudbg_buffer *dbg_buff,
528 			   struct cudbg_error *cudbg_err)
529 {
530 	struct adapter *padap = pdbg_init->adap;
531 	struct cudbg_buffer temp_buff = { 0 };
532 	struct cudbg_cim_qcfg *cim_qcfg_data;
533 	int rc;
534 
535 	rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_cim_qcfg),
536 			    &temp_buff);
537 	if (rc)
538 		return rc;
539 
540 	cim_qcfg_data = (struct cudbg_cim_qcfg *)temp_buff.data;
541 	cim_qcfg_data->chip = padap->params.chip;
542 	rc = t4_cim_read(padap, UP_IBQ_0_RDADDR_A,
543 			 ARRAY_SIZE(cim_qcfg_data->stat), cim_qcfg_data->stat);
544 	if (rc) {
545 		cudbg_err->sys_err = rc;
546 		cudbg_put_buff(pdbg_init, &temp_buff);
547 		return rc;
548 	}
549 
550 	rc = t4_cim_read(padap, UP_OBQ_0_REALADDR_A,
551 			 ARRAY_SIZE(cim_qcfg_data->obq_wr),
552 			 cim_qcfg_data->obq_wr);
553 	if (rc) {
554 		cudbg_err->sys_err = rc;
555 		cudbg_put_buff(pdbg_init, &temp_buff);
556 		return rc;
557 	}
558 
559 	t4_read_cimq_cfg(padap, cim_qcfg_data->base, cim_qcfg_data->size,
560 			 cim_qcfg_data->thres);
561 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
562 }
563 
564 static int cudbg_read_cim_ibq(struct cudbg_init *pdbg_init,
565 			      struct cudbg_buffer *dbg_buff,
566 			      struct cudbg_error *cudbg_err, int qid)
567 {
568 	struct adapter *padap = pdbg_init->adap;
569 	struct cudbg_buffer temp_buff = { 0 };
570 	int no_of_read_words, rc = 0;
571 	u32 qsize;
572 
573 	/* collect CIM IBQ */
574 	qsize = CIM_IBQ_SIZE * 4 * sizeof(u32);
575 	rc = cudbg_get_buff(pdbg_init, dbg_buff, qsize, &temp_buff);
576 	if (rc)
577 		return rc;
578 
579 	/* t4_read_cim_ibq will return no. of read words or error */
580 	no_of_read_words = t4_read_cim_ibq(padap, qid,
581 					   (u32 *)temp_buff.data, qsize);
582 	/* no_of_read_words is less than or equal to 0 means error */
583 	if (no_of_read_words <= 0) {
584 		if (!no_of_read_words)
585 			rc = CUDBG_SYSTEM_ERROR;
586 		else
587 			rc = no_of_read_words;
588 		cudbg_err->sys_err = rc;
589 		cudbg_put_buff(pdbg_init, &temp_buff);
590 		return rc;
591 	}
592 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
593 }
594 
595 int cudbg_collect_cim_ibq_tp0(struct cudbg_init *pdbg_init,
596 			      struct cudbg_buffer *dbg_buff,
597 			      struct cudbg_error *cudbg_err)
598 {
599 	return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 0);
600 }
601 
602 int cudbg_collect_cim_ibq_tp1(struct cudbg_init *pdbg_init,
603 			      struct cudbg_buffer *dbg_buff,
604 			      struct cudbg_error *cudbg_err)
605 {
606 	return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 1);
607 }
608 
609 int cudbg_collect_cim_ibq_ulp(struct cudbg_init *pdbg_init,
610 			      struct cudbg_buffer *dbg_buff,
611 			      struct cudbg_error *cudbg_err)
612 {
613 	return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 2);
614 }
615 
616 int cudbg_collect_cim_ibq_sge0(struct cudbg_init *pdbg_init,
617 			       struct cudbg_buffer *dbg_buff,
618 			       struct cudbg_error *cudbg_err)
619 {
620 	return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 3);
621 }
622 
623 int cudbg_collect_cim_ibq_sge1(struct cudbg_init *pdbg_init,
624 			       struct cudbg_buffer *dbg_buff,
625 			       struct cudbg_error *cudbg_err)
626 {
627 	return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 4);
628 }
629 
630 int cudbg_collect_cim_ibq_ncsi(struct cudbg_init *pdbg_init,
631 			       struct cudbg_buffer *dbg_buff,
632 			       struct cudbg_error *cudbg_err)
633 {
634 	return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 5);
635 }
636 
637 u32 cudbg_cim_obq_size(struct adapter *padap, int qid)
638 {
639 	u32 value;
640 
641 	t4_write_reg(padap, CIM_QUEUE_CONFIG_REF_A, OBQSELECT_F |
642 		     QUENUMSELECT_V(qid));
643 	value = t4_read_reg(padap, CIM_QUEUE_CONFIG_CTRL_A);
644 	value = CIMQSIZE_G(value) * 64; /* size in number of words */
645 	return value * sizeof(u32);
646 }
647 
648 static int cudbg_read_cim_obq(struct cudbg_init *pdbg_init,
649 			      struct cudbg_buffer *dbg_buff,
650 			      struct cudbg_error *cudbg_err, int qid)
651 {
652 	struct adapter *padap = pdbg_init->adap;
653 	struct cudbg_buffer temp_buff = { 0 };
654 	int no_of_read_words, rc = 0;
655 	u32 qsize;
656 
657 	/* collect CIM OBQ */
658 	qsize =  cudbg_cim_obq_size(padap, qid);
659 	rc = cudbg_get_buff(pdbg_init, dbg_buff, qsize, &temp_buff);
660 	if (rc)
661 		return rc;
662 
663 	/* t4_read_cim_obq will return no. of read words or error */
664 	no_of_read_words = t4_read_cim_obq(padap, qid,
665 					   (u32 *)temp_buff.data, qsize);
666 	/* no_of_read_words is less than or equal to 0 means error */
667 	if (no_of_read_words <= 0) {
668 		if (!no_of_read_words)
669 			rc = CUDBG_SYSTEM_ERROR;
670 		else
671 			rc = no_of_read_words;
672 		cudbg_err->sys_err = rc;
673 		cudbg_put_buff(pdbg_init, &temp_buff);
674 		return rc;
675 	}
676 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
677 }
678 
679 int cudbg_collect_cim_obq_ulp0(struct cudbg_init *pdbg_init,
680 			       struct cudbg_buffer *dbg_buff,
681 			       struct cudbg_error *cudbg_err)
682 {
683 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 0);
684 }
685 
686 int cudbg_collect_cim_obq_ulp1(struct cudbg_init *pdbg_init,
687 			       struct cudbg_buffer *dbg_buff,
688 			       struct cudbg_error *cudbg_err)
689 {
690 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 1);
691 }
692 
693 int cudbg_collect_cim_obq_ulp2(struct cudbg_init *pdbg_init,
694 			       struct cudbg_buffer *dbg_buff,
695 			       struct cudbg_error *cudbg_err)
696 {
697 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 2);
698 }
699 
700 int cudbg_collect_cim_obq_ulp3(struct cudbg_init *pdbg_init,
701 			       struct cudbg_buffer *dbg_buff,
702 			       struct cudbg_error *cudbg_err)
703 {
704 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 3);
705 }
706 
707 int cudbg_collect_cim_obq_sge(struct cudbg_init *pdbg_init,
708 			      struct cudbg_buffer *dbg_buff,
709 			      struct cudbg_error *cudbg_err)
710 {
711 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 4);
712 }
713 
714 int cudbg_collect_cim_obq_ncsi(struct cudbg_init *pdbg_init,
715 			       struct cudbg_buffer *dbg_buff,
716 			       struct cudbg_error *cudbg_err)
717 {
718 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 5);
719 }
720 
721 int cudbg_collect_obq_sge_rx_q0(struct cudbg_init *pdbg_init,
722 				struct cudbg_buffer *dbg_buff,
723 				struct cudbg_error *cudbg_err)
724 {
725 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 6);
726 }
727 
728 int cudbg_collect_obq_sge_rx_q1(struct cudbg_init *pdbg_init,
729 				struct cudbg_buffer *dbg_buff,
730 				struct cudbg_error *cudbg_err)
731 {
732 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 7);
733 }
734 
735 static int cudbg_meminfo_get_mem_index(struct adapter *padap,
736 				       struct cudbg_meminfo *mem_info,
737 				       u8 mem_type, u8 *idx)
738 {
739 	u8 i, flag;
740 
741 	switch (mem_type) {
742 	case MEM_EDC0:
743 		flag = EDC0_FLAG;
744 		break;
745 	case MEM_EDC1:
746 		flag = EDC1_FLAG;
747 		break;
748 	case MEM_MC0:
749 		/* Some T5 cards have both MC0 and MC1. */
750 		flag = is_t5(padap->params.chip) ? MC0_FLAG : MC_FLAG;
751 		break;
752 	case MEM_MC1:
753 		flag = MC1_FLAG;
754 		break;
755 	case MEM_HMA:
756 		flag = HMA_FLAG;
757 		break;
758 	default:
759 		return CUDBG_STATUS_ENTITY_NOT_FOUND;
760 	}
761 
762 	for (i = 0; i < mem_info->avail_c; i++) {
763 		if (mem_info->avail[i].idx == flag) {
764 			*idx = i;
765 			return 0;
766 		}
767 	}
768 
769 	return CUDBG_STATUS_ENTITY_NOT_FOUND;
770 }
771 
772 /* Fetch the @region_name's start and end from @meminfo. */
773 static int cudbg_get_mem_region(struct adapter *padap,
774 				struct cudbg_meminfo *meminfo,
775 				u8 mem_type, const char *region_name,
776 				struct cudbg_mem_desc *mem_desc)
777 {
778 	u8 mc, found = 0;
779 	u32 i, idx = 0;
780 	int rc;
781 
782 	rc = cudbg_meminfo_get_mem_index(padap, meminfo, mem_type, &mc);
783 	if (rc)
784 		return rc;
785 
786 	for (i = 0; i < ARRAY_SIZE(cudbg_region); i++) {
787 		if (!strcmp(cudbg_region[i], region_name)) {
788 			found = 1;
789 			idx = i;
790 			break;
791 		}
792 	}
793 	if (!found)
794 		return -EINVAL;
795 
796 	found = 0;
797 	for (i = 0; i < meminfo->mem_c; i++) {
798 		if (meminfo->mem[i].idx >= ARRAY_SIZE(cudbg_region))
799 			continue; /* Skip holes */
800 
801 		if (!(meminfo->mem[i].limit))
802 			meminfo->mem[i].limit =
803 				i < meminfo->mem_c - 1 ?
804 				meminfo->mem[i + 1].base - 1 : ~0;
805 
806 		if (meminfo->mem[i].idx == idx) {
807 			/* Check if the region exists in @mem_type memory */
808 			if (meminfo->mem[i].base < meminfo->avail[mc].base &&
809 			    meminfo->mem[i].limit < meminfo->avail[mc].base)
810 				return -EINVAL;
811 
812 			if (meminfo->mem[i].base > meminfo->avail[mc].limit)
813 				return -EINVAL;
814 
815 			memcpy(mem_desc, &meminfo->mem[i],
816 			       sizeof(struct cudbg_mem_desc));
817 			found = 1;
818 			break;
819 		}
820 	}
821 	if (!found)
822 		return -EINVAL;
823 
824 	return 0;
825 }
826 
827 /* Fetch and update the start and end of the requested memory region w.r.t 0
828  * in the corresponding EDC/MC/HMA.
829  */
830 static int cudbg_get_mem_relative(struct adapter *padap,
831 				  struct cudbg_meminfo *meminfo,
832 				  u8 mem_type, u32 *out_base, u32 *out_end)
833 {
834 	u8 mc_idx;
835 	int rc;
836 
837 	rc = cudbg_meminfo_get_mem_index(padap, meminfo, mem_type, &mc_idx);
838 	if (rc)
839 		return rc;
840 
841 	if (*out_base < meminfo->avail[mc_idx].base)
842 		*out_base = 0;
843 	else
844 		*out_base -= meminfo->avail[mc_idx].base;
845 
846 	if (*out_end > meminfo->avail[mc_idx].limit)
847 		*out_end = meminfo->avail[mc_idx].limit;
848 	else
849 		*out_end -= meminfo->avail[mc_idx].base;
850 
851 	return 0;
852 }
853 
854 /* Get TX and RX Payload region */
855 static int cudbg_get_payload_range(struct adapter *padap, u8 mem_type,
856 				   const char *region_name,
857 				   struct cudbg_region_info *payload)
858 {
859 	struct cudbg_mem_desc mem_desc = { 0 };
860 	struct cudbg_meminfo meminfo;
861 	int rc;
862 
863 	rc = cudbg_fill_meminfo(padap, &meminfo);
864 	if (rc)
865 		return rc;
866 
867 	rc = cudbg_get_mem_region(padap, &meminfo, mem_type, region_name,
868 				  &mem_desc);
869 	if (rc) {
870 		payload->exist = false;
871 		return 0;
872 	}
873 
874 	payload->exist = true;
875 	payload->start = mem_desc.base;
876 	payload->end = mem_desc.limit;
877 
878 	return cudbg_get_mem_relative(padap, &meminfo, mem_type,
879 				      &payload->start, &payload->end);
880 }
881 
882 static int cudbg_memory_read(struct cudbg_init *pdbg_init, int win,
883 			     int mtype, u32 addr, u32 len, void *hbuf)
884 {
885 	u32 win_pf, memoffset, mem_aperture, mem_base;
886 	struct adapter *adap = pdbg_init->adap;
887 	u32 pos, offset, resid;
888 	u32 *res_buf;
889 	u64 *buf;
890 	int ret;
891 
892 	/* Argument sanity checks ...
893 	 */
894 	if (addr & 0x3 || (uintptr_t)hbuf & 0x3)
895 		return -EINVAL;
896 
897 	buf = (u64 *)hbuf;
898 
899 	/* Try to do 64-bit reads.  Residual will be handled later. */
900 	resid = len & 0x7;
901 	len -= resid;
902 
903 	ret = t4_memory_rw_init(adap, win, mtype, &memoffset, &mem_base,
904 				&mem_aperture);
905 	if (ret)
906 		return ret;
907 
908 	addr = addr + memoffset;
909 	win_pf = is_t4(adap->params.chip) ? 0 : PFNUM_V(adap->pf);
910 
911 	pos = addr & ~(mem_aperture - 1);
912 	offset = addr - pos;
913 
914 	/* Set up initial PCI-E Memory Window to cover the start of our
915 	 * transfer.
916 	 */
917 	t4_memory_update_win(adap, win, pos | win_pf);
918 
919 	/* Transfer data from the adapter */
920 	while (len > 0) {
921 		*buf++ = le64_to_cpu((__force __le64)
922 				     t4_read_reg64(adap, mem_base + offset));
923 		offset += sizeof(u64);
924 		len -= sizeof(u64);
925 
926 		/* If we've reached the end of our current window aperture,
927 		 * move the PCI-E Memory Window on to the next.
928 		 */
929 		if (offset == mem_aperture) {
930 			pos += mem_aperture;
931 			offset = 0;
932 			t4_memory_update_win(adap, win, pos | win_pf);
933 		}
934 	}
935 
936 	res_buf = (u32 *)buf;
937 	/* Read residual in 32-bit multiples */
938 	while (resid > sizeof(u32)) {
939 		*res_buf++ = le32_to_cpu((__force __le32)
940 					 t4_read_reg(adap, mem_base + offset));
941 		offset += sizeof(u32);
942 		resid -= sizeof(u32);
943 
944 		/* If we've reached the end of our current window aperture,
945 		 * move the PCI-E Memory Window on to the next.
946 		 */
947 		if (offset == mem_aperture) {
948 			pos += mem_aperture;
949 			offset = 0;
950 			t4_memory_update_win(adap, win, pos | win_pf);
951 		}
952 	}
953 
954 	/* Transfer residual < 32-bits */
955 	if (resid)
956 		t4_memory_rw_residual(adap, resid, mem_base + offset,
957 				      (u8 *)res_buf, T4_MEMORY_READ);
958 
959 	return 0;
960 }
961 
962 #define CUDBG_YIELD_ITERATION 256
963 
964 static int cudbg_read_fw_mem(struct cudbg_init *pdbg_init,
965 			     struct cudbg_buffer *dbg_buff, u8 mem_type,
966 			     unsigned long tot_len,
967 			     struct cudbg_error *cudbg_err)
968 {
969 	static const char * const region_name[] = { "Tx payload:",
970 						    "Rx payload:" };
971 	unsigned long bytes, bytes_left, bytes_read = 0;
972 	struct adapter *padap = pdbg_init->adap;
973 	struct cudbg_buffer temp_buff = { 0 };
974 	struct cudbg_region_info payload[2];
975 	u32 yield_count = 0;
976 	int rc = 0;
977 	u8 i;
978 
979 	/* Get TX/RX Payload region range if they exist */
980 	memset(payload, 0, sizeof(payload));
981 	for (i = 0; i < ARRAY_SIZE(region_name); i++) {
982 		rc = cudbg_get_payload_range(padap, mem_type, region_name[i],
983 					     &payload[i]);
984 		if (rc)
985 			return rc;
986 
987 		if (payload[i].exist) {
988 			/* Align start and end to avoid wrap around */
989 			payload[i].start = roundup(payload[i].start,
990 						   CUDBG_CHUNK_SIZE);
991 			payload[i].end = rounddown(payload[i].end,
992 						   CUDBG_CHUNK_SIZE);
993 		}
994 	}
995 
996 	bytes_left = tot_len;
997 	while (bytes_left > 0) {
998 		/* As MC size is huge and read through PIO access, this
999 		 * loop will hold cpu for a longer time. OS may think that
1000 		 * the process is hanged and will generate CPU stall traces.
1001 		 * So yield the cpu regularly.
1002 		 */
1003 		yield_count++;
1004 		if (!(yield_count % CUDBG_YIELD_ITERATION))
1005 			schedule();
1006 
1007 		bytes = min_t(unsigned long, bytes_left,
1008 			      (unsigned long)CUDBG_CHUNK_SIZE);
1009 		rc = cudbg_get_buff(pdbg_init, dbg_buff, bytes, &temp_buff);
1010 		if (rc)
1011 			return rc;
1012 
1013 		for (i = 0; i < ARRAY_SIZE(payload); i++)
1014 			if (payload[i].exist &&
1015 			    bytes_read >= payload[i].start &&
1016 			    bytes_read + bytes <= payload[i].end)
1017 				/* TX and RX Payload regions can't overlap */
1018 				goto skip_read;
1019 
1020 		spin_lock(&padap->win0_lock);
1021 		rc = cudbg_memory_read(pdbg_init, MEMWIN_NIC, mem_type,
1022 				       bytes_read, bytes, temp_buff.data);
1023 		spin_unlock(&padap->win0_lock);
1024 		if (rc) {
1025 			cudbg_err->sys_err = rc;
1026 			cudbg_put_buff(pdbg_init, &temp_buff);
1027 			return rc;
1028 		}
1029 
1030 skip_read:
1031 		bytes_left -= bytes;
1032 		bytes_read += bytes;
1033 		rc = cudbg_write_and_release_buff(pdbg_init, &temp_buff,
1034 						  dbg_buff);
1035 		if (rc) {
1036 			cudbg_put_buff(pdbg_init, &temp_buff);
1037 			return rc;
1038 		}
1039 	}
1040 	return rc;
1041 }
1042 
1043 static void cudbg_t4_fwcache(struct cudbg_init *pdbg_init,
1044 			     struct cudbg_error *cudbg_err)
1045 {
1046 	struct adapter *padap = pdbg_init->adap;
1047 	int rc;
1048 
1049 	if (is_fw_attached(pdbg_init)) {
1050 		/* Flush uP dcache before reading edcX/mcX  */
1051 		rc = t4_fwcache(padap, FW_PARAM_DEV_FWCACHE_FLUSH);
1052 		if (rc)
1053 			cudbg_err->sys_warn = rc;
1054 	}
1055 }
1056 
1057 static int cudbg_collect_mem_region(struct cudbg_init *pdbg_init,
1058 				    struct cudbg_buffer *dbg_buff,
1059 				    struct cudbg_error *cudbg_err,
1060 				    u8 mem_type)
1061 {
1062 	struct adapter *padap = pdbg_init->adap;
1063 	struct cudbg_meminfo mem_info;
1064 	unsigned long size;
1065 	u8 mc_idx;
1066 	int rc;
1067 
1068 	memset(&mem_info, 0, sizeof(struct cudbg_meminfo));
1069 	rc = cudbg_fill_meminfo(padap, &mem_info);
1070 	if (rc)
1071 		return rc;
1072 
1073 	cudbg_t4_fwcache(pdbg_init, cudbg_err);
1074 	rc = cudbg_meminfo_get_mem_index(padap, &mem_info, mem_type, &mc_idx);
1075 	if (rc)
1076 		return rc;
1077 
1078 	size = mem_info.avail[mc_idx].limit - mem_info.avail[mc_idx].base;
1079 	return cudbg_read_fw_mem(pdbg_init, dbg_buff, mem_type, size,
1080 				 cudbg_err);
1081 }
1082 
1083 int cudbg_collect_edc0_meminfo(struct cudbg_init *pdbg_init,
1084 			       struct cudbg_buffer *dbg_buff,
1085 			       struct cudbg_error *cudbg_err)
1086 {
1087 	return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1088 					MEM_EDC0);
1089 }
1090 
1091 int cudbg_collect_edc1_meminfo(struct cudbg_init *pdbg_init,
1092 			       struct cudbg_buffer *dbg_buff,
1093 			       struct cudbg_error *cudbg_err)
1094 {
1095 	return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1096 					MEM_EDC1);
1097 }
1098 
1099 int cudbg_collect_mc0_meminfo(struct cudbg_init *pdbg_init,
1100 			      struct cudbg_buffer *dbg_buff,
1101 			      struct cudbg_error *cudbg_err)
1102 {
1103 	return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1104 					MEM_MC0);
1105 }
1106 
1107 int cudbg_collect_mc1_meminfo(struct cudbg_init *pdbg_init,
1108 			      struct cudbg_buffer *dbg_buff,
1109 			      struct cudbg_error *cudbg_err)
1110 {
1111 	return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1112 					MEM_MC1);
1113 }
1114 
1115 int cudbg_collect_hma_meminfo(struct cudbg_init *pdbg_init,
1116 			      struct cudbg_buffer *dbg_buff,
1117 			      struct cudbg_error *cudbg_err)
1118 {
1119 	return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1120 					MEM_HMA);
1121 }
1122 
1123 int cudbg_collect_rss(struct cudbg_init *pdbg_init,
1124 		      struct cudbg_buffer *dbg_buff,
1125 		      struct cudbg_error *cudbg_err)
1126 {
1127 	struct adapter *padap = pdbg_init->adap;
1128 	struct cudbg_buffer temp_buff = { 0 };
1129 	int rc, nentries;
1130 
1131 	nentries = t4_chip_rss_size(padap);
1132 	rc = cudbg_get_buff(pdbg_init, dbg_buff, nentries * sizeof(u16),
1133 			    &temp_buff);
1134 	if (rc)
1135 		return rc;
1136 
1137 	rc = t4_read_rss(padap, (u16 *)temp_buff.data);
1138 	if (rc) {
1139 		cudbg_err->sys_err = rc;
1140 		cudbg_put_buff(pdbg_init, &temp_buff);
1141 		return rc;
1142 	}
1143 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1144 }
1145 
1146 int cudbg_collect_rss_vf_config(struct cudbg_init *pdbg_init,
1147 				struct cudbg_buffer *dbg_buff,
1148 				struct cudbg_error *cudbg_err)
1149 {
1150 	struct adapter *padap = pdbg_init->adap;
1151 	struct cudbg_buffer temp_buff = { 0 };
1152 	struct cudbg_rss_vf_conf *vfconf;
1153 	int vf, rc, vf_count;
1154 
1155 	vf_count = padap->params.arch.vfcount;
1156 	rc = cudbg_get_buff(pdbg_init, dbg_buff,
1157 			    vf_count * sizeof(struct cudbg_rss_vf_conf),
1158 			    &temp_buff);
1159 	if (rc)
1160 		return rc;
1161 
1162 	vfconf = (struct cudbg_rss_vf_conf *)temp_buff.data;
1163 	for (vf = 0; vf < vf_count; vf++)
1164 		t4_read_rss_vf_config(padap, vf, &vfconf[vf].rss_vf_vfl,
1165 				      &vfconf[vf].rss_vf_vfh, true);
1166 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1167 }
1168 
1169 int cudbg_collect_path_mtu(struct cudbg_init *pdbg_init,
1170 			   struct cudbg_buffer *dbg_buff,
1171 			   struct cudbg_error *cudbg_err)
1172 {
1173 	struct adapter *padap = pdbg_init->adap;
1174 	struct cudbg_buffer temp_buff = { 0 };
1175 	int rc;
1176 
1177 	rc = cudbg_get_buff(pdbg_init, dbg_buff, NMTUS * sizeof(u16),
1178 			    &temp_buff);
1179 	if (rc)
1180 		return rc;
1181 
1182 	t4_read_mtu_tbl(padap, (u16 *)temp_buff.data, NULL);
1183 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1184 }
1185 
1186 int cudbg_collect_pm_stats(struct cudbg_init *pdbg_init,
1187 			   struct cudbg_buffer *dbg_buff,
1188 			   struct cudbg_error *cudbg_err)
1189 {
1190 	struct adapter *padap = pdbg_init->adap;
1191 	struct cudbg_buffer temp_buff = { 0 };
1192 	struct cudbg_pm_stats *pm_stats_buff;
1193 	int rc;
1194 
1195 	rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_pm_stats),
1196 			    &temp_buff);
1197 	if (rc)
1198 		return rc;
1199 
1200 	pm_stats_buff = (struct cudbg_pm_stats *)temp_buff.data;
1201 	t4_pmtx_get_stats(padap, pm_stats_buff->tx_cnt, pm_stats_buff->tx_cyc);
1202 	t4_pmrx_get_stats(padap, pm_stats_buff->rx_cnt, pm_stats_buff->rx_cyc);
1203 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1204 }
1205 
1206 int cudbg_collect_hw_sched(struct cudbg_init *pdbg_init,
1207 			   struct cudbg_buffer *dbg_buff,
1208 			   struct cudbg_error *cudbg_err)
1209 {
1210 	struct adapter *padap = pdbg_init->adap;
1211 	struct cudbg_buffer temp_buff = { 0 };
1212 	struct cudbg_hw_sched *hw_sched_buff;
1213 	int i, rc = 0;
1214 
1215 	if (!padap->params.vpd.cclk)
1216 		return CUDBG_STATUS_CCLK_NOT_DEFINED;
1217 
1218 	rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_hw_sched),
1219 			    &temp_buff);
1220 
1221 	if (rc)
1222 		return rc;
1223 
1224 	hw_sched_buff = (struct cudbg_hw_sched *)temp_buff.data;
1225 	hw_sched_buff->map = t4_read_reg(padap, TP_TX_MOD_QUEUE_REQ_MAP_A);
1226 	hw_sched_buff->mode = TIMERMODE_G(t4_read_reg(padap, TP_MOD_CONFIG_A));
1227 	t4_read_pace_tbl(padap, hw_sched_buff->pace_tab);
1228 	for (i = 0; i < NTX_SCHED; ++i)
1229 		t4_get_tx_sched(padap, i, &hw_sched_buff->kbps[i],
1230 				&hw_sched_buff->ipg[i], true);
1231 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1232 }
1233 
1234 int cudbg_collect_tp_indirect(struct cudbg_init *pdbg_init,
1235 			      struct cudbg_buffer *dbg_buff,
1236 			      struct cudbg_error *cudbg_err)
1237 {
1238 	struct adapter *padap = pdbg_init->adap;
1239 	struct cudbg_buffer temp_buff = { 0 };
1240 	struct ireg_buf *ch_tp_pio;
1241 	int i, rc, n = 0;
1242 	u32 size;
1243 
1244 	if (is_t5(padap->params.chip))
1245 		n = sizeof(t5_tp_pio_array) +
1246 		    sizeof(t5_tp_tm_pio_array) +
1247 		    sizeof(t5_tp_mib_index_array);
1248 	else
1249 		n = sizeof(t6_tp_pio_array) +
1250 		    sizeof(t6_tp_tm_pio_array) +
1251 		    sizeof(t6_tp_mib_index_array);
1252 
1253 	n = n / (IREG_NUM_ELEM * sizeof(u32));
1254 	size = sizeof(struct ireg_buf) * n;
1255 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1256 	if (rc)
1257 		return rc;
1258 
1259 	ch_tp_pio = (struct ireg_buf *)temp_buff.data;
1260 
1261 	/* TP_PIO */
1262 	if (is_t5(padap->params.chip))
1263 		n = sizeof(t5_tp_pio_array) / (IREG_NUM_ELEM * sizeof(u32));
1264 	else if (is_t6(padap->params.chip))
1265 		n = sizeof(t6_tp_pio_array) / (IREG_NUM_ELEM * sizeof(u32));
1266 
1267 	for (i = 0; i < n; i++) {
1268 		struct ireg_field *tp_pio = &ch_tp_pio->tp_pio;
1269 		u32 *buff = ch_tp_pio->outbuf;
1270 
1271 		if (is_t5(padap->params.chip)) {
1272 			tp_pio->ireg_addr = t5_tp_pio_array[i][0];
1273 			tp_pio->ireg_data = t5_tp_pio_array[i][1];
1274 			tp_pio->ireg_local_offset = t5_tp_pio_array[i][2];
1275 			tp_pio->ireg_offset_range = t5_tp_pio_array[i][3];
1276 		} else if (is_t6(padap->params.chip)) {
1277 			tp_pio->ireg_addr = t6_tp_pio_array[i][0];
1278 			tp_pio->ireg_data = t6_tp_pio_array[i][1];
1279 			tp_pio->ireg_local_offset = t6_tp_pio_array[i][2];
1280 			tp_pio->ireg_offset_range = t6_tp_pio_array[i][3];
1281 		}
1282 		t4_tp_pio_read(padap, buff, tp_pio->ireg_offset_range,
1283 			       tp_pio->ireg_local_offset, true);
1284 		ch_tp_pio++;
1285 	}
1286 
1287 	/* TP_TM_PIO */
1288 	if (is_t5(padap->params.chip))
1289 		n = sizeof(t5_tp_tm_pio_array) / (IREG_NUM_ELEM * sizeof(u32));
1290 	else if (is_t6(padap->params.chip))
1291 		n = sizeof(t6_tp_tm_pio_array) / (IREG_NUM_ELEM * sizeof(u32));
1292 
1293 	for (i = 0; i < n; i++) {
1294 		struct ireg_field *tp_pio = &ch_tp_pio->tp_pio;
1295 		u32 *buff = ch_tp_pio->outbuf;
1296 
1297 		if (is_t5(padap->params.chip)) {
1298 			tp_pio->ireg_addr = t5_tp_tm_pio_array[i][0];
1299 			tp_pio->ireg_data = t5_tp_tm_pio_array[i][1];
1300 			tp_pio->ireg_local_offset = t5_tp_tm_pio_array[i][2];
1301 			tp_pio->ireg_offset_range = t5_tp_tm_pio_array[i][3];
1302 		} else if (is_t6(padap->params.chip)) {
1303 			tp_pio->ireg_addr = t6_tp_tm_pio_array[i][0];
1304 			tp_pio->ireg_data = t6_tp_tm_pio_array[i][1];
1305 			tp_pio->ireg_local_offset = t6_tp_tm_pio_array[i][2];
1306 			tp_pio->ireg_offset_range = t6_tp_tm_pio_array[i][3];
1307 		}
1308 		t4_tp_tm_pio_read(padap, buff, tp_pio->ireg_offset_range,
1309 				  tp_pio->ireg_local_offset, true);
1310 		ch_tp_pio++;
1311 	}
1312 
1313 	/* TP_MIB_INDEX */
1314 	if (is_t5(padap->params.chip))
1315 		n = sizeof(t5_tp_mib_index_array) /
1316 		    (IREG_NUM_ELEM * sizeof(u32));
1317 	else if (is_t6(padap->params.chip))
1318 		n = sizeof(t6_tp_mib_index_array) /
1319 		    (IREG_NUM_ELEM * sizeof(u32));
1320 
1321 	for (i = 0; i < n ; i++) {
1322 		struct ireg_field *tp_pio = &ch_tp_pio->tp_pio;
1323 		u32 *buff = ch_tp_pio->outbuf;
1324 
1325 		if (is_t5(padap->params.chip)) {
1326 			tp_pio->ireg_addr = t5_tp_mib_index_array[i][0];
1327 			tp_pio->ireg_data = t5_tp_mib_index_array[i][1];
1328 			tp_pio->ireg_local_offset =
1329 				t5_tp_mib_index_array[i][2];
1330 			tp_pio->ireg_offset_range =
1331 				t5_tp_mib_index_array[i][3];
1332 		} else if (is_t6(padap->params.chip)) {
1333 			tp_pio->ireg_addr = t6_tp_mib_index_array[i][0];
1334 			tp_pio->ireg_data = t6_tp_mib_index_array[i][1];
1335 			tp_pio->ireg_local_offset =
1336 				t6_tp_mib_index_array[i][2];
1337 			tp_pio->ireg_offset_range =
1338 				t6_tp_mib_index_array[i][3];
1339 		}
1340 		t4_tp_mib_read(padap, buff, tp_pio->ireg_offset_range,
1341 			       tp_pio->ireg_local_offset, true);
1342 		ch_tp_pio++;
1343 	}
1344 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1345 }
1346 
1347 static void cudbg_read_sge_qbase_indirect_reg(struct adapter *padap,
1348 					      struct sge_qbase_reg_field *qbase,
1349 					      u32 func, bool is_pf)
1350 {
1351 	u32 *buff, i;
1352 
1353 	if (is_pf) {
1354 		buff = qbase->pf_data_value[func];
1355 	} else {
1356 		buff = qbase->vf_data_value[func];
1357 		/* In SGE_QBASE_INDEX,
1358 		 * Entries 0->7 are PF0->7, Entries 8->263 are VFID0->256.
1359 		 */
1360 		func += 8;
1361 	}
1362 
1363 	t4_write_reg(padap, qbase->reg_addr, func);
1364 	for (i = 0; i < SGE_QBASE_DATA_REG_NUM; i++, buff++)
1365 		*buff = t4_read_reg(padap, qbase->reg_data[i]);
1366 }
1367 
1368 int cudbg_collect_sge_indirect(struct cudbg_init *pdbg_init,
1369 			       struct cudbg_buffer *dbg_buff,
1370 			       struct cudbg_error *cudbg_err)
1371 {
1372 	struct adapter *padap = pdbg_init->adap;
1373 	struct cudbg_buffer temp_buff = { 0 };
1374 	struct sge_qbase_reg_field *sge_qbase;
1375 	struct ireg_buf *ch_sge_dbg;
1376 	int i, rc;
1377 
1378 	rc = cudbg_get_buff(pdbg_init, dbg_buff,
1379 			    sizeof(*ch_sge_dbg) * 2 + sizeof(*sge_qbase),
1380 			    &temp_buff);
1381 	if (rc)
1382 		return rc;
1383 
1384 	ch_sge_dbg = (struct ireg_buf *)temp_buff.data;
1385 	for (i = 0; i < 2; i++) {
1386 		struct ireg_field *sge_pio = &ch_sge_dbg->tp_pio;
1387 		u32 *buff = ch_sge_dbg->outbuf;
1388 
1389 		sge_pio->ireg_addr = t5_sge_dbg_index_array[i][0];
1390 		sge_pio->ireg_data = t5_sge_dbg_index_array[i][1];
1391 		sge_pio->ireg_local_offset = t5_sge_dbg_index_array[i][2];
1392 		sge_pio->ireg_offset_range = t5_sge_dbg_index_array[i][3];
1393 		t4_read_indirect(padap,
1394 				 sge_pio->ireg_addr,
1395 				 sge_pio->ireg_data,
1396 				 buff,
1397 				 sge_pio->ireg_offset_range,
1398 				 sge_pio->ireg_local_offset);
1399 		ch_sge_dbg++;
1400 	}
1401 
1402 	if (CHELSIO_CHIP_VERSION(padap->params.chip) > CHELSIO_T5) {
1403 		sge_qbase = (struct sge_qbase_reg_field *)ch_sge_dbg;
1404 		/* 1 addr reg SGE_QBASE_INDEX and 4 data reg
1405 		 * SGE_QBASE_MAP[0-3]
1406 		 */
1407 		sge_qbase->reg_addr = t6_sge_qbase_index_array[0];
1408 		for (i = 0; i < SGE_QBASE_DATA_REG_NUM; i++)
1409 			sge_qbase->reg_data[i] =
1410 				t6_sge_qbase_index_array[i + 1];
1411 
1412 		for (i = 0; i <= PCIE_FW_MASTER_M; i++)
1413 			cudbg_read_sge_qbase_indirect_reg(padap, sge_qbase,
1414 							  i, true);
1415 
1416 		for (i = 0; i < padap->params.arch.vfcount; i++)
1417 			cudbg_read_sge_qbase_indirect_reg(padap, sge_qbase,
1418 							  i, false);
1419 
1420 		sge_qbase->vfcount = padap->params.arch.vfcount;
1421 	}
1422 
1423 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1424 }
1425 
1426 int cudbg_collect_ulprx_la(struct cudbg_init *pdbg_init,
1427 			   struct cudbg_buffer *dbg_buff,
1428 			   struct cudbg_error *cudbg_err)
1429 {
1430 	struct adapter *padap = pdbg_init->adap;
1431 	struct cudbg_buffer temp_buff = { 0 };
1432 	struct cudbg_ulprx_la *ulprx_la_buff;
1433 	int rc;
1434 
1435 	rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_ulprx_la),
1436 			    &temp_buff);
1437 	if (rc)
1438 		return rc;
1439 
1440 	ulprx_la_buff = (struct cudbg_ulprx_la *)temp_buff.data;
1441 	t4_ulprx_read_la(padap, (u32 *)ulprx_la_buff->data);
1442 	ulprx_la_buff->size = ULPRX_LA_SIZE;
1443 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1444 }
1445 
1446 int cudbg_collect_tp_la(struct cudbg_init *pdbg_init,
1447 			struct cudbg_buffer *dbg_buff,
1448 			struct cudbg_error *cudbg_err)
1449 {
1450 	struct adapter *padap = pdbg_init->adap;
1451 	struct cudbg_buffer temp_buff = { 0 };
1452 	struct cudbg_tp_la *tp_la_buff;
1453 	int size, rc;
1454 
1455 	size = sizeof(struct cudbg_tp_la) + TPLA_SIZE *  sizeof(u64);
1456 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1457 	if (rc)
1458 		return rc;
1459 
1460 	tp_la_buff = (struct cudbg_tp_la *)temp_buff.data;
1461 	tp_la_buff->mode = DBGLAMODE_G(t4_read_reg(padap, TP_DBG_LA_CONFIG_A));
1462 	t4_tp_read_la(padap, (u64 *)tp_la_buff->data, NULL);
1463 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1464 }
1465 
1466 int cudbg_collect_meminfo(struct cudbg_init *pdbg_init,
1467 			  struct cudbg_buffer *dbg_buff,
1468 			  struct cudbg_error *cudbg_err)
1469 {
1470 	struct adapter *padap = pdbg_init->adap;
1471 	struct cudbg_buffer temp_buff = { 0 };
1472 	struct cudbg_meminfo *meminfo_buff;
1473 	struct cudbg_ver_hdr *ver_hdr;
1474 	int rc;
1475 
1476 	rc = cudbg_get_buff(pdbg_init, dbg_buff,
1477 			    sizeof(struct cudbg_ver_hdr) +
1478 			    sizeof(struct cudbg_meminfo),
1479 			    &temp_buff);
1480 	if (rc)
1481 		return rc;
1482 
1483 	ver_hdr = (struct cudbg_ver_hdr *)temp_buff.data;
1484 	ver_hdr->signature = CUDBG_ENTITY_SIGNATURE;
1485 	ver_hdr->revision = CUDBG_MEMINFO_REV;
1486 	ver_hdr->size = sizeof(struct cudbg_meminfo);
1487 
1488 	meminfo_buff = (struct cudbg_meminfo *)(temp_buff.data +
1489 						sizeof(*ver_hdr));
1490 	rc = cudbg_fill_meminfo(padap, meminfo_buff);
1491 	if (rc) {
1492 		cudbg_err->sys_err = rc;
1493 		cudbg_put_buff(pdbg_init, &temp_buff);
1494 		return rc;
1495 	}
1496 
1497 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1498 }
1499 
1500 int cudbg_collect_cim_pif_la(struct cudbg_init *pdbg_init,
1501 			     struct cudbg_buffer *dbg_buff,
1502 			     struct cudbg_error *cudbg_err)
1503 {
1504 	struct cudbg_cim_pif_la *cim_pif_la_buff;
1505 	struct adapter *padap = pdbg_init->adap;
1506 	struct cudbg_buffer temp_buff = { 0 };
1507 	int size, rc;
1508 
1509 	size = sizeof(struct cudbg_cim_pif_la) +
1510 	       2 * CIM_PIFLA_SIZE * 6 * sizeof(u32);
1511 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1512 	if (rc)
1513 		return rc;
1514 
1515 	cim_pif_la_buff = (struct cudbg_cim_pif_la *)temp_buff.data;
1516 	cim_pif_la_buff->size = CIM_PIFLA_SIZE;
1517 	t4_cim_read_pif_la(padap, (u32 *)cim_pif_la_buff->data,
1518 			   (u32 *)cim_pif_la_buff->data + 6 * CIM_PIFLA_SIZE,
1519 			   NULL, NULL);
1520 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1521 }
1522 
1523 int cudbg_collect_clk_info(struct cudbg_init *pdbg_init,
1524 			   struct cudbg_buffer *dbg_buff,
1525 			   struct cudbg_error *cudbg_err)
1526 {
1527 	struct adapter *padap = pdbg_init->adap;
1528 	struct cudbg_buffer temp_buff = { 0 };
1529 	struct cudbg_clk_info *clk_info_buff;
1530 	u64 tp_tick_us;
1531 	int rc;
1532 
1533 	if (!padap->params.vpd.cclk)
1534 		return CUDBG_STATUS_CCLK_NOT_DEFINED;
1535 
1536 	rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_clk_info),
1537 			    &temp_buff);
1538 	if (rc)
1539 		return rc;
1540 
1541 	clk_info_buff = (struct cudbg_clk_info *)temp_buff.data;
1542 	clk_info_buff->cclk_ps = 1000000000 / padap->params.vpd.cclk; /* psec */
1543 	clk_info_buff->res = t4_read_reg(padap, TP_TIMER_RESOLUTION_A);
1544 	clk_info_buff->tre = TIMERRESOLUTION_G(clk_info_buff->res);
1545 	clk_info_buff->dack_re = DELAYEDACKRESOLUTION_G(clk_info_buff->res);
1546 	tp_tick_us = (clk_info_buff->cclk_ps << clk_info_buff->tre) / 1000000;
1547 
1548 	clk_info_buff->dack_timer =
1549 		(clk_info_buff->cclk_ps << clk_info_buff->dack_re) / 1000000 *
1550 		t4_read_reg(padap, TP_DACK_TIMER_A);
1551 	clk_info_buff->retransmit_min =
1552 		tp_tick_us * t4_read_reg(padap, TP_RXT_MIN_A);
1553 	clk_info_buff->retransmit_max =
1554 		tp_tick_us * t4_read_reg(padap, TP_RXT_MAX_A);
1555 	clk_info_buff->persist_timer_min =
1556 		tp_tick_us * t4_read_reg(padap, TP_PERS_MIN_A);
1557 	clk_info_buff->persist_timer_max =
1558 		tp_tick_us * t4_read_reg(padap, TP_PERS_MAX_A);
1559 	clk_info_buff->keepalive_idle_timer =
1560 		tp_tick_us * t4_read_reg(padap, TP_KEEP_IDLE_A);
1561 	clk_info_buff->keepalive_interval =
1562 		tp_tick_us * t4_read_reg(padap, TP_KEEP_INTVL_A);
1563 	clk_info_buff->initial_srtt =
1564 		tp_tick_us * INITSRTT_G(t4_read_reg(padap, TP_INIT_SRTT_A));
1565 	clk_info_buff->finwait2_timer =
1566 		tp_tick_us * t4_read_reg(padap, TP_FINWAIT2_TIMER_A);
1567 
1568 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1569 }
1570 
1571 int cudbg_collect_pcie_indirect(struct cudbg_init *pdbg_init,
1572 				struct cudbg_buffer *dbg_buff,
1573 				struct cudbg_error *cudbg_err)
1574 {
1575 	struct adapter *padap = pdbg_init->adap;
1576 	struct cudbg_buffer temp_buff = { 0 };
1577 	struct ireg_buf *ch_pcie;
1578 	int i, rc, n;
1579 	u32 size;
1580 
1581 	n = sizeof(t5_pcie_pdbg_array) / (IREG_NUM_ELEM * sizeof(u32));
1582 	size = sizeof(struct ireg_buf) * n * 2;
1583 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1584 	if (rc)
1585 		return rc;
1586 
1587 	ch_pcie = (struct ireg_buf *)temp_buff.data;
1588 	/* PCIE_PDBG */
1589 	for (i = 0; i < n; i++) {
1590 		struct ireg_field *pcie_pio = &ch_pcie->tp_pio;
1591 		u32 *buff = ch_pcie->outbuf;
1592 
1593 		pcie_pio->ireg_addr = t5_pcie_pdbg_array[i][0];
1594 		pcie_pio->ireg_data = t5_pcie_pdbg_array[i][1];
1595 		pcie_pio->ireg_local_offset = t5_pcie_pdbg_array[i][2];
1596 		pcie_pio->ireg_offset_range = t5_pcie_pdbg_array[i][3];
1597 		t4_read_indirect(padap,
1598 				 pcie_pio->ireg_addr,
1599 				 pcie_pio->ireg_data,
1600 				 buff,
1601 				 pcie_pio->ireg_offset_range,
1602 				 pcie_pio->ireg_local_offset);
1603 		ch_pcie++;
1604 	}
1605 
1606 	/* PCIE_CDBG */
1607 	n = sizeof(t5_pcie_cdbg_array) / (IREG_NUM_ELEM * sizeof(u32));
1608 	for (i = 0; i < n; i++) {
1609 		struct ireg_field *pcie_pio = &ch_pcie->tp_pio;
1610 		u32 *buff = ch_pcie->outbuf;
1611 
1612 		pcie_pio->ireg_addr = t5_pcie_cdbg_array[i][0];
1613 		pcie_pio->ireg_data = t5_pcie_cdbg_array[i][1];
1614 		pcie_pio->ireg_local_offset = t5_pcie_cdbg_array[i][2];
1615 		pcie_pio->ireg_offset_range = t5_pcie_cdbg_array[i][3];
1616 		t4_read_indirect(padap,
1617 				 pcie_pio->ireg_addr,
1618 				 pcie_pio->ireg_data,
1619 				 buff,
1620 				 pcie_pio->ireg_offset_range,
1621 				 pcie_pio->ireg_local_offset);
1622 		ch_pcie++;
1623 	}
1624 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1625 }
1626 
1627 int cudbg_collect_pm_indirect(struct cudbg_init *pdbg_init,
1628 			      struct cudbg_buffer *dbg_buff,
1629 			      struct cudbg_error *cudbg_err)
1630 {
1631 	struct adapter *padap = pdbg_init->adap;
1632 	struct cudbg_buffer temp_buff = { 0 };
1633 	struct ireg_buf *ch_pm;
1634 	int i, rc, n;
1635 	u32 size;
1636 
1637 	n = sizeof(t5_pm_rx_array) / (IREG_NUM_ELEM * sizeof(u32));
1638 	size = sizeof(struct ireg_buf) * n * 2;
1639 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1640 	if (rc)
1641 		return rc;
1642 
1643 	ch_pm = (struct ireg_buf *)temp_buff.data;
1644 	/* PM_RX */
1645 	for (i = 0; i < n; i++) {
1646 		struct ireg_field *pm_pio = &ch_pm->tp_pio;
1647 		u32 *buff = ch_pm->outbuf;
1648 
1649 		pm_pio->ireg_addr = t5_pm_rx_array[i][0];
1650 		pm_pio->ireg_data = t5_pm_rx_array[i][1];
1651 		pm_pio->ireg_local_offset = t5_pm_rx_array[i][2];
1652 		pm_pio->ireg_offset_range = t5_pm_rx_array[i][3];
1653 		t4_read_indirect(padap,
1654 				 pm_pio->ireg_addr,
1655 				 pm_pio->ireg_data,
1656 				 buff,
1657 				 pm_pio->ireg_offset_range,
1658 				 pm_pio->ireg_local_offset);
1659 		ch_pm++;
1660 	}
1661 
1662 	/* PM_TX */
1663 	n = sizeof(t5_pm_tx_array) / (IREG_NUM_ELEM * sizeof(u32));
1664 	for (i = 0; i < n; i++) {
1665 		struct ireg_field *pm_pio = &ch_pm->tp_pio;
1666 		u32 *buff = ch_pm->outbuf;
1667 
1668 		pm_pio->ireg_addr = t5_pm_tx_array[i][0];
1669 		pm_pio->ireg_data = t5_pm_tx_array[i][1];
1670 		pm_pio->ireg_local_offset = t5_pm_tx_array[i][2];
1671 		pm_pio->ireg_offset_range = t5_pm_tx_array[i][3];
1672 		t4_read_indirect(padap,
1673 				 pm_pio->ireg_addr,
1674 				 pm_pio->ireg_data,
1675 				 buff,
1676 				 pm_pio->ireg_offset_range,
1677 				 pm_pio->ireg_local_offset);
1678 		ch_pm++;
1679 	}
1680 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1681 }
1682 
1683 int cudbg_collect_tid(struct cudbg_init *pdbg_init,
1684 		      struct cudbg_buffer *dbg_buff,
1685 		      struct cudbg_error *cudbg_err)
1686 {
1687 	struct adapter *padap = pdbg_init->adap;
1688 	struct cudbg_tid_info_region_rev1 *tid1;
1689 	struct cudbg_buffer temp_buff = { 0 };
1690 	struct cudbg_tid_info_region *tid;
1691 	u32 para[2], val[2];
1692 	int rc;
1693 
1694 	rc = cudbg_get_buff(pdbg_init, dbg_buff,
1695 			    sizeof(struct cudbg_tid_info_region_rev1),
1696 			    &temp_buff);
1697 	if (rc)
1698 		return rc;
1699 
1700 	tid1 = (struct cudbg_tid_info_region_rev1 *)temp_buff.data;
1701 	tid = &tid1->tid;
1702 	tid1->ver_hdr.signature = CUDBG_ENTITY_SIGNATURE;
1703 	tid1->ver_hdr.revision = CUDBG_TID_INFO_REV;
1704 	tid1->ver_hdr.size = sizeof(struct cudbg_tid_info_region_rev1) -
1705 			     sizeof(struct cudbg_ver_hdr);
1706 
1707 	/* If firmware is not attached/alive, use backdoor register
1708 	 * access to collect dump.
1709 	 */
1710 	if (!is_fw_attached(pdbg_init))
1711 		goto fill_tid;
1712 
1713 #define FW_PARAM_PFVF_A(param) \
1714 	(FW_PARAMS_MNEM_V(FW_PARAMS_MNEM_PFVF) | \
1715 	 FW_PARAMS_PARAM_X_V(FW_PARAMS_PARAM_PFVF_##param) | \
1716 	 FW_PARAMS_PARAM_Y_V(0) | \
1717 	 FW_PARAMS_PARAM_Z_V(0))
1718 
1719 	para[0] = FW_PARAM_PFVF_A(ETHOFLD_START);
1720 	para[1] = FW_PARAM_PFVF_A(ETHOFLD_END);
1721 	rc = t4_query_params(padap, padap->mbox, padap->pf, 0, 2, para, val);
1722 	if (rc <  0) {
1723 		cudbg_err->sys_err = rc;
1724 		cudbg_put_buff(pdbg_init, &temp_buff);
1725 		return rc;
1726 	}
1727 	tid->uotid_base = val[0];
1728 	tid->nuotids = val[1] - val[0] + 1;
1729 
1730 	if (is_t5(padap->params.chip)) {
1731 		tid->sb = t4_read_reg(padap, LE_DB_SERVER_INDEX_A) / 4;
1732 	} else if (is_t6(padap->params.chip)) {
1733 		tid1->tid_start =
1734 			t4_read_reg(padap, LE_DB_ACTIVE_TABLE_START_INDEX_A);
1735 		tid->sb = t4_read_reg(padap, LE_DB_SRVR_START_INDEX_A);
1736 
1737 		para[0] = FW_PARAM_PFVF_A(HPFILTER_START);
1738 		para[1] = FW_PARAM_PFVF_A(HPFILTER_END);
1739 		rc = t4_query_params(padap, padap->mbox, padap->pf, 0, 2,
1740 				     para, val);
1741 		if (rc < 0) {
1742 			cudbg_err->sys_err = rc;
1743 			cudbg_put_buff(pdbg_init, &temp_buff);
1744 			return rc;
1745 		}
1746 		tid->hpftid_base = val[0];
1747 		tid->nhpftids = val[1] - val[0] + 1;
1748 	}
1749 
1750 #undef FW_PARAM_PFVF_A
1751 
1752 fill_tid:
1753 	tid->ntids = padap->tids.ntids;
1754 	tid->nstids = padap->tids.nstids;
1755 	tid->stid_base = padap->tids.stid_base;
1756 	tid->hash_base = padap->tids.hash_base;
1757 
1758 	tid->natids = padap->tids.natids;
1759 	tid->nftids = padap->tids.nftids;
1760 	tid->ftid_base = padap->tids.ftid_base;
1761 	tid->aftid_base = padap->tids.aftid_base;
1762 	tid->aftid_end = padap->tids.aftid_end;
1763 
1764 	tid->sftid_base = padap->tids.sftid_base;
1765 	tid->nsftids = padap->tids.nsftids;
1766 
1767 	tid->flags = padap->flags;
1768 	tid->le_db_conf = t4_read_reg(padap, LE_DB_CONFIG_A);
1769 	tid->ip_users = t4_read_reg(padap, LE_DB_ACT_CNT_IPV4_A);
1770 	tid->ipv6_users = t4_read_reg(padap, LE_DB_ACT_CNT_IPV6_A);
1771 
1772 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1773 }
1774 
1775 int cudbg_collect_pcie_config(struct cudbg_init *pdbg_init,
1776 			      struct cudbg_buffer *dbg_buff,
1777 			      struct cudbg_error *cudbg_err)
1778 {
1779 	struct adapter *padap = pdbg_init->adap;
1780 	struct cudbg_buffer temp_buff = { 0 };
1781 	u32 size, *value, j;
1782 	int i, rc, n;
1783 
1784 	size = sizeof(u32) * CUDBG_NUM_PCIE_CONFIG_REGS;
1785 	n = sizeof(t5_pcie_config_array) / (2 * sizeof(u32));
1786 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1787 	if (rc)
1788 		return rc;
1789 
1790 	value = (u32 *)temp_buff.data;
1791 	for (i = 0; i < n; i++) {
1792 		for (j = t5_pcie_config_array[i][0];
1793 		     j <= t5_pcie_config_array[i][1]; j += 4) {
1794 			t4_hw_pci_read_cfg4(padap, j, value);
1795 			value++;
1796 		}
1797 	}
1798 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1799 }
1800 
1801 static int cudbg_sge_ctxt_check_valid(u32 *buf, int type)
1802 {
1803 	int index, bit, bit_pos = 0;
1804 
1805 	switch (type) {
1806 	case CTXT_EGRESS:
1807 		bit_pos = 176;
1808 		break;
1809 	case CTXT_INGRESS:
1810 		bit_pos = 141;
1811 		break;
1812 	case CTXT_FLM:
1813 		bit_pos = 89;
1814 		break;
1815 	}
1816 	index = bit_pos / 32;
1817 	bit =  bit_pos % 32;
1818 	return buf[index] & (1U << bit);
1819 }
1820 
1821 static int cudbg_get_ctxt_region_info(struct adapter *padap,
1822 				      struct cudbg_region_info *ctx_info,
1823 				      u8 *mem_type)
1824 {
1825 	struct cudbg_mem_desc mem_desc;
1826 	struct cudbg_meminfo meminfo;
1827 	u32 i, j, value, found;
1828 	u8 flq;
1829 	int rc;
1830 
1831 	rc = cudbg_fill_meminfo(padap, &meminfo);
1832 	if (rc)
1833 		return rc;
1834 
1835 	/* Get EGRESS and INGRESS context region size */
1836 	for (i = CTXT_EGRESS; i <= CTXT_INGRESS; i++) {
1837 		found = 0;
1838 		memset(&mem_desc, 0, sizeof(struct cudbg_mem_desc));
1839 		for (j = 0; j < ARRAY_SIZE(meminfo.avail); j++) {
1840 			rc = cudbg_get_mem_region(padap, &meminfo, j,
1841 						  cudbg_region[i],
1842 						  &mem_desc);
1843 			if (!rc) {
1844 				found = 1;
1845 				rc = cudbg_get_mem_relative(padap, &meminfo, j,
1846 							    &mem_desc.base,
1847 							    &mem_desc.limit);
1848 				if (rc) {
1849 					ctx_info[i].exist = false;
1850 					break;
1851 				}
1852 				ctx_info[i].exist = true;
1853 				ctx_info[i].start = mem_desc.base;
1854 				ctx_info[i].end = mem_desc.limit;
1855 				mem_type[i] = j;
1856 				break;
1857 			}
1858 		}
1859 		if (!found)
1860 			ctx_info[i].exist = false;
1861 	}
1862 
1863 	/* Get FLM and CNM max qid. */
1864 	value = t4_read_reg(padap, SGE_FLM_CFG_A);
1865 
1866 	/* Get number of data freelist queues */
1867 	flq = HDRSTARTFLQ_G(value);
1868 	ctx_info[CTXT_FLM].exist = true;
1869 	ctx_info[CTXT_FLM].end = (CUDBG_MAX_FL_QIDS >> flq) * SGE_CTXT_SIZE;
1870 
1871 	/* The number of CONM contexts are same as number of freelist
1872 	 * queues.
1873 	 */
1874 	ctx_info[CTXT_CNM].exist = true;
1875 	ctx_info[CTXT_CNM].end = ctx_info[CTXT_FLM].end;
1876 
1877 	return 0;
1878 }
1879 
1880 int cudbg_dump_context_size(struct adapter *padap)
1881 {
1882 	struct cudbg_region_info region_info[CTXT_CNM + 1] = { {0} };
1883 	u8 mem_type[CTXT_INGRESS + 1] = { 0 };
1884 	u32 i, size = 0;
1885 	int rc;
1886 
1887 	/* Get max valid qid for each type of queue */
1888 	rc = cudbg_get_ctxt_region_info(padap, region_info, mem_type);
1889 	if (rc)
1890 		return rc;
1891 
1892 	for (i = 0; i < CTXT_CNM; i++) {
1893 		if (!region_info[i].exist) {
1894 			if (i == CTXT_EGRESS || i == CTXT_INGRESS)
1895 				size += CUDBG_LOWMEM_MAX_CTXT_QIDS *
1896 					SGE_CTXT_SIZE;
1897 			continue;
1898 		}
1899 
1900 		size += (region_info[i].end - region_info[i].start + 1) /
1901 			SGE_CTXT_SIZE;
1902 	}
1903 	return size * sizeof(struct cudbg_ch_cntxt);
1904 }
1905 
1906 static void cudbg_read_sge_ctxt(struct cudbg_init *pdbg_init, u32 cid,
1907 				enum ctxt_type ctype, u32 *data)
1908 {
1909 	struct adapter *padap = pdbg_init->adap;
1910 	int rc = -1;
1911 
1912 	/* Under heavy traffic, the SGE Queue contexts registers will be
1913 	 * frequently accessed by firmware.
1914 	 *
1915 	 * To avoid conflicts with firmware, always ask firmware to fetch
1916 	 * the SGE Queue contexts via mailbox. On failure, fallback to
1917 	 * accessing hardware registers directly.
1918 	 */
1919 	if (is_fw_attached(pdbg_init))
1920 		rc = t4_sge_ctxt_rd(padap, padap->mbox, cid, ctype, data);
1921 	if (rc)
1922 		t4_sge_ctxt_rd_bd(padap, cid, ctype, data);
1923 }
1924 
1925 static void cudbg_get_sge_ctxt_fw(struct cudbg_init *pdbg_init, u32 max_qid,
1926 				  u8 ctxt_type,
1927 				  struct cudbg_ch_cntxt **out_buff)
1928 {
1929 	struct cudbg_ch_cntxt *buff = *out_buff;
1930 	int rc;
1931 	u32 j;
1932 
1933 	for (j = 0; j < max_qid; j++) {
1934 		cudbg_read_sge_ctxt(pdbg_init, j, ctxt_type, buff->data);
1935 		rc = cudbg_sge_ctxt_check_valid(buff->data, ctxt_type);
1936 		if (!rc)
1937 			continue;
1938 
1939 		buff->cntxt_type = ctxt_type;
1940 		buff->cntxt_id = j;
1941 		buff++;
1942 		if (ctxt_type == CTXT_FLM) {
1943 			cudbg_read_sge_ctxt(pdbg_init, j, CTXT_CNM, buff->data);
1944 			buff->cntxt_type = CTXT_CNM;
1945 			buff->cntxt_id = j;
1946 			buff++;
1947 		}
1948 	}
1949 
1950 	*out_buff = buff;
1951 }
1952 
1953 int cudbg_collect_dump_context(struct cudbg_init *pdbg_init,
1954 			       struct cudbg_buffer *dbg_buff,
1955 			       struct cudbg_error *cudbg_err)
1956 {
1957 	struct cudbg_region_info region_info[CTXT_CNM + 1] = { {0} };
1958 	struct adapter *padap = pdbg_init->adap;
1959 	u32 j, size, max_ctx_size, max_ctx_qid;
1960 	u8 mem_type[CTXT_INGRESS + 1] = { 0 };
1961 	struct cudbg_buffer temp_buff = { 0 };
1962 	struct cudbg_ch_cntxt *buff;
1963 	u64 *dst_off, *src_off;
1964 	u8 *ctx_buf;
1965 	u8 i, k;
1966 	int rc;
1967 
1968 	/* Get max valid qid for each type of queue */
1969 	rc = cudbg_get_ctxt_region_info(padap, region_info, mem_type);
1970 	if (rc)
1971 		return rc;
1972 
1973 	rc = cudbg_dump_context_size(padap);
1974 	if (rc <= 0)
1975 		return CUDBG_STATUS_ENTITY_NOT_FOUND;
1976 
1977 	size = rc;
1978 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1979 	if (rc)
1980 		return rc;
1981 
1982 	/* Get buffer with enough space to read the biggest context
1983 	 * region in memory.
1984 	 */
1985 	max_ctx_size = max(region_info[CTXT_EGRESS].end -
1986 			   region_info[CTXT_EGRESS].start + 1,
1987 			   region_info[CTXT_INGRESS].end -
1988 			   region_info[CTXT_INGRESS].start + 1);
1989 
1990 	ctx_buf = kvzalloc(max_ctx_size, GFP_KERNEL);
1991 	if (!ctx_buf) {
1992 		cudbg_put_buff(pdbg_init, &temp_buff);
1993 		return -ENOMEM;
1994 	}
1995 
1996 	buff = (struct cudbg_ch_cntxt *)temp_buff.data;
1997 
1998 	/* Collect EGRESS and INGRESS context data.
1999 	 * In case of failures, fallback to collecting via FW or
2000 	 * backdoor access.
2001 	 */
2002 	for (i = CTXT_EGRESS; i <= CTXT_INGRESS; i++) {
2003 		if (!region_info[i].exist) {
2004 			max_ctx_qid = CUDBG_LOWMEM_MAX_CTXT_QIDS;
2005 			cudbg_get_sge_ctxt_fw(pdbg_init, max_ctx_qid, i,
2006 					      &buff);
2007 			continue;
2008 		}
2009 
2010 		max_ctx_size = region_info[i].end - region_info[i].start + 1;
2011 		max_ctx_qid = max_ctx_size / SGE_CTXT_SIZE;
2012 
2013 		/* If firmware is not attached/alive, use backdoor register
2014 		 * access to collect dump.
2015 		 */
2016 		if (is_fw_attached(pdbg_init)) {
2017 			t4_sge_ctxt_flush(padap, padap->mbox, i);
2018 
2019 			rc = t4_memory_rw(padap, MEMWIN_NIC, mem_type[i],
2020 					  region_info[i].start, max_ctx_size,
2021 					  (__be32 *)ctx_buf, 1);
2022 		}
2023 
2024 		if (rc || !is_fw_attached(pdbg_init)) {
2025 			max_ctx_qid = CUDBG_LOWMEM_MAX_CTXT_QIDS;
2026 			cudbg_get_sge_ctxt_fw(pdbg_init, max_ctx_qid, i,
2027 					      &buff);
2028 			continue;
2029 		}
2030 
2031 		for (j = 0; j < max_ctx_qid; j++) {
2032 			src_off = (u64 *)(ctx_buf + j * SGE_CTXT_SIZE);
2033 			dst_off = (u64 *)buff->data;
2034 
2035 			/* The data is stored in 64-bit cpu order.  Convert it
2036 			 * to big endian before parsing.
2037 			 */
2038 			for (k = 0; k < SGE_CTXT_SIZE / sizeof(u64); k++)
2039 				dst_off[k] = cpu_to_be64(src_off[k]);
2040 
2041 			rc = cudbg_sge_ctxt_check_valid(buff->data, i);
2042 			if (!rc)
2043 				continue;
2044 
2045 			buff->cntxt_type = i;
2046 			buff->cntxt_id = j;
2047 			buff++;
2048 		}
2049 	}
2050 
2051 	kvfree(ctx_buf);
2052 
2053 	/* Collect FREELIST and CONGESTION MANAGER contexts */
2054 	max_ctx_size = region_info[CTXT_FLM].end -
2055 		       region_info[CTXT_FLM].start + 1;
2056 	max_ctx_qid = max_ctx_size / SGE_CTXT_SIZE;
2057 	/* Since FLM and CONM are 1-to-1 mapped, the below function
2058 	 * will fetch both FLM and CONM contexts.
2059 	 */
2060 	cudbg_get_sge_ctxt_fw(pdbg_init, max_ctx_qid, CTXT_FLM, &buff);
2061 
2062 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2063 }
2064 
2065 static inline void cudbg_tcamxy2valmask(u64 x, u64 y, u8 *addr, u64 *mask)
2066 {
2067 	*mask = x | y;
2068 	y = (__force u64)cpu_to_be64(y);
2069 	memcpy(addr, (char *)&y + 2, ETH_ALEN);
2070 }
2071 
2072 static void cudbg_mps_rpl_backdoor(struct adapter *padap,
2073 				   struct fw_ldst_mps_rplc *mps_rplc)
2074 {
2075 	if (is_t5(padap->params.chip)) {
2076 		mps_rplc->rplc255_224 = htonl(t4_read_reg(padap,
2077 							  MPS_VF_RPLCT_MAP3_A));
2078 		mps_rplc->rplc223_192 = htonl(t4_read_reg(padap,
2079 							  MPS_VF_RPLCT_MAP2_A));
2080 		mps_rplc->rplc191_160 = htonl(t4_read_reg(padap,
2081 							  MPS_VF_RPLCT_MAP1_A));
2082 		mps_rplc->rplc159_128 = htonl(t4_read_reg(padap,
2083 							  MPS_VF_RPLCT_MAP0_A));
2084 	} else {
2085 		mps_rplc->rplc255_224 = htonl(t4_read_reg(padap,
2086 							  MPS_VF_RPLCT_MAP7_A));
2087 		mps_rplc->rplc223_192 = htonl(t4_read_reg(padap,
2088 							  MPS_VF_RPLCT_MAP6_A));
2089 		mps_rplc->rplc191_160 = htonl(t4_read_reg(padap,
2090 							  MPS_VF_RPLCT_MAP5_A));
2091 		mps_rplc->rplc159_128 = htonl(t4_read_reg(padap,
2092 							  MPS_VF_RPLCT_MAP4_A));
2093 	}
2094 	mps_rplc->rplc127_96 = htonl(t4_read_reg(padap, MPS_VF_RPLCT_MAP3_A));
2095 	mps_rplc->rplc95_64 = htonl(t4_read_reg(padap, MPS_VF_RPLCT_MAP2_A));
2096 	mps_rplc->rplc63_32 = htonl(t4_read_reg(padap, MPS_VF_RPLCT_MAP1_A));
2097 	mps_rplc->rplc31_0 = htonl(t4_read_reg(padap, MPS_VF_RPLCT_MAP0_A));
2098 }
2099 
2100 static int cudbg_collect_tcam_index(struct cudbg_init *pdbg_init,
2101 				    struct cudbg_mps_tcam *tcam, u32 idx)
2102 {
2103 	struct adapter *padap = pdbg_init->adap;
2104 	u64 tcamy, tcamx, val;
2105 	u32 ctl, data2;
2106 	int rc = 0;
2107 
2108 	if (CHELSIO_CHIP_VERSION(padap->params.chip) >= CHELSIO_T6) {
2109 		/* CtlReqID   - 1: use Host Driver Requester ID
2110 		 * CtlCmdType - 0: Read, 1: Write
2111 		 * CtlTcamSel - 0: TCAM0, 1: TCAM1
2112 		 * CtlXYBitSel- 0: Y bit, 1: X bit
2113 		 */
2114 
2115 		/* Read tcamy */
2116 		ctl = CTLREQID_V(1) | CTLCMDTYPE_V(0) | CTLXYBITSEL_V(0);
2117 		if (idx < 256)
2118 			ctl |= CTLTCAMINDEX_V(idx) | CTLTCAMSEL_V(0);
2119 		else
2120 			ctl |= CTLTCAMINDEX_V(idx - 256) | CTLTCAMSEL_V(1);
2121 
2122 		t4_write_reg(padap, MPS_CLS_TCAM_DATA2_CTL_A, ctl);
2123 		val = t4_read_reg(padap, MPS_CLS_TCAM_RDATA1_REQ_ID1_A);
2124 		tcamy = DMACH_G(val) << 32;
2125 		tcamy |= t4_read_reg(padap, MPS_CLS_TCAM_RDATA0_REQ_ID1_A);
2126 		data2 = t4_read_reg(padap, MPS_CLS_TCAM_RDATA2_REQ_ID1_A);
2127 		tcam->lookup_type = DATALKPTYPE_G(data2);
2128 
2129 		/* 0 - Outer header, 1 - Inner header
2130 		 * [71:48] bit locations are overloaded for
2131 		 * outer vs. inner lookup types.
2132 		 */
2133 		if (tcam->lookup_type && tcam->lookup_type != DATALKPTYPE_M) {
2134 			/* Inner header VNI */
2135 			tcam->vniy = (data2 & DATAVIDH2_F) | DATAVIDH1_G(data2);
2136 			tcam->vniy = (tcam->vniy << 16) | VIDL_G(val);
2137 			tcam->dip_hit = data2 & DATADIPHIT_F;
2138 		} else {
2139 			tcam->vlan_vld = data2 & DATAVIDH2_F;
2140 			tcam->ivlan = VIDL_G(val);
2141 		}
2142 
2143 		tcam->port_num = DATAPORTNUM_G(data2);
2144 
2145 		/* Read tcamx. Change the control param */
2146 		ctl |= CTLXYBITSEL_V(1);
2147 		t4_write_reg(padap, MPS_CLS_TCAM_DATA2_CTL_A, ctl);
2148 		val = t4_read_reg(padap, MPS_CLS_TCAM_RDATA1_REQ_ID1_A);
2149 		tcamx = DMACH_G(val) << 32;
2150 		tcamx |= t4_read_reg(padap, MPS_CLS_TCAM_RDATA0_REQ_ID1_A);
2151 		data2 = t4_read_reg(padap, MPS_CLS_TCAM_RDATA2_REQ_ID1_A);
2152 		if (tcam->lookup_type && tcam->lookup_type != DATALKPTYPE_M) {
2153 			/* Inner header VNI mask */
2154 			tcam->vnix = (data2 & DATAVIDH2_F) | DATAVIDH1_G(data2);
2155 			tcam->vnix = (tcam->vnix << 16) | VIDL_G(val);
2156 		}
2157 	} else {
2158 		tcamy = t4_read_reg64(padap, MPS_CLS_TCAM_Y_L(idx));
2159 		tcamx = t4_read_reg64(padap, MPS_CLS_TCAM_X_L(idx));
2160 	}
2161 
2162 	/* If no entry, return */
2163 	if (tcamx & tcamy)
2164 		return rc;
2165 
2166 	tcam->cls_lo = t4_read_reg(padap, MPS_CLS_SRAM_L(idx));
2167 	tcam->cls_hi = t4_read_reg(padap, MPS_CLS_SRAM_H(idx));
2168 
2169 	if (is_t5(padap->params.chip))
2170 		tcam->repli = (tcam->cls_lo & REPLICATE_F);
2171 	else if (is_t6(padap->params.chip))
2172 		tcam->repli = (tcam->cls_lo & T6_REPLICATE_F);
2173 
2174 	if (tcam->repli) {
2175 		struct fw_ldst_cmd ldst_cmd;
2176 		struct fw_ldst_mps_rplc mps_rplc;
2177 
2178 		memset(&ldst_cmd, 0, sizeof(ldst_cmd));
2179 		ldst_cmd.op_to_addrspace =
2180 			htonl(FW_CMD_OP_V(FW_LDST_CMD) |
2181 			      FW_CMD_REQUEST_F | FW_CMD_READ_F |
2182 			      FW_LDST_CMD_ADDRSPACE_V(FW_LDST_ADDRSPC_MPS));
2183 		ldst_cmd.cycles_to_len16 = htonl(FW_LEN16(ldst_cmd));
2184 		ldst_cmd.u.mps.rplc.fid_idx =
2185 			htons(FW_LDST_CMD_FID_V(FW_LDST_MPS_RPLC) |
2186 			      FW_LDST_CMD_IDX_V(idx));
2187 
2188 		/* If firmware is not attached/alive, use backdoor register
2189 		 * access to collect dump.
2190 		 */
2191 		if (is_fw_attached(pdbg_init))
2192 			rc = t4_wr_mbox(padap, padap->mbox, &ldst_cmd,
2193 					sizeof(ldst_cmd), &ldst_cmd);
2194 
2195 		if (rc || !is_fw_attached(pdbg_init)) {
2196 			cudbg_mps_rpl_backdoor(padap, &mps_rplc);
2197 			/* Ignore error since we collected directly from
2198 			 * reading registers.
2199 			 */
2200 			rc = 0;
2201 		} else {
2202 			mps_rplc = ldst_cmd.u.mps.rplc;
2203 		}
2204 
2205 		tcam->rplc[0] = ntohl(mps_rplc.rplc31_0);
2206 		tcam->rplc[1] = ntohl(mps_rplc.rplc63_32);
2207 		tcam->rplc[2] = ntohl(mps_rplc.rplc95_64);
2208 		tcam->rplc[3] = ntohl(mps_rplc.rplc127_96);
2209 		if (padap->params.arch.mps_rplc_size > CUDBG_MAX_RPLC_SIZE) {
2210 			tcam->rplc[4] = ntohl(mps_rplc.rplc159_128);
2211 			tcam->rplc[5] = ntohl(mps_rplc.rplc191_160);
2212 			tcam->rplc[6] = ntohl(mps_rplc.rplc223_192);
2213 			tcam->rplc[7] = ntohl(mps_rplc.rplc255_224);
2214 		}
2215 	}
2216 	cudbg_tcamxy2valmask(tcamx, tcamy, tcam->addr, &tcam->mask);
2217 	tcam->idx = idx;
2218 	tcam->rplc_size = padap->params.arch.mps_rplc_size;
2219 	return rc;
2220 }
2221 
2222 int cudbg_collect_mps_tcam(struct cudbg_init *pdbg_init,
2223 			   struct cudbg_buffer *dbg_buff,
2224 			   struct cudbg_error *cudbg_err)
2225 {
2226 	struct adapter *padap = pdbg_init->adap;
2227 	struct cudbg_buffer temp_buff = { 0 };
2228 	u32 size = 0, i, n, total_size = 0;
2229 	struct cudbg_mps_tcam *tcam;
2230 	int rc;
2231 
2232 	n = padap->params.arch.mps_tcam_size;
2233 	size = sizeof(struct cudbg_mps_tcam) * n;
2234 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2235 	if (rc)
2236 		return rc;
2237 
2238 	tcam = (struct cudbg_mps_tcam *)temp_buff.data;
2239 	for (i = 0; i < n; i++) {
2240 		rc = cudbg_collect_tcam_index(pdbg_init, tcam, i);
2241 		if (rc) {
2242 			cudbg_err->sys_err = rc;
2243 			cudbg_put_buff(pdbg_init, &temp_buff);
2244 			return rc;
2245 		}
2246 		total_size += sizeof(struct cudbg_mps_tcam);
2247 		tcam++;
2248 	}
2249 
2250 	if (!total_size) {
2251 		rc = CUDBG_SYSTEM_ERROR;
2252 		cudbg_err->sys_err = rc;
2253 		cudbg_put_buff(pdbg_init, &temp_buff);
2254 		return rc;
2255 	}
2256 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2257 }
2258 
2259 int cudbg_collect_vpd_data(struct cudbg_init *pdbg_init,
2260 			   struct cudbg_buffer *dbg_buff,
2261 			   struct cudbg_error *cudbg_err)
2262 {
2263 	struct adapter *padap = pdbg_init->adap;
2264 	struct cudbg_buffer temp_buff = { 0 };
2265 	char vpd_str[CUDBG_VPD_VER_LEN + 1];
2266 	u32 scfg_vers, vpd_vers, fw_vers;
2267 	struct cudbg_vpd_data *vpd_data;
2268 	struct vpd_params vpd = { 0 };
2269 	int rc, ret;
2270 
2271 	rc = t4_get_raw_vpd_params(padap, &vpd);
2272 	if (rc)
2273 		return rc;
2274 
2275 	rc = t4_get_fw_version(padap, &fw_vers);
2276 	if (rc)
2277 		return rc;
2278 
2279 	/* Serial Configuration Version is located beyond the PF's vpd size.
2280 	 * Temporarily give access to entire EEPROM to get it.
2281 	 */
2282 	rc = pci_set_vpd_size(padap->pdev, EEPROMVSIZE);
2283 	if (rc < 0)
2284 		return rc;
2285 
2286 	ret = cudbg_read_vpd_reg(padap, CUDBG_SCFG_VER_ADDR, CUDBG_SCFG_VER_LEN,
2287 				 &scfg_vers);
2288 
2289 	/* Restore back to original PF's vpd size */
2290 	rc = pci_set_vpd_size(padap->pdev, CUDBG_VPD_PF_SIZE);
2291 	if (rc < 0)
2292 		return rc;
2293 
2294 	if (ret)
2295 		return ret;
2296 
2297 	rc = cudbg_read_vpd_reg(padap, CUDBG_VPD_VER_ADDR, CUDBG_VPD_VER_LEN,
2298 				vpd_str);
2299 	if (rc)
2300 		return rc;
2301 
2302 	vpd_str[CUDBG_VPD_VER_LEN] = '\0';
2303 	rc = kstrtouint(vpd_str, 0, &vpd_vers);
2304 	if (rc)
2305 		return rc;
2306 
2307 	rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_vpd_data),
2308 			    &temp_buff);
2309 	if (rc)
2310 		return rc;
2311 
2312 	vpd_data = (struct cudbg_vpd_data *)temp_buff.data;
2313 	memcpy(vpd_data->sn, vpd.sn, SERNUM_LEN + 1);
2314 	memcpy(vpd_data->bn, vpd.pn, PN_LEN + 1);
2315 	memcpy(vpd_data->na, vpd.na, MACADDR_LEN + 1);
2316 	memcpy(vpd_data->mn, vpd.id, ID_LEN + 1);
2317 	vpd_data->scfg_vers = scfg_vers;
2318 	vpd_data->vpd_vers = vpd_vers;
2319 	vpd_data->fw_major = FW_HDR_FW_VER_MAJOR_G(fw_vers);
2320 	vpd_data->fw_minor = FW_HDR_FW_VER_MINOR_G(fw_vers);
2321 	vpd_data->fw_micro = FW_HDR_FW_VER_MICRO_G(fw_vers);
2322 	vpd_data->fw_build = FW_HDR_FW_VER_BUILD_G(fw_vers);
2323 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2324 }
2325 
2326 static int cudbg_read_tid(struct cudbg_init *pdbg_init, u32 tid,
2327 			  struct cudbg_tid_data *tid_data)
2328 {
2329 	struct adapter *padap = pdbg_init->adap;
2330 	int i, cmd_retry = 8;
2331 	u32 val;
2332 
2333 	/* Fill REQ_DATA regs with 0's */
2334 	for (i = 0; i < NUM_LE_DB_DBGI_REQ_DATA_INSTANCES; i++)
2335 		t4_write_reg(padap, LE_DB_DBGI_REQ_DATA_A + (i << 2), 0);
2336 
2337 	/* Write DBIG command */
2338 	val = DBGICMD_V(4) | DBGITID_V(tid);
2339 	t4_write_reg(padap, LE_DB_DBGI_REQ_TCAM_CMD_A, val);
2340 	tid_data->dbig_cmd = val;
2341 
2342 	val = DBGICMDSTRT_F | DBGICMDMODE_V(1); /* LE mode */
2343 	t4_write_reg(padap, LE_DB_DBGI_CONFIG_A, val);
2344 	tid_data->dbig_conf = val;
2345 
2346 	/* Poll the DBGICMDBUSY bit */
2347 	val = 1;
2348 	while (val) {
2349 		val = t4_read_reg(padap, LE_DB_DBGI_CONFIG_A);
2350 		val = val & DBGICMDBUSY_F;
2351 		cmd_retry--;
2352 		if (!cmd_retry)
2353 			return CUDBG_SYSTEM_ERROR;
2354 	}
2355 
2356 	/* Check RESP status */
2357 	val = t4_read_reg(padap, LE_DB_DBGI_RSP_STATUS_A);
2358 	tid_data->dbig_rsp_stat = val;
2359 	if (!(val & 1))
2360 		return CUDBG_SYSTEM_ERROR;
2361 
2362 	/* Read RESP data */
2363 	for (i = 0; i < NUM_LE_DB_DBGI_RSP_DATA_INSTANCES; i++)
2364 		tid_data->data[i] = t4_read_reg(padap,
2365 						LE_DB_DBGI_RSP_DATA_A +
2366 						(i << 2));
2367 	tid_data->tid = tid;
2368 	return 0;
2369 }
2370 
2371 static int cudbg_get_le_type(u32 tid, struct cudbg_tcam tcam_region)
2372 {
2373 	int type = LE_ET_UNKNOWN;
2374 
2375 	if (tid < tcam_region.server_start)
2376 		type = LE_ET_TCAM_CON;
2377 	else if (tid < tcam_region.filter_start)
2378 		type = LE_ET_TCAM_SERVER;
2379 	else if (tid < tcam_region.clip_start)
2380 		type = LE_ET_TCAM_FILTER;
2381 	else if (tid < tcam_region.routing_start)
2382 		type = LE_ET_TCAM_CLIP;
2383 	else if (tid < tcam_region.tid_hash_base)
2384 		type = LE_ET_TCAM_ROUTING;
2385 	else if (tid < tcam_region.max_tid)
2386 		type = LE_ET_HASH_CON;
2387 	else
2388 		type = LE_ET_INVALID_TID;
2389 
2390 	return type;
2391 }
2392 
2393 static int cudbg_is_ipv6_entry(struct cudbg_tid_data *tid_data,
2394 			       struct cudbg_tcam tcam_region)
2395 {
2396 	int ipv6 = 0;
2397 	int le_type;
2398 
2399 	le_type = cudbg_get_le_type(tid_data->tid, tcam_region);
2400 	if (tid_data->tid & 1)
2401 		return 0;
2402 
2403 	if (le_type == LE_ET_HASH_CON) {
2404 		ipv6 = tid_data->data[16] & 0x8000;
2405 	} else if (le_type == LE_ET_TCAM_CON) {
2406 		ipv6 = tid_data->data[16] & 0x8000;
2407 		if (ipv6)
2408 			ipv6 = tid_data->data[9] == 0x00C00000;
2409 	} else {
2410 		ipv6 = 0;
2411 	}
2412 	return ipv6;
2413 }
2414 
2415 void cudbg_fill_le_tcam_info(struct adapter *padap,
2416 			     struct cudbg_tcam *tcam_region)
2417 {
2418 	u32 value;
2419 
2420 	/* Get the LE regions */
2421 	value = t4_read_reg(padap, LE_DB_TID_HASHBASE_A); /* hash base index */
2422 	tcam_region->tid_hash_base = value;
2423 
2424 	/* Get routing table index */
2425 	value = t4_read_reg(padap, LE_DB_ROUTING_TABLE_INDEX_A);
2426 	tcam_region->routing_start = value;
2427 
2428 	/* Get clip table index. For T6 there is separate CLIP TCAM */
2429 	if (is_t6(padap->params.chip))
2430 		value = t4_read_reg(padap, LE_DB_CLCAM_TID_BASE_A);
2431 	else
2432 		value = t4_read_reg(padap, LE_DB_CLIP_TABLE_INDEX_A);
2433 	tcam_region->clip_start = value;
2434 
2435 	/* Get filter table index */
2436 	value = t4_read_reg(padap, LE_DB_FILTER_TABLE_INDEX_A);
2437 	tcam_region->filter_start = value;
2438 
2439 	/* Get server table index */
2440 	value = t4_read_reg(padap, LE_DB_SERVER_INDEX_A);
2441 	tcam_region->server_start = value;
2442 
2443 	/* Check whether hash is enabled and calculate the max tids */
2444 	value = t4_read_reg(padap, LE_DB_CONFIG_A);
2445 	if ((value >> HASHEN_S) & 1) {
2446 		value = t4_read_reg(padap, LE_DB_HASH_CONFIG_A);
2447 		if (CHELSIO_CHIP_VERSION(padap->params.chip) > CHELSIO_T5) {
2448 			tcam_region->max_tid = (value & 0xFFFFF) +
2449 					       tcam_region->tid_hash_base;
2450 		} else {
2451 			value = HASHTIDSIZE_G(value);
2452 			value = 1 << value;
2453 			tcam_region->max_tid = value +
2454 					       tcam_region->tid_hash_base;
2455 		}
2456 	} else { /* hash not enabled */
2457 		if (is_t6(padap->params.chip))
2458 			tcam_region->max_tid = (value & ASLIPCOMPEN_F) ?
2459 					       CUDBG_MAX_TID_COMP_EN :
2460 					       CUDBG_MAX_TID_COMP_DIS;
2461 		else
2462 			tcam_region->max_tid = CUDBG_MAX_TCAM_TID;
2463 	}
2464 
2465 	if (is_t6(padap->params.chip))
2466 		tcam_region->max_tid += CUDBG_T6_CLIP;
2467 }
2468 
2469 int cudbg_collect_le_tcam(struct cudbg_init *pdbg_init,
2470 			  struct cudbg_buffer *dbg_buff,
2471 			  struct cudbg_error *cudbg_err)
2472 {
2473 	struct adapter *padap = pdbg_init->adap;
2474 	struct cudbg_buffer temp_buff = { 0 };
2475 	struct cudbg_tcam tcam_region = { 0 };
2476 	struct cudbg_tid_data *tid_data;
2477 	u32 bytes = 0;
2478 	int rc, size;
2479 	u32 i;
2480 
2481 	cudbg_fill_le_tcam_info(padap, &tcam_region);
2482 
2483 	size = sizeof(struct cudbg_tid_data) * tcam_region.max_tid;
2484 	size += sizeof(struct cudbg_tcam);
2485 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2486 	if (rc)
2487 		return rc;
2488 
2489 	memcpy(temp_buff.data, &tcam_region, sizeof(struct cudbg_tcam));
2490 	bytes = sizeof(struct cudbg_tcam);
2491 	tid_data = (struct cudbg_tid_data *)(temp_buff.data + bytes);
2492 	/* read all tid */
2493 	for (i = 0; i < tcam_region.max_tid; ) {
2494 		rc = cudbg_read_tid(pdbg_init, i, tid_data);
2495 		if (rc) {
2496 			cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
2497 			/* Update tcam header and exit */
2498 			tcam_region.max_tid = i;
2499 			memcpy(temp_buff.data, &tcam_region,
2500 			       sizeof(struct cudbg_tcam));
2501 			goto out;
2502 		}
2503 
2504 		if (cudbg_is_ipv6_entry(tid_data, tcam_region)) {
2505 			/* T6 CLIP TCAM: ipv6 takes 4 entries */
2506 			if (is_t6(padap->params.chip) &&
2507 			    i >= tcam_region.clip_start &&
2508 			    i < tcam_region.clip_start + CUDBG_T6_CLIP)
2509 				i += 4;
2510 			else /* Main TCAM: ipv6 takes two tids */
2511 				i += 2;
2512 		} else {
2513 			i++;
2514 		}
2515 
2516 		tid_data++;
2517 		bytes += sizeof(struct cudbg_tid_data);
2518 	}
2519 
2520 out:
2521 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2522 }
2523 
2524 int cudbg_collect_cctrl(struct cudbg_init *pdbg_init,
2525 			struct cudbg_buffer *dbg_buff,
2526 			struct cudbg_error *cudbg_err)
2527 {
2528 	struct adapter *padap = pdbg_init->adap;
2529 	struct cudbg_buffer temp_buff = { 0 };
2530 	u32 size;
2531 	int rc;
2532 
2533 	size = sizeof(u16) * NMTUS * NCCTRL_WIN;
2534 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2535 	if (rc)
2536 		return rc;
2537 
2538 	t4_read_cong_tbl(padap, (void *)temp_buff.data);
2539 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2540 }
2541 
2542 int cudbg_collect_ma_indirect(struct cudbg_init *pdbg_init,
2543 			      struct cudbg_buffer *dbg_buff,
2544 			      struct cudbg_error *cudbg_err)
2545 {
2546 	struct adapter *padap = pdbg_init->adap;
2547 	struct cudbg_buffer temp_buff = { 0 };
2548 	struct ireg_buf *ma_indr;
2549 	int i, rc, n;
2550 	u32 size, j;
2551 
2552 	if (CHELSIO_CHIP_VERSION(padap->params.chip) < CHELSIO_T6)
2553 		return CUDBG_STATUS_ENTITY_NOT_FOUND;
2554 
2555 	n = sizeof(t6_ma_ireg_array) / (IREG_NUM_ELEM * sizeof(u32));
2556 	size = sizeof(struct ireg_buf) * n * 2;
2557 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2558 	if (rc)
2559 		return rc;
2560 
2561 	ma_indr = (struct ireg_buf *)temp_buff.data;
2562 	for (i = 0; i < n; i++) {
2563 		struct ireg_field *ma_fli = &ma_indr->tp_pio;
2564 		u32 *buff = ma_indr->outbuf;
2565 
2566 		ma_fli->ireg_addr = t6_ma_ireg_array[i][0];
2567 		ma_fli->ireg_data = t6_ma_ireg_array[i][1];
2568 		ma_fli->ireg_local_offset = t6_ma_ireg_array[i][2];
2569 		ma_fli->ireg_offset_range = t6_ma_ireg_array[i][3];
2570 		t4_read_indirect(padap, ma_fli->ireg_addr, ma_fli->ireg_data,
2571 				 buff, ma_fli->ireg_offset_range,
2572 				 ma_fli->ireg_local_offset);
2573 		ma_indr++;
2574 	}
2575 
2576 	n = sizeof(t6_ma_ireg_array2) / (IREG_NUM_ELEM * sizeof(u32));
2577 	for (i = 0; i < n; i++) {
2578 		struct ireg_field *ma_fli = &ma_indr->tp_pio;
2579 		u32 *buff = ma_indr->outbuf;
2580 
2581 		ma_fli->ireg_addr = t6_ma_ireg_array2[i][0];
2582 		ma_fli->ireg_data = t6_ma_ireg_array2[i][1];
2583 		ma_fli->ireg_local_offset = t6_ma_ireg_array2[i][2];
2584 		for (j = 0; j < t6_ma_ireg_array2[i][3]; j++) {
2585 			t4_read_indirect(padap, ma_fli->ireg_addr,
2586 					 ma_fli->ireg_data, buff, 1,
2587 					 ma_fli->ireg_local_offset);
2588 			buff++;
2589 			ma_fli->ireg_local_offset += 0x20;
2590 		}
2591 		ma_indr++;
2592 	}
2593 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2594 }
2595 
2596 int cudbg_collect_ulptx_la(struct cudbg_init *pdbg_init,
2597 			   struct cudbg_buffer *dbg_buff,
2598 			   struct cudbg_error *cudbg_err)
2599 {
2600 	struct adapter *padap = pdbg_init->adap;
2601 	struct cudbg_buffer temp_buff = { 0 };
2602 	struct cudbg_ulptx_la *ulptx_la_buff;
2603 	struct cudbg_ver_hdr *ver_hdr;
2604 	u32 i, j;
2605 	int rc;
2606 
2607 	rc = cudbg_get_buff(pdbg_init, dbg_buff,
2608 			    sizeof(struct cudbg_ver_hdr) +
2609 			    sizeof(struct cudbg_ulptx_la),
2610 			    &temp_buff);
2611 	if (rc)
2612 		return rc;
2613 
2614 	ver_hdr = (struct cudbg_ver_hdr *)temp_buff.data;
2615 	ver_hdr->signature = CUDBG_ENTITY_SIGNATURE;
2616 	ver_hdr->revision = CUDBG_ULPTX_LA_REV;
2617 	ver_hdr->size = sizeof(struct cudbg_ulptx_la);
2618 
2619 	ulptx_la_buff = (struct cudbg_ulptx_la *)(temp_buff.data +
2620 						  sizeof(*ver_hdr));
2621 	for (i = 0; i < CUDBG_NUM_ULPTX; i++) {
2622 		ulptx_la_buff->rdptr[i] = t4_read_reg(padap,
2623 						      ULP_TX_LA_RDPTR_0_A +
2624 						      0x10 * i);
2625 		ulptx_la_buff->wrptr[i] = t4_read_reg(padap,
2626 						      ULP_TX_LA_WRPTR_0_A +
2627 						      0x10 * i);
2628 		ulptx_la_buff->rddata[i] = t4_read_reg(padap,
2629 						       ULP_TX_LA_RDDATA_0_A +
2630 						       0x10 * i);
2631 		for (j = 0; j < CUDBG_NUM_ULPTX_READ; j++)
2632 			ulptx_la_buff->rd_data[i][j] =
2633 				t4_read_reg(padap,
2634 					    ULP_TX_LA_RDDATA_0_A + 0x10 * i);
2635 	}
2636 
2637 	for (i = 0; i < CUDBG_NUM_ULPTX_ASIC_READ; i++) {
2638 		t4_write_reg(padap, ULP_TX_ASIC_DEBUG_CTRL_A, 0x1);
2639 		ulptx_la_buff->rdptr_asic[i] =
2640 				t4_read_reg(padap, ULP_TX_ASIC_DEBUG_CTRL_A);
2641 		ulptx_la_buff->rddata_asic[i][0] =
2642 				t4_read_reg(padap, ULP_TX_ASIC_DEBUG_0_A);
2643 		ulptx_la_buff->rddata_asic[i][1] =
2644 				t4_read_reg(padap, ULP_TX_ASIC_DEBUG_1_A);
2645 		ulptx_la_buff->rddata_asic[i][2] =
2646 				t4_read_reg(padap, ULP_TX_ASIC_DEBUG_2_A);
2647 		ulptx_la_buff->rddata_asic[i][3] =
2648 				t4_read_reg(padap, ULP_TX_ASIC_DEBUG_3_A);
2649 		ulptx_la_buff->rddata_asic[i][4] =
2650 				t4_read_reg(padap, ULP_TX_ASIC_DEBUG_4_A);
2651 		ulptx_la_buff->rddata_asic[i][5] =
2652 				t4_read_reg(padap, PM_RX_BASE_ADDR);
2653 	}
2654 
2655 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2656 }
2657 
2658 int cudbg_collect_up_cim_indirect(struct cudbg_init *pdbg_init,
2659 				  struct cudbg_buffer *dbg_buff,
2660 				  struct cudbg_error *cudbg_err)
2661 {
2662 	struct adapter *padap = pdbg_init->adap;
2663 	struct cudbg_buffer temp_buff = { 0 };
2664 	u32 local_offset, local_range;
2665 	struct ireg_buf *up_cim;
2666 	u32 size, j, iter;
2667 	u32 instance = 0;
2668 	int i, rc, n;
2669 
2670 	if (is_t5(padap->params.chip))
2671 		n = sizeof(t5_up_cim_reg_array) /
2672 		    ((IREG_NUM_ELEM + 1) * sizeof(u32));
2673 	else if (is_t6(padap->params.chip))
2674 		n = sizeof(t6_up_cim_reg_array) /
2675 		    ((IREG_NUM_ELEM + 1) * sizeof(u32));
2676 	else
2677 		return CUDBG_STATUS_NOT_IMPLEMENTED;
2678 
2679 	size = sizeof(struct ireg_buf) * n;
2680 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2681 	if (rc)
2682 		return rc;
2683 
2684 	up_cim = (struct ireg_buf *)temp_buff.data;
2685 	for (i = 0; i < n; i++) {
2686 		struct ireg_field *up_cim_reg = &up_cim->tp_pio;
2687 		u32 *buff = up_cim->outbuf;
2688 
2689 		if (is_t5(padap->params.chip)) {
2690 			up_cim_reg->ireg_addr = t5_up_cim_reg_array[i][0];
2691 			up_cim_reg->ireg_data = t5_up_cim_reg_array[i][1];
2692 			up_cim_reg->ireg_local_offset =
2693 						t5_up_cim_reg_array[i][2];
2694 			up_cim_reg->ireg_offset_range =
2695 						t5_up_cim_reg_array[i][3];
2696 			instance = t5_up_cim_reg_array[i][4];
2697 		} else if (is_t6(padap->params.chip)) {
2698 			up_cim_reg->ireg_addr = t6_up_cim_reg_array[i][0];
2699 			up_cim_reg->ireg_data = t6_up_cim_reg_array[i][1];
2700 			up_cim_reg->ireg_local_offset =
2701 						t6_up_cim_reg_array[i][2];
2702 			up_cim_reg->ireg_offset_range =
2703 						t6_up_cim_reg_array[i][3];
2704 			instance = t6_up_cim_reg_array[i][4];
2705 		}
2706 
2707 		switch (instance) {
2708 		case NUM_CIM_CTL_TSCH_CHANNEL_INSTANCES:
2709 			iter = up_cim_reg->ireg_offset_range;
2710 			local_offset = 0x120;
2711 			local_range = 1;
2712 			break;
2713 		case NUM_CIM_CTL_TSCH_CHANNEL_TSCH_CLASS_INSTANCES:
2714 			iter = up_cim_reg->ireg_offset_range;
2715 			local_offset = 0x10;
2716 			local_range = 1;
2717 			break;
2718 		default:
2719 			iter = 1;
2720 			local_offset = 0;
2721 			local_range = up_cim_reg->ireg_offset_range;
2722 			break;
2723 		}
2724 
2725 		for (j = 0; j < iter; j++, buff++) {
2726 			rc = t4_cim_read(padap,
2727 					 up_cim_reg->ireg_local_offset +
2728 					 (j * local_offset), local_range, buff);
2729 			if (rc) {
2730 				cudbg_put_buff(pdbg_init, &temp_buff);
2731 				return rc;
2732 			}
2733 		}
2734 		up_cim++;
2735 	}
2736 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2737 }
2738 
2739 int cudbg_collect_pbt_tables(struct cudbg_init *pdbg_init,
2740 			     struct cudbg_buffer *dbg_buff,
2741 			     struct cudbg_error *cudbg_err)
2742 {
2743 	struct adapter *padap = pdbg_init->adap;
2744 	struct cudbg_buffer temp_buff = { 0 };
2745 	struct cudbg_pbt_tables *pbt;
2746 	int i, rc;
2747 	u32 addr;
2748 
2749 	rc = cudbg_get_buff(pdbg_init, dbg_buff,
2750 			    sizeof(struct cudbg_pbt_tables),
2751 			    &temp_buff);
2752 	if (rc)
2753 		return rc;
2754 
2755 	pbt = (struct cudbg_pbt_tables *)temp_buff.data;
2756 	/* PBT dynamic entries */
2757 	addr = CUDBG_CHAC_PBT_ADDR;
2758 	for (i = 0; i < CUDBG_PBT_DYNAMIC_ENTRIES; i++) {
2759 		rc = t4_cim_read(padap, addr + (i * 4), 1,
2760 				 &pbt->pbt_dynamic[i]);
2761 		if (rc) {
2762 			cudbg_err->sys_err = rc;
2763 			cudbg_put_buff(pdbg_init, &temp_buff);
2764 			return rc;
2765 		}
2766 	}
2767 
2768 	/* PBT static entries */
2769 	/* static entries start when bit 6 is set */
2770 	addr = CUDBG_CHAC_PBT_ADDR + (1 << 6);
2771 	for (i = 0; i < CUDBG_PBT_STATIC_ENTRIES; i++) {
2772 		rc = t4_cim_read(padap, addr + (i * 4), 1,
2773 				 &pbt->pbt_static[i]);
2774 		if (rc) {
2775 			cudbg_err->sys_err = rc;
2776 			cudbg_put_buff(pdbg_init, &temp_buff);
2777 			return rc;
2778 		}
2779 	}
2780 
2781 	/* LRF entries */
2782 	addr = CUDBG_CHAC_PBT_LRF;
2783 	for (i = 0; i < CUDBG_LRF_ENTRIES; i++) {
2784 		rc = t4_cim_read(padap, addr + (i * 4), 1,
2785 				 &pbt->lrf_table[i]);
2786 		if (rc) {
2787 			cudbg_err->sys_err = rc;
2788 			cudbg_put_buff(pdbg_init, &temp_buff);
2789 			return rc;
2790 		}
2791 	}
2792 
2793 	/* PBT data entries */
2794 	addr = CUDBG_CHAC_PBT_DATA;
2795 	for (i = 0; i < CUDBG_PBT_DATA_ENTRIES; i++) {
2796 		rc = t4_cim_read(padap, addr + (i * 4), 1,
2797 				 &pbt->pbt_data[i]);
2798 		if (rc) {
2799 			cudbg_err->sys_err = rc;
2800 			cudbg_put_buff(pdbg_init, &temp_buff);
2801 			return rc;
2802 		}
2803 	}
2804 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2805 }
2806 
2807 int cudbg_collect_mbox_log(struct cudbg_init *pdbg_init,
2808 			   struct cudbg_buffer *dbg_buff,
2809 			   struct cudbg_error *cudbg_err)
2810 {
2811 	struct adapter *padap = pdbg_init->adap;
2812 	struct cudbg_mbox_log *mboxlog = NULL;
2813 	struct cudbg_buffer temp_buff = { 0 };
2814 	struct mbox_cmd_log *log = NULL;
2815 	struct mbox_cmd *entry;
2816 	unsigned int entry_idx;
2817 	u16 mbox_cmds;
2818 	int i, k, rc;
2819 	u64 flit;
2820 	u32 size;
2821 
2822 	log = padap->mbox_log;
2823 	mbox_cmds = padap->mbox_log->size;
2824 	size = sizeof(struct cudbg_mbox_log) * mbox_cmds;
2825 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2826 	if (rc)
2827 		return rc;
2828 
2829 	mboxlog = (struct cudbg_mbox_log *)temp_buff.data;
2830 	for (k = 0; k < mbox_cmds; k++) {
2831 		entry_idx = log->cursor + k;
2832 		if (entry_idx >= log->size)
2833 			entry_idx -= log->size;
2834 
2835 		entry = mbox_cmd_log_entry(log, entry_idx);
2836 		/* skip over unused entries */
2837 		if (entry->timestamp == 0)
2838 			continue;
2839 
2840 		memcpy(&mboxlog->entry, entry, sizeof(struct mbox_cmd));
2841 		for (i = 0; i < MBOX_LEN / 8; i++) {
2842 			flit = entry->cmd[i];
2843 			mboxlog->hi[i] = (u32)(flit >> 32);
2844 			mboxlog->lo[i] = (u32)flit;
2845 		}
2846 		mboxlog++;
2847 	}
2848 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2849 }
2850 
2851 int cudbg_collect_hma_indirect(struct cudbg_init *pdbg_init,
2852 			       struct cudbg_buffer *dbg_buff,
2853 			       struct cudbg_error *cudbg_err)
2854 {
2855 	struct adapter *padap = pdbg_init->adap;
2856 	struct cudbg_buffer temp_buff = { 0 };
2857 	struct ireg_buf *hma_indr;
2858 	int i, rc, n;
2859 	u32 size;
2860 
2861 	if (CHELSIO_CHIP_VERSION(padap->params.chip) < CHELSIO_T6)
2862 		return CUDBG_STATUS_ENTITY_NOT_FOUND;
2863 
2864 	n = sizeof(t6_hma_ireg_array) / (IREG_NUM_ELEM * sizeof(u32));
2865 	size = sizeof(struct ireg_buf) * n;
2866 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2867 	if (rc)
2868 		return rc;
2869 
2870 	hma_indr = (struct ireg_buf *)temp_buff.data;
2871 	for (i = 0; i < n; i++) {
2872 		struct ireg_field *hma_fli = &hma_indr->tp_pio;
2873 		u32 *buff = hma_indr->outbuf;
2874 
2875 		hma_fli->ireg_addr = t6_hma_ireg_array[i][0];
2876 		hma_fli->ireg_data = t6_hma_ireg_array[i][1];
2877 		hma_fli->ireg_local_offset = t6_hma_ireg_array[i][2];
2878 		hma_fli->ireg_offset_range = t6_hma_ireg_array[i][3];
2879 		t4_read_indirect(padap, hma_fli->ireg_addr, hma_fli->ireg_data,
2880 				 buff, hma_fli->ireg_offset_range,
2881 				 hma_fli->ireg_local_offset);
2882 		hma_indr++;
2883 	}
2884 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2885 }
2886 
2887 void cudbg_fill_qdesc_num_and_size(const struct adapter *padap,
2888 				   u32 *num, u32 *size)
2889 {
2890 	u32 tot_entries = 0, tot_size = 0;
2891 
2892 	/* NIC TXQ, RXQ, FLQ, and CTRLQ */
2893 	tot_entries += MAX_ETH_QSETS * 3;
2894 	tot_entries += MAX_CTRL_QUEUES;
2895 
2896 	tot_size += MAX_ETH_QSETS * MAX_TXQ_ENTRIES * MAX_TXQ_DESC_SIZE;
2897 	tot_size += MAX_ETH_QSETS * MAX_RSPQ_ENTRIES * MAX_RXQ_DESC_SIZE;
2898 	tot_size += MAX_ETH_QSETS * MAX_RX_BUFFERS * MAX_FL_DESC_SIZE;
2899 	tot_size += MAX_CTRL_QUEUES * MAX_CTRL_TXQ_ENTRIES *
2900 		    MAX_CTRL_TXQ_DESC_SIZE;
2901 
2902 	/* FW_EVTQ and INTRQ */
2903 	tot_entries += INGQ_EXTRAS;
2904 	tot_size += INGQ_EXTRAS * MAX_RSPQ_ENTRIES * MAX_RXQ_DESC_SIZE;
2905 
2906 	/* PTP_TXQ */
2907 	tot_entries += 1;
2908 	tot_size += MAX_TXQ_ENTRIES * MAX_TXQ_DESC_SIZE;
2909 
2910 	/* ULD TXQ, RXQ, and FLQ */
2911 	tot_entries += CXGB4_TX_MAX * MAX_OFLD_QSETS;
2912 	tot_entries += CXGB4_ULD_MAX * MAX_ULD_QSETS * 2;
2913 
2914 	tot_size += CXGB4_TX_MAX * MAX_OFLD_QSETS * MAX_TXQ_ENTRIES *
2915 		    MAX_TXQ_DESC_SIZE;
2916 	tot_size += CXGB4_ULD_MAX * MAX_ULD_QSETS * MAX_RSPQ_ENTRIES *
2917 		    MAX_RXQ_DESC_SIZE;
2918 	tot_size += CXGB4_ULD_MAX * MAX_ULD_QSETS * MAX_RX_BUFFERS *
2919 		    MAX_FL_DESC_SIZE;
2920 
2921 	/* ULD CIQ */
2922 	tot_entries += CXGB4_ULD_MAX * MAX_ULD_QSETS;
2923 	tot_size += CXGB4_ULD_MAX * MAX_ULD_QSETS * SGE_MAX_IQ_SIZE *
2924 		    MAX_RXQ_DESC_SIZE;
2925 
2926 	tot_size += sizeof(struct cudbg_ver_hdr) +
2927 		    sizeof(struct cudbg_qdesc_info) +
2928 		    sizeof(struct cudbg_qdesc_entry) * tot_entries;
2929 
2930 	if (num)
2931 		*num = tot_entries;
2932 
2933 	if (size)
2934 		*size = tot_size;
2935 }
2936 
2937 int cudbg_collect_qdesc(struct cudbg_init *pdbg_init,
2938 			struct cudbg_buffer *dbg_buff,
2939 			struct cudbg_error *cudbg_err)
2940 {
2941 	u32 num_queues = 0, tot_entries = 0, size = 0;
2942 	struct adapter *padap = pdbg_init->adap;
2943 	struct cudbg_buffer temp_buff = { 0 };
2944 	struct cudbg_qdesc_entry *qdesc_entry;
2945 	struct cudbg_qdesc_info *qdesc_info;
2946 	struct cudbg_ver_hdr *ver_hdr;
2947 	struct sge *s = &padap->sge;
2948 	u32 i, j, cur_off, tot_len;
2949 	u8 *data;
2950 	int rc;
2951 
2952 	cudbg_fill_qdesc_num_and_size(padap, &tot_entries, &size);
2953 	size = min_t(u32, size, CUDBG_DUMP_BUFF_SIZE);
2954 	tot_len = size;
2955 	data = kvzalloc(size, GFP_KERNEL);
2956 	if (!data)
2957 		return -ENOMEM;
2958 
2959 	ver_hdr = (struct cudbg_ver_hdr *)data;
2960 	ver_hdr->signature = CUDBG_ENTITY_SIGNATURE;
2961 	ver_hdr->revision = CUDBG_QDESC_REV;
2962 	ver_hdr->size = sizeof(struct cudbg_qdesc_info);
2963 	size -= sizeof(*ver_hdr);
2964 
2965 	qdesc_info = (struct cudbg_qdesc_info *)(data +
2966 						 sizeof(*ver_hdr));
2967 	size -= sizeof(*qdesc_info);
2968 	qdesc_entry = (struct cudbg_qdesc_entry *)qdesc_info->data;
2969 
2970 #define QDESC_GET(q, desc, type, label) do { \
2971 	if (size <= 0) { \
2972 		goto label; \
2973 	} \
2974 	if (desc) { \
2975 		cudbg_fill_qdesc_##q(q, type, qdesc_entry); \
2976 		size -= sizeof(*qdesc_entry) + qdesc_entry->data_size; \
2977 		num_queues++; \
2978 		qdesc_entry = cudbg_next_qdesc(qdesc_entry); \
2979 	} \
2980 } while (0)
2981 
2982 #define QDESC_GET_TXQ(q, type, label) do { \
2983 	struct sge_txq *txq = (struct sge_txq *)q; \
2984 	QDESC_GET(txq, txq->desc, type, label); \
2985 } while (0)
2986 
2987 #define QDESC_GET_RXQ(q, type, label) do { \
2988 	struct sge_rspq *rxq = (struct sge_rspq *)q; \
2989 	QDESC_GET(rxq, rxq->desc, type, label); \
2990 } while (0)
2991 
2992 #define QDESC_GET_FLQ(q, type, label) do { \
2993 	struct sge_fl *flq = (struct sge_fl *)q; \
2994 	QDESC_GET(flq, flq->desc, type, label); \
2995 } while (0)
2996 
2997 	/* NIC TXQ */
2998 	for (i = 0; i < s->ethqsets; i++)
2999 		QDESC_GET_TXQ(&s->ethtxq[i].q, CUDBG_QTYPE_NIC_TXQ, out);
3000 
3001 	/* NIC RXQ */
3002 	for (i = 0; i < s->ethqsets; i++)
3003 		QDESC_GET_RXQ(&s->ethrxq[i].rspq, CUDBG_QTYPE_NIC_RXQ, out);
3004 
3005 	/* NIC FLQ */
3006 	for (i = 0; i < s->ethqsets; i++)
3007 		QDESC_GET_FLQ(&s->ethrxq[i].fl, CUDBG_QTYPE_NIC_FLQ, out);
3008 
3009 	/* NIC CTRLQ */
3010 	for (i = 0; i < padap->params.nports; i++)
3011 		QDESC_GET_TXQ(&s->ctrlq[i].q, CUDBG_QTYPE_CTRLQ, out);
3012 
3013 	/* FW_EVTQ */
3014 	QDESC_GET_RXQ(&s->fw_evtq, CUDBG_QTYPE_FWEVTQ, out);
3015 
3016 	/* INTRQ */
3017 	QDESC_GET_RXQ(&s->intrq, CUDBG_QTYPE_INTRQ, out);
3018 
3019 	/* PTP_TXQ */
3020 	QDESC_GET_TXQ(&s->ptptxq.q, CUDBG_QTYPE_PTP_TXQ, out);
3021 
3022 	/* ULD Queues */
3023 	mutex_lock(&uld_mutex);
3024 
3025 	if (s->uld_txq_info) {
3026 		struct sge_uld_txq_info *utxq;
3027 
3028 		/* ULD TXQ */
3029 		for (j = 0; j < CXGB4_TX_MAX; j++) {
3030 			if (!s->uld_txq_info[j])
3031 				continue;
3032 
3033 			utxq = s->uld_txq_info[j];
3034 			for (i = 0; i < utxq->ntxq; i++)
3035 				QDESC_GET_TXQ(&utxq->uldtxq[i].q,
3036 					      cudbg_uld_txq_to_qtype(j),
3037 					      out_unlock);
3038 		}
3039 	}
3040 
3041 	if (s->uld_rxq_info) {
3042 		struct sge_uld_rxq_info *urxq;
3043 		u32 base;
3044 
3045 		/* ULD RXQ */
3046 		for (j = 0; j < CXGB4_ULD_MAX; j++) {
3047 			if (!s->uld_rxq_info[j])
3048 				continue;
3049 
3050 			urxq = s->uld_rxq_info[j];
3051 			for (i = 0; i < urxq->nrxq; i++)
3052 				QDESC_GET_RXQ(&urxq->uldrxq[i].rspq,
3053 					      cudbg_uld_rxq_to_qtype(j),
3054 					      out_unlock);
3055 		}
3056 
3057 		/* ULD FLQ */
3058 		for (j = 0; j < CXGB4_ULD_MAX; j++) {
3059 			if (!s->uld_rxq_info[j])
3060 				continue;
3061 
3062 			urxq = s->uld_rxq_info[j];
3063 			for (i = 0; i < urxq->nrxq; i++)
3064 				QDESC_GET_FLQ(&urxq->uldrxq[i].fl,
3065 					      cudbg_uld_flq_to_qtype(j),
3066 					      out_unlock);
3067 		}
3068 
3069 		/* ULD CIQ */
3070 		for (j = 0; j < CXGB4_ULD_MAX; j++) {
3071 			if (!s->uld_rxq_info[j])
3072 				continue;
3073 
3074 			urxq = s->uld_rxq_info[j];
3075 			base = urxq->nrxq;
3076 			for (i = 0; i < urxq->nciq; i++)
3077 				QDESC_GET_RXQ(&urxq->uldrxq[base + i].rspq,
3078 					      cudbg_uld_ciq_to_qtype(j),
3079 					      out_unlock);
3080 		}
3081 	}
3082 
3083 out_unlock:
3084 	mutex_unlock(&uld_mutex);
3085 
3086 out:
3087 	qdesc_info->qdesc_entry_size = sizeof(*qdesc_entry);
3088 	qdesc_info->num_queues = num_queues;
3089 	cur_off = 0;
3090 	while (tot_len) {
3091 		u32 chunk_size = min_t(u32, tot_len, CUDBG_CHUNK_SIZE);
3092 
3093 		rc = cudbg_get_buff(pdbg_init, dbg_buff, chunk_size,
3094 				    &temp_buff);
3095 		if (rc) {
3096 			cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
3097 			goto out_free;
3098 		}
3099 
3100 		memcpy(temp_buff.data, data + cur_off, chunk_size);
3101 		tot_len -= chunk_size;
3102 		cur_off += chunk_size;
3103 		rc = cudbg_write_and_release_buff(pdbg_init, &temp_buff,
3104 						  dbg_buff);
3105 		if (rc) {
3106 			cudbg_put_buff(pdbg_init, &temp_buff);
3107 			cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
3108 			goto out_free;
3109 		}
3110 	}
3111 
3112 out_free:
3113 	if (data)
3114 		kvfree(data);
3115 
3116 #undef QDESC_GET_FLQ
3117 #undef QDESC_GET_RXQ
3118 #undef QDESC_GET_TXQ
3119 #undef QDESC_GET
3120 
3121 	return rc;
3122 }
3123