xref: /linux/drivers/net/ethernet/chelsio/cxgb4/cudbg_lib.c (revision 4d5e3b06e1fc1428be14cd4ebe3b37c1bb34f95d)
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  *  Copyright (C) 2017 Chelsio Communications.  All rights reserved.
4  */
5 
6 #include <linux/sort.h>
7 #include <linux/string.h>
8 
9 #include "t4_regs.h"
10 #include "cxgb4.h"
11 #include "cxgb4_cudbg.h"
12 #include "cudbg_if.h"
13 #include "cudbg_lib_common.h"
14 #include "cudbg_entity.h"
15 #include "cudbg_lib.h"
16 #include "cudbg_zlib.h"
17 
18 static const u32 t6_tp_pio_array[][IREG_NUM_ELEM] = {
19 	{0x7e40, 0x7e44, 0x020, 28}, /* t6_tp_pio_regs_20_to_3b */
20 	{0x7e40, 0x7e44, 0x040, 10}, /* t6_tp_pio_regs_40_to_49 */
21 	{0x7e40, 0x7e44, 0x050, 10}, /* t6_tp_pio_regs_50_to_59 */
22 	{0x7e40, 0x7e44, 0x060, 14}, /* t6_tp_pio_regs_60_to_6d */
23 	{0x7e40, 0x7e44, 0x06F, 1}, /* t6_tp_pio_regs_6f */
24 	{0x7e40, 0x7e44, 0x070, 6}, /* t6_tp_pio_regs_70_to_75 */
25 	{0x7e40, 0x7e44, 0x130, 18}, /* t6_tp_pio_regs_130_to_141 */
26 	{0x7e40, 0x7e44, 0x145, 19}, /* t6_tp_pio_regs_145_to_157 */
27 	{0x7e40, 0x7e44, 0x160, 1}, /* t6_tp_pio_regs_160 */
28 	{0x7e40, 0x7e44, 0x230, 25}, /* t6_tp_pio_regs_230_to_248 */
29 	{0x7e40, 0x7e44, 0x24a, 3}, /* t6_tp_pio_regs_24c */
30 	{0x7e40, 0x7e44, 0x8C0, 1} /* t6_tp_pio_regs_8c0 */
31 };
32 
33 static const u32 t5_tp_pio_array[][IREG_NUM_ELEM] = {
34 	{0x7e40, 0x7e44, 0x020, 28}, /* t5_tp_pio_regs_20_to_3b */
35 	{0x7e40, 0x7e44, 0x040, 19}, /* t5_tp_pio_regs_40_to_52 */
36 	{0x7e40, 0x7e44, 0x054, 2}, /* t5_tp_pio_regs_54_to_55 */
37 	{0x7e40, 0x7e44, 0x060, 13}, /* t5_tp_pio_regs_60_to_6c */
38 	{0x7e40, 0x7e44, 0x06F, 1}, /* t5_tp_pio_regs_6f */
39 	{0x7e40, 0x7e44, 0x120, 4}, /* t5_tp_pio_regs_120_to_123 */
40 	{0x7e40, 0x7e44, 0x12b, 2}, /* t5_tp_pio_regs_12b_to_12c */
41 	{0x7e40, 0x7e44, 0x12f, 21}, /* t5_tp_pio_regs_12f_to_143 */
42 	{0x7e40, 0x7e44, 0x145, 19}, /* t5_tp_pio_regs_145_to_157 */
43 	{0x7e40, 0x7e44, 0x230, 25}, /* t5_tp_pio_regs_230_to_248 */
44 	{0x7e40, 0x7e44, 0x8C0, 1} /* t5_tp_pio_regs_8c0 */
45 };
46 
47 static const u32 t6_tp_tm_pio_array[][IREG_NUM_ELEM] = {
48 	{0x7e18, 0x7e1c, 0x0, 12}
49 };
50 
51 static const u32 t5_tp_tm_pio_array[][IREG_NUM_ELEM] = {
52 	{0x7e18, 0x7e1c, 0x0, 12}
53 };
54 
55 static const u32 t6_tp_mib_index_array[6][IREG_NUM_ELEM] = {
56 	{0x7e50, 0x7e54, 0x0, 13},
57 	{0x7e50, 0x7e54, 0x10, 6},
58 	{0x7e50, 0x7e54, 0x18, 21},
59 	{0x7e50, 0x7e54, 0x30, 32},
60 	{0x7e50, 0x7e54, 0x50, 22},
61 	{0x7e50, 0x7e54, 0x68, 12}
62 };
63 
64 static const u32 t5_tp_mib_index_array[9][IREG_NUM_ELEM] = {
65 	{0x7e50, 0x7e54, 0x0, 13},
66 	{0x7e50, 0x7e54, 0x10, 6},
67 	{0x7e50, 0x7e54, 0x18, 8},
68 	{0x7e50, 0x7e54, 0x20, 13},
69 	{0x7e50, 0x7e54, 0x30, 16},
70 	{0x7e50, 0x7e54, 0x40, 16},
71 	{0x7e50, 0x7e54, 0x50, 16},
72 	{0x7e50, 0x7e54, 0x60, 6},
73 	{0x7e50, 0x7e54, 0x68, 4}
74 };
75 
76 static const u32 t5_sge_dbg_index_array[2][IREG_NUM_ELEM] = {
77 	{0x10cc, 0x10d0, 0x0, 16},
78 	{0x10cc, 0x10d4, 0x0, 16},
79 };
80 
81 static const u32 t6_sge_qbase_index_array[] = {
82 	/* 1 addr reg SGE_QBASE_INDEX and 4 data reg SGE_QBASE_MAP[0-3] */
83 	0x1250, 0x1240, 0x1244, 0x1248, 0x124c,
84 };
85 
86 static const u32 t5_pcie_pdbg_array[][IREG_NUM_ELEM] = {
87 	{0x5a04, 0x5a0c, 0x00, 0x20}, /* t5_pcie_pdbg_regs_00_to_20 */
88 	{0x5a04, 0x5a0c, 0x21, 0x20}, /* t5_pcie_pdbg_regs_21_to_40 */
89 	{0x5a04, 0x5a0c, 0x41, 0x10}, /* t5_pcie_pdbg_regs_41_to_50 */
90 };
91 
92 static const u32 t5_pcie_cdbg_array[][IREG_NUM_ELEM] = {
93 	{0x5a10, 0x5a18, 0x00, 0x20}, /* t5_pcie_cdbg_regs_00_to_20 */
94 	{0x5a10, 0x5a18, 0x21, 0x18}, /* t5_pcie_cdbg_regs_21_to_37 */
95 };
96 
97 static const u32 t5_pm_rx_array[][IREG_NUM_ELEM] = {
98 	{0x8FD0, 0x8FD4, 0x10000, 0x20}, /* t5_pm_rx_regs_10000_to_10020 */
99 	{0x8FD0, 0x8FD4, 0x10021, 0x0D}, /* t5_pm_rx_regs_10021_to_1002c */
100 };
101 
102 static const u32 t5_pm_tx_array[][IREG_NUM_ELEM] = {
103 	{0x8FF0, 0x8FF4, 0x10000, 0x20}, /* t5_pm_tx_regs_10000_to_10020 */
104 	{0x8FF0, 0x8FF4, 0x10021, 0x1D}, /* t5_pm_tx_regs_10021_to_1003c */
105 };
106 
107 static const u32 t5_pcie_config_array[][2] = {
108 	{0x0, 0x34},
109 	{0x3c, 0x40},
110 	{0x50, 0x64},
111 	{0x70, 0x80},
112 	{0x94, 0xa0},
113 	{0xb0, 0xb8},
114 	{0xd0, 0xd4},
115 	{0x100, 0x128},
116 	{0x140, 0x148},
117 	{0x150, 0x164},
118 	{0x170, 0x178},
119 	{0x180, 0x194},
120 	{0x1a0, 0x1b8},
121 	{0x1c0, 0x208},
122 };
123 
124 static const u32 t6_ma_ireg_array[][IREG_NUM_ELEM] = {
125 	{0x78f8, 0x78fc, 0xa000, 23}, /* t6_ma_regs_a000_to_a016 */
126 	{0x78f8, 0x78fc, 0xa400, 30}, /* t6_ma_regs_a400_to_a41e */
127 	{0x78f8, 0x78fc, 0xa800, 20} /* t6_ma_regs_a800_to_a813 */
128 };
129 
130 static const u32 t6_ma_ireg_array2[][IREG_NUM_ELEM] = {
131 	{0x78f8, 0x78fc, 0xe400, 17}, /* t6_ma_regs_e400_to_e600 */
132 	{0x78f8, 0x78fc, 0xe640, 13} /* t6_ma_regs_e640_to_e7c0 */
133 };
134 
135 static const u32 t6_up_cim_reg_array[][IREG_NUM_ELEM + 1] = {
136 	{0x7b50, 0x7b54, 0x2000, 0x20, 0}, /* up_cim_2000_to_207c */
137 	{0x7b50, 0x7b54, 0x2080, 0x1d, 0}, /* up_cim_2080_to_20fc */
138 	{0x7b50, 0x7b54, 0x00, 0x20, 0}, /* up_cim_00_to_7c */
139 	{0x7b50, 0x7b54, 0x80, 0x20, 0}, /* up_cim_80_to_fc */
140 	{0x7b50, 0x7b54, 0x100, 0x11, 0}, /* up_cim_100_to_14c */
141 	{0x7b50, 0x7b54, 0x200, 0x10, 0}, /* up_cim_200_to_23c */
142 	{0x7b50, 0x7b54, 0x240, 0x2, 0}, /* up_cim_240_to_244 */
143 	{0x7b50, 0x7b54, 0x250, 0x2, 0}, /* up_cim_250_to_254 */
144 	{0x7b50, 0x7b54, 0x260, 0x2, 0}, /* up_cim_260_to_264 */
145 	{0x7b50, 0x7b54, 0x270, 0x2, 0}, /* up_cim_270_to_274 */
146 	{0x7b50, 0x7b54, 0x280, 0x20, 0}, /* up_cim_280_to_2fc */
147 	{0x7b50, 0x7b54, 0x300, 0x20, 0}, /* up_cim_300_to_37c */
148 	{0x7b50, 0x7b54, 0x380, 0x14, 0}, /* up_cim_380_to_3cc */
149 	{0x7b50, 0x7b54, 0x4900, 0x4, 0x4}, /* up_cim_4900_to_4c60 */
150 	{0x7b50, 0x7b54, 0x4904, 0x4, 0x4}, /* up_cim_4904_to_4c64 */
151 	{0x7b50, 0x7b54, 0x4908, 0x4, 0x4}, /* up_cim_4908_to_4c68 */
152 	{0x7b50, 0x7b54, 0x4910, 0x4, 0x4}, /* up_cim_4910_to_4c70 */
153 	{0x7b50, 0x7b54, 0x4914, 0x4, 0x4}, /* up_cim_4914_to_4c74 */
154 	{0x7b50, 0x7b54, 0x4920, 0x10, 0x10}, /* up_cim_4920_to_4a10 */
155 	{0x7b50, 0x7b54, 0x4924, 0x10, 0x10}, /* up_cim_4924_to_4a14 */
156 	{0x7b50, 0x7b54, 0x4928, 0x10, 0x10}, /* up_cim_4928_to_4a18 */
157 	{0x7b50, 0x7b54, 0x492c, 0x10, 0x10}, /* up_cim_492c_to_4a1c */
158 };
159 
160 static const u32 t5_up_cim_reg_array[][IREG_NUM_ELEM + 1] = {
161 	{0x7b50, 0x7b54, 0x2000, 0x20, 0}, /* up_cim_2000_to_207c */
162 	{0x7b50, 0x7b54, 0x2080, 0x19, 0}, /* up_cim_2080_to_20ec */
163 	{0x7b50, 0x7b54, 0x00, 0x20, 0}, /* up_cim_00_to_7c */
164 	{0x7b50, 0x7b54, 0x80, 0x20, 0}, /* up_cim_80_to_fc */
165 	{0x7b50, 0x7b54, 0x100, 0x11, 0}, /* up_cim_100_to_14c */
166 	{0x7b50, 0x7b54, 0x200, 0x10, 0}, /* up_cim_200_to_23c */
167 	{0x7b50, 0x7b54, 0x240, 0x2, 0}, /* up_cim_240_to_244 */
168 	{0x7b50, 0x7b54, 0x250, 0x2, 0}, /* up_cim_250_to_254 */
169 	{0x7b50, 0x7b54, 0x260, 0x2, 0}, /* up_cim_260_to_264 */
170 	{0x7b50, 0x7b54, 0x270, 0x2, 0}, /* up_cim_270_to_274 */
171 	{0x7b50, 0x7b54, 0x280, 0x20, 0}, /* up_cim_280_to_2fc */
172 	{0x7b50, 0x7b54, 0x300, 0x20, 0}, /* up_cim_300_to_37c */
173 	{0x7b50, 0x7b54, 0x380, 0x14, 0}, /* up_cim_380_to_3cc */
174 };
175 
176 static const u32 t6_hma_ireg_array[][IREG_NUM_ELEM] = {
177 	{0x51320, 0x51324, 0xa000, 32} /* t6_hma_regs_a000_to_a01f */
178 };
179 
180 u32 cudbg_get_entity_length(struct adapter *adap, u32 entity)
181 {
182 	struct cudbg_tcam tcam_region = { 0 };
183 	u32 value, n = 0, len = 0;
184 
185 	switch (entity) {
186 	case CUDBG_REG_DUMP:
187 		switch (CHELSIO_CHIP_VERSION(adap->params.chip)) {
188 		case CHELSIO_T4:
189 			len = T4_REGMAP_SIZE;
190 			break;
191 		case CHELSIO_T5:
192 		case CHELSIO_T6:
193 			len = T5_REGMAP_SIZE;
194 			break;
195 		default:
196 			break;
197 		}
198 		break;
199 	case CUDBG_DEV_LOG:
200 		len = adap->params.devlog.size;
201 		break;
202 	case CUDBG_CIM_LA:
203 		if (is_t6(adap->params.chip)) {
204 			len = adap->params.cim_la_size / 10 + 1;
205 			len *= 10 * sizeof(u32);
206 		} else {
207 			len = adap->params.cim_la_size / 8;
208 			len *= 8 * sizeof(u32);
209 		}
210 		len += sizeof(u32); /* for reading CIM LA configuration */
211 		break;
212 	case CUDBG_CIM_MA_LA:
213 		len = 2 * CIM_MALA_SIZE * 5 * sizeof(u32);
214 		break;
215 	case CUDBG_CIM_QCFG:
216 		len = sizeof(struct cudbg_cim_qcfg);
217 		break;
218 	case CUDBG_CIM_IBQ_TP0:
219 	case CUDBG_CIM_IBQ_TP1:
220 	case CUDBG_CIM_IBQ_ULP:
221 	case CUDBG_CIM_IBQ_SGE0:
222 	case CUDBG_CIM_IBQ_SGE1:
223 	case CUDBG_CIM_IBQ_NCSI:
224 		len = CIM_IBQ_SIZE * 4 * sizeof(u32);
225 		break;
226 	case CUDBG_CIM_OBQ_ULP0:
227 		len = cudbg_cim_obq_size(adap, 0);
228 		break;
229 	case CUDBG_CIM_OBQ_ULP1:
230 		len = cudbg_cim_obq_size(adap, 1);
231 		break;
232 	case CUDBG_CIM_OBQ_ULP2:
233 		len = cudbg_cim_obq_size(adap, 2);
234 		break;
235 	case CUDBG_CIM_OBQ_ULP3:
236 		len = cudbg_cim_obq_size(adap, 3);
237 		break;
238 	case CUDBG_CIM_OBQ_SGE:
239 		len = cudbg_cim_obq_size(adap, 4);
240 		break;
241 	case CUDBG_CIM_OBQ_NCSI:
242 		len = cudbg_cim_obq_size(adap, 5);
243 		break;
244 	case CUDBG_CIM_OBQ_RXQ0:
245 		len = cudbg_cim_obq_size(adap, 6);
246 		break;
247 	case CUDBG_CIM_OBQ_RXQ1:
248 		len = cudbg_cim_obq_size(adap, 7);
249 		break;
250 	case CUDBG_EDC0:
251 		value = t4_read_reg(adap, MA_TARGET_MEM_ENABLE_A);
252 		if (value & EDRAM0_ENABLE_F) {
253 			value = t4_read_reg(adap, MA_EDRAM0_BAR_A);
254 			len = EDRAM0_SIZE_G(value);
255 		}
256 		len = cudbg_mbytes_to_bytes(len);
257 		break;
258 	case CUDBG_EDC1:
259 		value = t4_read_reg(adap, MA_TARGET_MEM_ENABLE_A);
260 		if (value & EDRAM1_ENABLE_F) {
261 			value = t4_read_reg(adap, MA_EDRAM1_BAR_A);
262 			len = EDRAM1_SIZE_G(value);
263 		}
264 		len = cudbg_mbytes_to_bytes(len);
265 		break;
266 	case CUDBG_MC0:
267 		value = t4_read_reg(adap, MA_TARGET_MEM_ENABLE_A);
268 		if (value & EXT_MEM0_ENABLE_F) {
269 			value = t4_read_reg(adap, MA_EXT_MEMORY0_BAR_A);
270 			len = EXT_MEM0_SIZE_G(value);
271 		}
272 		len = cudbg_mbytes_to_bytes(len);
273 		break;
274 	case CUDBG_MC1:
275 		value = t4_read_reg(adap, MA_TARGET_MEM_ENABLE_A);
276 		if (value & EXT_MEM1_ENABLE_F) {
277 			value = t4_read_reg(adap, MA_EXT_MEMORY1_BAR_A);
278 			len = EXT_MEM1_SIZE_G(value);
279 		}
280 		len = cudbg_mbytes_to_bytes(len);
281 		break;
282 	case CUDBG_RSS:
283 		len = t4_chip_rss_size(adap) * sizeof(u16);
284 		break;
285 	case CUDBG_RSS_VF_CONF:
286 		len = adap->params.arch.vfcount *
287 		      sizeof(struct cudbg_rss_vf_conf);
288 		break;
289 	case CUDBG_PATH_MTU:
290 		len = NMTUS * sizeof(u16);
291 		break;
292 	case CUDBG_PM_STATS:
293 		len = sizeof(struct cudbg_pm_stats);
294 		break;
295 	case CUDBG_HW_SCHED:
296 		len = sizeof(struct cudbg_hw_sched);
297 		break;
298 	case CUDBG_TP_INDIRECT:
299 		switch (CHELSIO_CHIP_VERSION(adap->params.chip)) {
300 		case CHELSIO_T5:
301 			n = sizeof(t5_tp_pio_array) +
302 			    sizeof(t5_tp_tm_pio_array) +
303 			    sizeof(t5_tp_mib_index_array);
304 			break;
305 		case CHELSIO_T6:
306 			n = sizeof(t6_tp_pio_array) +
307 			    sizeof(t6_tp_tm_pio_array) +
308 			    sizeof(t6_tp_mib_index_array);
309 			break;
310 		default:
311 			break;
312 		}
313 		n = n / (IREG_NUM_ELEM * sizeof(u32));
314 		len = sizeof(struct ireg_buf) * n;
315 		break;
316 	case CUDBG_SGE_INDIRECT:
317 		len = sizeof(struct ireg_buf) * 2 +
318 		      sizeof(struct sge_qbase_reg_field);
319 		break;
320 	case CUDBG_ULPRX_LA:
321 		len = sizeof(struct cudbg_ulprx_la);
322 		break;
323 	case CUDBG_TP_LA:
324 		len = sizeof(struct cudbg_tp_la) + TPLA_SIZE * sizeof(u64);
325 		break;
326 	case CUDBG_MEMINFO:
327 		len = sizeof(struct cudbg_ver_hdr) +
328 		      sizeof(struct cudbg_meminfo);
329 		break;
330 	case CUDBG_CIM_PIF_LA:
331 		len = sizeof(struct cudbg_cim_pif_la);
332 		len += 2 * CIM_PIFLA_SIZE * 6 * sizeof(u32);
333 		break;
334 	case CUDBG_CLK:
335 		len = sizeof(struct cudbg_clk_info);
336 		break;
337 	case CUDBG_PCIE_INDIRECT:
338 		n = sizeof(t5_pcie_pdbg_array) / (IREG_NUM_ELEM * sizeof(u32));
339 		len = sizeof(struct ireg_buf) * n * 2;
340 		break;
341 	case CUDBG_PM_INDIRECT:
342 		n = sizeof(t5_pm_rx_array) / (IREG_NUM_ELEM * sizeof(u32));
343 		len = sizeof(struct ireg_buf) * n * 2;
344 		break;
345 	case CUDBG_TID_INFO:
346 		len = sizeof(struct cudbg_tid_info_region_rev1);
347 		break;
348 	case CUDBG_PCIE_CONFIG:
349 		len = sizeof(u32) * CUDBG_NUM_PCIE_CONFIG_REGS;
350 		break;
351 	case CUDBG_DUMP_CONTEXT:
352 		len = cudbg_dump_context_size(adap);
353 		break;
354 	case CUDBG_MPS_TCAM:
355 		len = sizeof(struct cudbg_mps_tcam) *
356 		      adap->params.arch.mps_tcam_size;
357 		break;
358 	case CUDBG_VPD_DATA:
359 		len = sizeof(struct cudbg_vpd_data);
360 		break;
361 	case CUDBG_LE_TCAM:
362 		cudbg_fill_le_tcam_info(adap, &tcam_region);
363 		len = sizeof(struct cudbg_tcam) +
364 		      sizeof(struct cudbg_tid_data) * tcam_region.max_tid;
365 		break;
366 	case CUDBG_CCTRL:
367 		len = sizeof(u16) * NMTUS * NCCTRL_WIN;
368 		break;
369 	case CUDBG_MA_INDIRECT:
370 		if (CHELSIO_CHIP_VERSION(adap->params.chip) > CHELSIO_T5) {
371 			n = sizeof(t6_ma_ireg_array) /
372 			    (IREG_NUM_ELEM * sizeof(u32));
373 			len = sizeof(struct ireg_buf) * n * 2;
374 		}
375 		break;
376 	case CUDBG_ULPTX_LA:
377 		len = sizeof(struct cudbg_ver_hdr) +
378 		      sizeof(struct cudbg_ulptx_la);
379 		break;
380 	case CUDBG_UP_CIM_INDIRECT:
381 		n = 0;
382 		if (is_t5(adap->params.chip))
383 			n = sizeof(t5_up_cim_reg_array) /
384 			    ((IREG_NUM_ELEM + 1) * sizeof(u32));
385 		else if (is_t6(adap->params.chip))
386 			n = sizeof(t6_up_cim_reg_array) /
387 			    ((IREG_NUM_ELEM + 1) * sizeof(u32));
388 		len = sizeof(struct ireg_buf) * n;
389 		break;
390 	case CUDBG_PBT_TABLE:
391 		len = sizeof(struct cudbg_pbt_tables);
392 		break;
393 	case CUDBG_MBOX_LOG:
394 		len = sizeof(struct cudbg_mbox_log) * adap->mbox_log->size;
395 		break;
396 	case CUDBG_HMA_INDIRECT:
397 		if (CHELSIO_CHIP_VERSION(adap->params.chip) > CHELSIO_T5) {
398 			n = sizeof(t6_hma_ireg_array) /
399 			    (IREG_NUM_ELEM * sizeof(u32));
400 			len = sizeof(struct ireg_buf) * n;
401 		}
402 		break;
403 	case CUDBG_HMA:
404 		value = t4_read_reg(adap, MA_TARGET_MEM_ENABLE_A);
405 		if (value & HMA_MUX_F) {
406 			/* In T6, there's no MC1.  So, HMA shares MC1
407 			 * address space.
408 			 */
409 			value = t4_read_reg(adap, MA_EXT_MEMORY1_BAR_A);
410 			len = EXT_MEM1_SIZE_G(value);
411 		}
412 		len = cudbg_mbytes_to_bytes(len);
413 		break;
414 	case CUDBG_QDESC:
415 		cudbg_fill_qdesc_num_and_size(adap, NULL, &len);
416 		break;
417 	default:
418 		break;
419 	}
420 
421 	return len;
422 }
423 
424 static int cudbg_do_compression(struct cudbg_init *pdbg_init,
425 				struct cudbg_buffer *pin_buff,
426 				struct cudbg_buffer *dbg_buff)
427 {
428 	struct cudbg_buffer temp_in_buff = { 0 };
429 	int bytes_left, bytes_read, bytes;
430 	u32 offset = dbg_buff->offset;
431 	int rc;
432 
433 	temp_in_buff.offset = pin_buff->offset;
434 	temp_in_buff.data = pin_buff->data;
435 	temp_in_buff.size = pin_buff->size;
436 
437 	bytes_left = pin_buff->size;
438 	bytes_read = 0;
439 	while (bytes_left > 0) {
440 		/* Do compression in smaller chunks */
441 		bytes = min_t(unsigned long, bytes_left,
442 			      (unsigned long)CUDBG_CHUNK_SIZE);
443 		temp_in_buff.data = (char *)pin_buff->data + bytes_read;
444 		temp_in_buff.size = bytes;
445 		rc = cudbg_compress_buff(pdbg_init, &temp_in_buff, dbg_buff);
446 		if (rc)
447 			return rc;
448 		bytes_left -= bytes;
449 		bytes_read += bytes;
450 	}
451 
452 	pin_buff->size = dbg_buff->offset - offset;
453 	return 0;
454 }
455 
456 static int cudbg_write_and_release_buff(struct cudbg_init *pdbg_init,
457 					struct cudbg_buffer *pin_buff,
458 					struct cudbg_buffer *dbg_buff)
459 {
460 	int rc = 0;
461 
462 	if (pdbg_init->compress_type == CUDBG_COMPRESSION_NONE) {
463 		cudbg_update_buff(pin_buff, dbg_buff);
464 	} else {
465 		rc = cudbg_do_compression(pdbg_init, pin_buff, dbg_buff);
466 		if (rc)
467 			goto out;
468 	}
469 
470 out:
471 	cudbg_put_buff(pdbg_init, pin_buff);
472 	return rc;
473 }
474 
475 static int is_fw_attached(struct cudbg_init *pdbg_init)
476 {
477 	struct adapter *padap = pdbg_init->adap;
478 
479 	if (!(padap->flags & CXGB4_FW_OK) || padap->use_bd)
480 		return 0;
481 
482 	return 1;
483 }
484 
485 /* This function will add additional padding bytes into debug_buffer to make it
486  * 4 byte aligned.
487  */
488 void cudbg_align_debug_buffer(struct cudbg_buffer *dbg_buff,
489 			      struct cudbg_entity_hdr *entity_hdr)
490 {
491 	u8 zero_buf[4] = {0};
492 	u8 padding, remain;
493 
494 	remain = (dbg_buff->offset - entity_hdr->start_offset) % 4;
495 	padding = 4 - remain;
496 	if (remain) {
497 		memcpy(((u8 *)dbg_buff->data) + dbg_buff->offset, &zero_buf,
498 		       padding);
499 		dbg_buff->offset += padding;
500 		entity_hdr->num_pad = padding;
501 	}
502 	entity_hdr->size = dbg_buff->offset - entity_hdr->start_offset;
503 }
504 
505 struct cudbg_entity_hdr *cudbg_get_entity_hdr(void *outbuf, int i)
506 {
507 	struct cudbg_hdr *cudbg_hdr = (struct cudbg_hdr *)outbuf;
508 
509 	return (struct cudbg_entity_hdr *)
510 	       ((char *)outbuf + cudbg_hdr->hdr_len +
511 		(sizeof(struct cudbg_entity_hdr) * (i - 1)));
512 }
513 
514 static int cudbg_read_vpd_reg(struct adapter *padap, u32 addr, u32 len,
515 			      void *dest)
516 {
517 	int vaddr, rc;
518 
519 	vaddr = t4_eeprom_ptov(addr, padap->pf, EEPROMPFSIZE);
520 	if (vaddr < 0)
521 		return vaddr;
522 
523 	rc = pci_read_vpd(padap->pdev, vaddr, len, dest);
524 	if (rc < 0)
525 		return rc;
526 
527 	return 0;
528 }
529 
530 static int cudbg_mem_desc_cmp(const void *a, const void *b)
531 {
532 	return ((const struct cudbg_mem_desc *)a)->base -
533 	       ((const struct cudbg_mem_desc *)b)->base;
534 }
535 
536 int cudbg_fill_meminfo(struct adapter *padap,
537 		       struct cudbg_meminfo *meminfo_buff)
538 {
539 	struct cudbg_mem_desc *md;
540 	u32 lo, hi, used, alloc;
541 	int n, i;
542 
543 	memset(meminfo_buff->avail, 0,
544 	       ARRAY_SIZE(meminfo_buff->avail) *
545 	       sizeof(struct cudbg_mem_desc));
546 	memset(meminfo_buff->mem, 0,
547 	       (ARRAY_SIZE(cudbg_region) + 3) * sizeof(struct cudbg_mem_desc));
548 	md  = meminfo_buff->mem;
549 
550 	for (i = 0; i < ARRAY_SIZE(meminfo_buff->mem); i++) {
551 		meminfo_buff->mem[i].limit = 0;
552 		meminfo_buff->mem[i].idx = i;
553 	}
554 
555 	/* Find and sort the populated memory ranges */
556 	i = 0;
557 	lo = t4_read_reg(padap, MA_TARGET_MEM_ENABLE_A);
558 	if (lo & EDRAM0_ENABLE_F) {
559 		hi = t4_read_reg(padap, MA_EDRAM0_BAR_A);
560 		meminfo_buff->avail[i].base =
561 			cudbg_mbytes_to_bytes(EDRAM0_BASE_G(hi));
562 		meminfo_buff->avail[i].limit =
563 			meminfo_buff->avail[i].base +
564 			cudbg_mbytes_to_bytes(EDRAM0_SIZE_G(hi));
565 		meminfo_buff->avail[i].idx = 0;
566 		i++;
567 	}
568 
569 	if (lo & EDRAM1_ENABLE_F) {
570 		hi =  t4_read_reg(padap, MA_EDRAM1_BAR_A);
571 		meminfo_buff->avail[i].base =
572 			cudbg_mbytes_to_bytes(EDRAM1_BASE_G(hi));
573 		meminfo_buff->avail[i].limit =
574 			meminfo_buff->avail[i].base +
575 			cudbg_mbytes_to_bytes(EDRAM1_SIZE_G(hi));
576 		meminfo_buff->avail[i].idx = 1;
577 		i++;
578 	}
579 
580 	if (is_t5(padap->params.chip)) {
581 		if (lo & EXT_MEM0_ENABLE_F) {
582 			hi = t4_read_reg(padap, MA_EXT_MEMORY0_BAR_A);
583 			meminfo_buff->avail[i].base =
584 				cudbg_mbytes_to_bytes(EXT_MEM_BASE_G(hi));
585 			meminfo_buff->avail[i].limit =
586 				meminfo_buff->avail[i].base +
587 				cudbg_mbytes_to_bytes(EXT_MEM_SIZE_G(hi));
588 			meminfo_buff->avail[i].idx = 3;
589 			i++;
590 		}
591 
592 		if (lo & EXT_MEM1_ENABLE_F) {
593 			hi = t4_read_reg(padap, MA_EXT_MEMORY1_BAR_A);
594 			meminfo_buff->avail[i].base =
595 				cudbg_mbytes_to_bytes(EXT_MEM1_BASE_G(hi));
596 			meminfo_buff->avail[i].limit =
597 				meminfo_buff->avail[i].base +
598 				cudbg_mbytes_to_bytes(EXT_MEM1_SIZE_G(hi));
599 			meminfo_buff->avail[i].idx = 4;
600 			i++;
601 		}
602 	} else {
603 		if (lo & EXT_MEM_ENABLE_F) {
604 			hi = t4_read_reg(padap, MA_EXT_MEMORY_BAR_A);
605 			meminfo_buff->avail[i].base =
606 				cudbg_mbytes_to_bytes(EXT_MEM_BASE_G(hi));
607 			meminfo_buff->avail[i].limit =
608 				meminfo_buff->avail[i].base +
609 				cudbg_mbytes_to_bytes(EXT_MEM_SIZE_G(hi));
610 			meminfo_buff->avail[i].idx = 2;
611 			i++;
612 		}
613 
614 		if (lo & HMA_MUX_F) {
615 			hi = t4_read_reg(padap, MA_EXT_MEMORY1_BAR_A);
616 			meminfo_buff->avail[i].base =
617 				cudbg_mbytes_to_bytes(EXT_MEM1_BASE_G(hi));
618 			meminfo_buff->avail[i].limit =
619 				meminfo_buff->avail[i].base +
620 				cudbg_mbytes_to_bytes(EXT_MEM1_SIZE_G(hi));
621 			meminfo_buff->avail[i].idx = 5;
622 			i++;
623 		}
624 	}
625 
626 	if (!i) /* no memory available */
627 		return CUDBG_STATUS_ENTITY_NOT_FOUND;
628 
629 	meminfo_buff->avail_c = i;
630 	sort(meminfo_buff->avail, i, sizeof(struct cudbg_mem_desc),
631 	     cudbg_mem_desc_cmp, NULL);
632 	(md++)->base = t4_read_reg(padap, SGE_DBQ_CTXT_BADDR_A);
633 	(md++)->base = t4_read_reg(padap, SGE_IMSG_CTXT_BADDR_A);
634 	(md++)->base = t4_read_reg(padap, SGE_FLM_CACHE_BADDR_A);
635 	(md++)->base = t4_read_reg(padap, TP_CMM_TCB_BASE_A);
636 	(md++)->base = t4_read_reg(padap, TP_CMM_MM_BASE_A);
637 	(md++)->base = t4_read_reg(padap, TP_CMM_TIMER_BASE_A);
638 	(md++)->base = t4_read_reg(padap, TP_CMM_MM_RX_FLST_BASE_A);
639 	(md++)->base = t4_read_reg(padap, TP_CMM_MM_TX_FLST_BASE_A);
640 	(md++)->base = t4_read_reg(padap, TP_CMM_MM_PS_FLST_BASE_A);
641 
642 	/* the next few have explicit upper bounds */
643 	md->base = t4_read_reg(padap, TP_PMM_TX_BASE_A);
644 	md->limit = md->base - 1 +
645 		    t4_read_reg(padap, TP_PMM_TX_PAGE_SIZE_A) *
646 		    PMTXMAXPAGE_G(t4_read_reg(padap, TP_PMM_TX_MAX_PAGE_A));
647 	md++;
648 
649 	md->base = t4_read_reg(padap, TP_PMM_RX_BASE_A);
650 	md->limit = md->base - 1 +
651 		    t4_read_reg(padap, TP_PMM_RX_PAGE_SIZE_A) *
652 		    PMRXMAXPAGE_G(t4_read_reg(padap, TP_PMM_RX_MAX_PAGE_A));
653 	md++;
654 
655 	if (t4_read_reg(padap, LE_DB_CONFIG_A) & HASHEN_F) {
656 		if (CHELSIO_CHIP_VERSION(padap->params.chip) <= CHELSIO_T5) {
657 			hi = t4_read_reg(padap, LE_DB_TID_HASHBASE_A) / 4;
658 			md->base = t4_read_reg(padap, LE_DB_HASH_TID_BASE_A);
659 		} else {
660 			hi = t4_read_reg(padap, LE_DB_HASH_TID_BASE_A);
661 			md->base = t4_read_reg(padap,
662 					       LE_DB_HASH_TBL_BASE_ADDR_A);
663 		}
664 		md->limit = 0;
665 	} else {
666 		md->base = 0;
667 		md->idx = ARRAY_SIZE(cudbg_region);  /* hide it */
668 	}
669 	md++;
670 
671 #define ulp_region(reg) do { \
672 	md->base = t4_read_reg(padap, ULP_ ## reg ## _LLIMIT_A);\
673 	(md++)->limit = t4_read_reg(padap, ULP_ ## reg ## _ULIMIT_A);\
674 } while (0)
675 
676 	ulp_region(RX_ISCSI);
677 	ulp_region(RX_TDDP);
678 	ulp_region(TX_TPT);
679 	ulp_region(RX_STAG);
680 	ulp_region(RX_RQ);
681 	ulp_region(RX_RQUDP);
682 	ulp_region(RX_PBL);
683 	ulp_region(TX_PBL);
684 #undef ulp_region
685 	md->base = 0;
686 	md->idx = ARRAY_SIZE(cudbg_region);
687 	if (!is_t4(padap->params.chip)) {
688 		u32 fifo_size = t4_read_reg(padap, SGE_DBVFIFO_SIZE_A);
689 		u32 sge_ctrl = t4_read_reg(padap, SGE_CONTROL2_A);
690 		u32 size = 0;
691 
692 		if (is_t5(padap->params.chip)) {
693 			if (sge_ctrl & VFIFO_ENABLE_F)
694 				size = DBVFIFO_SIZE_G(fifo_size);
695 		} else {
696 			size = T6_DBVFIFO_SIZE_G(fifo_size);
697 		}
698 
699 		if (size) {
700 			md->base = BASEADDR_G(t4_read_reg(padap,
701 							  SGE_DBVFIFO_BADDR_A));
702 			md->limit = md->base + (size << 2) - 1;
703 		}
704 	}
705 
706 	md++;
707 
708 	md->base = t4_read_reg(padap, ULP_RX_CTX_BASE_A);
709 	md->limit = 0;
710 	md++;
711 	md->base = t4_read_reg(padap, ULP_TX_ERR_TABLE_BASE_A);
712 	md->limit = 0;
713 	md++;
714 
715 	md->base = padap->vres.ocq.start;
716 	if (padap->vres.ocq.size)
717 		md->limit = md->base + padap->vres.ocq.size - 1;
718 	else
719 		md->idx = ARRAY_SIZE(cudbg_region);  /* hide it */
720 	md++;
721 
722 	/* add any address-space holes, there can be up to 3 */
723 	for (n = 0; n < i - 1; n++)
724 		if (meminfo_buff->avail[n].limit <
725 		    meminfo_buff->avail[n + 1].base)
726 			(md++)->base = meminfo_buff->avail[n].limit;
727 
728 	if (meminfo_buff->avail[n].limit)
729 		(md++)->base = meminfo_buff->avail[n].limit;
730 
731 	n = md - meminfo_buff->mem;
732 	meminfo_buff->mem_c = n;
733 
734 	sort(meminfo_buff->mem, n, sizeof(struct cudbg_mem_desc),
735 	     cudbg_mem_desc_cmp, NULL);
736 
737 	lo = t4_read_reg(padap, CIM_SDRAM_BASE_ADDR_A);
738 	hi = t4_read_reg(padap, CIM_SDRAM_ADDR_SIZE_A) + lo - 1;
739 	meminfo_buff->up_ram_lo = lo;
740 	meminfo_buff->up_ram_hi = hi;
741 
742 	lo = t4_read_reg(padap, CIM_EXTMEM2_BASE_ADDR_A);
743 	hi = t4_read_reg(padap, CIM_EXTMEM2_ADDR_SIZE_A) + lo - 1;
744 	meminfo_buff->up_extmem2_lo = lo;
745 	meminfo_buff->up_extmem2_hi = hi;
746 
747 	lo = t4_read_reg(padap, TP_PMM_RX_MAX_PAGE_A);
748 	for (i = 0, meminfo_buff->free_rx_cnt = 0; i < 2; i++)
749 		meminfo_buff->free_rx_cnt +=
750 			FREERXPAGECOUNT_G(t4_read_reg(padap,
751 						      TP_FLM_FREE_RX_CNT_A));
752 
753 	meminfo_buff->rx_pages_data[0] =  PMRXMAXPAGE_G(lo);
754 	meminfo_buff->rx_pages_data[1] =
755 		t4_read_reg(padap, TP_PMM_RX_PAGE_SIZE_A) >> 10;
756 	meminfo_buff->rx_pages_data[2] = (lo & PMRXNUMCHN_F) ? 2 : 1;
757 
758 	lo = t4_read_reg(padap, TP_PMM_TX_MAX_PAGE_A);
759 	hi = t4_read_reg(padap, TP_PMM_TX_PAGE_SIZE_A);
760 	for (i = 0, meminfo_buff->free_tx_cnt = 0; i < 4; i++)
761 		meminfo_buff->free_tx_cnt +=
762 			FREETXPAGECOUNT_G(t4_read_reg(padap,
763 						      TP_FLM_FREE_TX_CNT_A));
764 
765 	meminfo_buff->tx_pages_data[0] = PMTXMAXPAGE_G(lo);
766 	meminfo_buff->tx_pages_data[1] =
767 		hi >= (1 << 20) ? (hi >> 20) : (hi >> 10);
768 	meminfo_buff->tx_pages_data[2] =
769 		hi >= (1 << 20) ? 'M' : 'K';
770 	meminfo_buff->tx_pages_data[3] = 1 << PMTXNUMCHN_G(lo);
771 
772 	meminfo_buff->p_structs = t4_read_reg(padap, TP_CMM_MM_MAX_PSTRUCT_A);
773 	meminfo_buff->p_structs_free_cnt =
774 		FREEPSTRUCTCOUNT_G(t4_read_reg(padap, TP_FLM_FREE_PS_CNT_A));
775 
776 	for (i = 0; i < 4; i++) {
777 		if (CHELSIO_CHIP_VERSION(padap->params.chip) > CHELSIO_T5)
778 			lo = t4_read_reg(padap,
779 					 MPS_RX_MAC_BG_PG_CNT0_A + i * 4);
780 		else
781 			lo = t4_read_reg(padap, MPS_RX_PG_RSV0_A + i * 4);
782 		if (is_t5(padap->params.chip)) {
783 			used = T5_USED_G(lo);
784 			alloc = T5_ALLOC_G(lo);
785 		} else {
786 			used = USED_G(lo);
787 			alloc = ALLOC_G(lo);
788 		}
789 		meminfo_buff->port_used[i] = used;
790 		meminfo_buff->port_alloc[i] = alloc;
791 	}
792 
793 	for (i = 0; i < padap->params.arch.nchan; i++) {
794 		if (CHELSIO_CHIP_VERSION(padap->params.chip) > CHELSIO_T5)
795 			lo = t4_read_reg(padap,
796 					 MPS_RX_LPBK_BG_PG_CNT0_A + i * 4);
797 		else
798 			lo = t4_read_reg(padap, MPS_RX_PG_RSV4_A + i * 4);
799 		if (is_t5(padap->params.chip)) {
800 			used = T5_USED_G(lo);
801 			alloc = T5_ALLOC_G(lo);
802 		} else {
803 			used = USED_G(lo);
804 			alloc = ALLOC_G(lo);
805 		}
806 		meminfo_buff->loopback_used[i] = used;
807 		meminfo_buff->loopback_alloc[i] = alloc;
808 	}
809 
810 	return 0;
811 }
812 
813 int cudbg_collect_reg_dump(struct cudbg_init *pdbg_init,
814 			   struct cudbg_buffer *dbg_buff,
815 			   struct cudbg_error *cudbg_err)
816 {
817 	struct adapter *padap = pdbg_init->adap;
818 	struct cudbg_buffer temp_buff = { 0 };
819 	u32 buf_size = 0;
820 	int rc = 0;
821 
822 	if (is_t4(padap->params.chip))
823 		buf_size = T4_REGMAP_SIZE;
824 	else if (is_t5(padap->params.chip) || is_t6(padap->params.chip))
825 		buf_size = T5_REGMAP_SIZE;
826 
827 	rc = cudbg_get_buff(pdbg_init, dbg_buff, buf_size, &temp_buff);
828 	if (rc)
829 		return rc;
830 	t4_get_regs(padap, (void *)temp_buff.data, temp_buff.size);
831 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
832 }
833 
834 int cudbg_collect_fw_devlog(struct cudbg_init *pdbg_init,
835 			    struct cudbg_buffer *dbg_buff,
836 			    struct cudbg_error *cudbg_err)
837 {
838 	struct adapter *padap = pdbg_init->adap;
839 	struct cudbg_buffer temp_buff = { 0 };
840 	struct devlog_params *dparams;
841 	int rc = 0;
842 
843 	rc = t4_init_devlog_params(padap);
844 	if (rc < 0) {
845 		cudbg_err->sys_err = rc;
846 		return rc;
847 	}
848 
849 	dparams = &padap->params.devlog;
850 	rc = cudbg_get_buff(pdbg_init, dbg_buff, dparams->size, &temp_buff);
851 	if (rc)
852 		return rc;
853 
854 	/* Collect FW devlog */
855 	if (dparams->start != 0) {
856 		spin_lock(&padap->win0_lock);
857 		rc = t4_memory_rw(padap, padap->params.drv_memwin,
858 				  dparams->memtype, dparams->start,
859 				  dparams->size,
860 				  (__be32 *)(char *)temp_buff.data,
861 				  1);
862 		spin_unlock(&padap->win0_lock);
863 		if (rc) {
864 			cudbg_err->sys_err = rc;
865 			cudbg_put_buff(pdbg_init, &temp_buff);
866 			return rc;
867 		}
868 	}
869 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
870 }
871 
872 int cudbg_collect_cim_la(struct cudbg_init *pdbg_init,
873 			 struct cudbg_buffer *dbg_buff,
874 			 struct cudbg_error *cudbg_err)
875 {
876 	struct adapter *padap = pdbg_init->adap;
877 	struct cudbg_buffer temp_buff = { 0 };
878 	int size, rc;
879 	u32 cfg = 0;
880 
881 	if (is_t6(padap->params.chip)) {
882 		size = padap->params.cim_la_size / 10 + 1;
883 		size *= 10 * sizeof(u32);
884 	} else {
885 		size = padap->params.cim_la_size / 8;
886 		size *= 8 * sizeof(u32);
887 	}
888 
889 	size += sizeof(cfg);
890 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
891 	if (rc)
892 		return rc;
893 
894 	rc = t4_cim_read(padap, UP_UP_DBG_LA_CFG_A, 1, &cfg);
895 	if (rc) {
896 		cudbg_err->sys_err = rc;
897 		cudbg_put_buff(pdbg_init, &temp_buff);
898 		return rc;
899 	}
900 
901 	memcpy((char *)temp_buff.data, &cfg, sizeof(cfg));
902 	rc = t4_cim_read_la(padap,
903 			    (u32 *)((char *)temp_buff.data + sizeof(cfg)),
904 			    NULL);
905 	if (rc < 0) {
906 		cudbg_err->sys_err = rc;
907 		cudbg_put_buff(pdbg_init, &temp_buff);
908 		return rc;
909 	}
910 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
911 }
912 
913 int cudbg_collect_cim_ma_la(struct cudbg_init *pdbg_init,
914 			    struct cudbg_buffer *dbg_buff,
915 			    struct cudbg_error *cudbg_err)
916 {
917 	struct adapter *padap = pdbg_init->adap;
918 	struct cudbg_buffer temp_buff = { 0 };
919 	int size, rc;
920 
921 	size = 2 * CIM_MALA_SIZE * 5 * sizeof(u32);
922 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
923 	if (rc)
924 		return rc;
925 
926 	t4_cim_read_ma_la(padap,
927 			  (u32 *)temp_buff.data,
928 			  (u32 *)((char *)temp_buff.data +
929 				  5 * CIM_MALA_SIZE));
930 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
931 }
932 
933 int cudbg_collect_cim_qcfg(struct cudbg_init *pdbg_init,
934 			   struct cudbg_buffer *dbg_buff,
935 			   struct cudbg_error *cudbg_err)
936 {
937 	struct adapter *padap = pdbg_init->adap;
938 	struct cudbg_buffer temp_buff = { 0 };
939 	struct cudbg_cim_qcfg *cim_qcfg_data;
940 	int rc;
941 
942 	rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_cim_qcfg),
943 			    &temp_buff);
944 	if (rc)
945 		return rc;
946 
947 	cim_qcfg_data = (struct cudbg_cim_qcfg *)temp_buff.data;
948 	cim_qcfg_data->chip = padap->params.chip;
949 	rc = t4_cim_read(padap, UP_IBQ_0_RDADDR_A,
950 			 ARRAY_SIZE(cim_qcfg_data->stat), cim_qcfg_data->stat);
951 	if (rc) {
952 		cudbg_err->sys_err = rc;
953 		cudbg_put_buff(pdbg_init, &temp_buff);
954 		return rc;
955 	}
956 
957 	rc = t4_cim_read(padap, UP_OBQ_0_REALADDR_A,
958 			 ARRAY_SIZE(cim_qcfg_data->obq_wr),
959 			 cim_qcfg_data->obq_wr);
960 	if (rc) {
961 		cudbg_err->sys_err = rc;
962 		cudbg_put_buff(pdbg_init, &temp_buff);
963 		return rc;
964 	}
965 
966 	t4_read_cimq_cfg(padap, cim_qcfg_data->base, cim_qcfg_data->size,
967 			 cim_qcfg_data->thres);
968 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
969 }
970 
971 static int cudbg_read_cim_ibq(struct cudbg_init *pdbg_init,
972 			      struct cudbg_buffer *dbg_buff,
973 			      struct cudbg_error *cudbg_err, int qid)
974 {
975 	struct adapter *padap = pdbg_init->adap;
976 	struct cudbg_buffer temp_buff = { 0 };
977 	int no_of_read_words, rc = 0;
978 	u32 qsize;
979 
980 	/* collect CIM IBQ */
981 	qsize = CIM_IBQ_SIZE * 4 * sizeof(u32);
982 	rc = cudbg_get_buff(pdbg_init, dbg_buff, qsize, &temp_buff);
983 	if (rc)
984 		return rc;
985 
986 	/* t4_read_cim_ibq will return no. of read words or error */
987 	no_of_read_words = t4_read_cim_ibq(padap, qid,
988 					   (u32 *)temp_buff.data, qsize);
989 	/* no_of_read_words is less than or equal to 0 means error */
990 	if (no_of_read_words <= 0) {
991 		if (!no_of_read_words)
992 			rc = CUDBG_SYSTEM_ERROR;
993 		else
994 			rc = no_of_read_words;
995 		cudbg_err->sys_err = rc;
996 		cudbg_put_buff(pdbg_init, &temp_buff);
997 		return rc;
998 	}
999 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1000 }
1001 
1002 int cudbg_collect_cim_ibq_tp0(struct cudbg_init *pdbg_init,
1003 			      struct cudbg_buffer *dbg_buff,
1004 			      struct cudbg_error *cudbg_err)
1005 {
1006 	return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 0);
1007 }
1008 
1009 int cudbg_collect_cim_ibq_tp1(struct cudbg_init *pdbg_init,
1010 			      struct cudbg_buffer *dbg_buff,
1011 			      struct cudbg_error *cudbg_err)
1012 {
1013 	return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 1);
1014 }
1015 
1016 int cudbg_collect_cim_ibq_ulp(struct cudbg_init *pdbg_init,
1017 			      struct cudbg_buffer *dbg_buff,
1018 			      struct cudbg_error *cudbg_err)
1019 {
1020 	return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 2);
1021 }
1022 
1023 int cudbg_collect_cim_ibq_sge0(struct cudbg_init *pdbg_init,
1024 			       struct cudbg_buffer *dbg_buff,
1025 			       struct cudbg_error *cudbg_err)
1026 {
1027 	return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 3);
1028 }
1029 
1030 int cudbg_collect_cim_ibq_sge1(struct cudbg_init *pdbg_init,
1031 			       struct cudbg_buffer *dbg_buff,
1032 			       struct cudbg_error *cudbg_err)
1033 {
1034 	return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 4);
1035 }
1036 
1037 int cudbg_collect_cim_ibq_ncsi(struct cudbg_init *pdbg_init,
1038 			       struct cudbg_buffer *dbg_buff,
1039 			       struct cudbg_error *cudbg_err)
1040 {
1041 	return cudbg_read_cim_ibq(pdbg_init, dbg_buff, cudbg_err, 5);
1042 }
1043 
1044 u32 cudbg_cim_obq_size(struct adapter *padap, int qid)
1045 {
1046 	u32 value;
1047 
1048 	t4_write_reg(padap, CIM_QUEUE_CONFIG_REF_A, OBQSELECT_F |
1049 		     QUENUMSELECT_V(qid));
1050 	value = t4_read_reg(padap, CIM_QUEUE_CONFIG_CTRL_A);
1051 	value = CIMQSIZE_G(value) * 64; /* size in number of words */
1052 	return value * sizeof(u32);
1053 }
1054 
1055 static int cudbg_read_cim_obq(struct cudbg_init *pdbg_init,
1056 			      struct cudbg_buffer *dbg_buff,
1057 			      struct cudbg_error *cudbg_err, int qid)
1058 {
1059 	struct adapter *padap = pdbg_init->adap;
1060 	struct cudbg_buffer temp_buff = { 0 };
1061 	int no_of_read_words, rc = 0;
1062 	u32 qsize;
1063 
1064 	/* collect CIM OBQ */
1065 	qsize =  cudbg_cim_obq_size(padap, qid);
1066 	rc = cudbg_get_buff(pdbg_init, dbg_buff, qsize, &temp_buff);
1067 	if (rc)
1068 		return rc;
1069 
1070 	/* t4_read_cim_obq will return no. of read words or error */
1071 	no_of_read_words = t4_read_cim_obq(padap, qid,
1072 					   (u32 *)temp_buff.data, qsize);
1073 	/* no_of_read_words is less than or equal to 0 means error */
1074 	if (no_of_read_words <= 0) {
1075 		if (!no_of_read_words)
1076 			rc = CUDBG_SYSTEM_ERROR;
1077 		else
1078 			rc = no_of_read_words;
1079 		cudbg_err->sys_err = rc;
1080 		cudbg_put_buff(pdbg_init, &temp_buff);
1081 		return rc;
1082 	}
1083 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1084 }
1085 
1086 int cudbg_collect_cim_obq_ulp0(struct cudbg_init *pdbg_init,
1087 			       struct cudbg_buffer *dbg_buff,
1088 			       struct cudbg_error *cudbg_err)
1089 {
1090 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 0);
1091 }
1092 
1093 int cudbg_collect_cim_obq_ulp1(struct cudbg_init *pdbg_init,
1094 			       struct cudbg_buffer *dbg_buff,
1095 			       struct cudbg_error *cudbg_err)
1096 {
1097 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 1);
1098 }
1099 
1100 int cudbg_collect_cim_obq_ulp2(struct cudbg_init *pdbg_init,
1101 			       struct cudbg_buffer *dbg_buff,
1102 			       struct cudbg_error *cudbg_err)
1103 {
1104 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 2);
1105 }
1106 
1107 int cudbg_collect_cim_obq_ulp3(struct cudbg_init *pdbg_init,
1108 			       struct cudbg_buffer *dbg_buff,
1109 			       struct cudbg_error *cudbg_err)
1110 {
1111 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 3);
1112 }
1113 
1114 int cudbg_collect_cim_obq_sge(struct cudbg_init *pdbg_init,
1115 			      struct cudbg_buffer *dbg_buff,
1116 			      struct cudbg_error *cudbg_err)
1117 {
1118 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 4);
1119 }
1120 
1121 int cudbg_collect_cim_obq_ncsi(struct cudbg_init *pdbg_init,
1122 			       struct cudbg_buffer *dbg_buff,
1123 			       struct cudbg_error *cudbg_err)
1124 {
1125 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 5);
1126 }
1127 
1128 int cudbg_collect_obq_sge_rx_q0(struct cudbg_init *pdbg_init,
1129 				struct cudbg_buffer *dbg_buff,
1130 				struct cudbg_error *cudbg_err)
1131 {
1132 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 6);
1133 }
1134 
1135 int cudbg_collect_obq_sge_rx_q1(struct cudbg_init *pdbg_init,
1136 				struct cudbg_buffer *dbg_buff,
1137 				struct cudbg_error *cudbg_err)
1138 {
1139 	return cudbg_read_cim_obq(pdbg_init, dbg_buff, cudbg_err, 7);
1140 }
1141 
1142 static int cudbg_meminfo_get_mem_index(struct adapter *padap,
1143 				       struct cudbg_meminfo *mem_info,
1144 				       u8 mem_type, u8 *idx)
1145 {
1146 	u8 i, flag;
1147 
1148 	switch (mem_type) {
1149 	case MEM_EDC0:
1150 		flag = EDC0_FLAG;
1151 		break;
1152 	case MEM_EDC1:
1153 		flag = EDC1_FLAG;
1154 		break;
1155 	case MEM_MC0:
1156 		/* Some T5 cards have both MC0 and MC1. */
1157 		flag = is_t5(padap->params.chip) ? MC0_FLAG : MC_FLAG;
1158 		break;
1159 	case MEM_MC1:
1160 		flag = MC1_FLAG;
1161 		break;
1162 	case MEM_HMA:
1163 		flag = HMA_FLAG;
1164 		break;
1165 	default:
1166 		return CUDBG_STATUS_ENTITY_NOT_FOUND;
1167 	}
1168 
1169 	for (i = 0; i < mem_info->avail_c; i++) {
1170 		if (mem_info->avail[i].idx == flag) {
1171 			*idx = i;
1172 			return 0;
1173 		}
1174 	}
1175 
1176 	return CUDBG_STATUS_ENTITY_NOT_FOUND;
1177 }
1178 
1179 /* Fetch the @region_name's start and end from @meminfo. */
1180 static int cudbg_get_mem_region(struct adapter *padap,
1181 				struct cudbg_meminfo *meminfo,
1182 				u8 mem_type, const char *region_name,
1183 				struct cudbg_mem_desc *mem_desc)
1184 {
1185 	u8 mc, found = 0;
1186 	u32 idx = 0;
1187 	int rc, i;
1188 
1189 	rc = cudbg_meminfo_get_mem_index(padap, meminfo, mem_type, &mc);
1190 	if (rc)
1191 		return rc;
1192 
1193 	i = match_string(cudbg_region, ARRAY_SIZE(cudbg_region), region_name);
1194 	if (i < 0)
1195 		return -EINVAL;
1196 
1197 	idx = i;
1198 	for (i = 0; i < meminfo->mem_c; i++) {
1199 		if (meminfo->mem[i].idx >= ARRAY_SIZE(cudbg_region))
1200 			continue; /* Skip holes */
1201 
1202 		if (!(meminfo->mem[i].limit))
1203 			meminfo->mem[i].limit =
1204 				i < meminfo->mem_c - 1 ?
1205 				meminfo->mem[i + 1].base - 1 : ~0;
1206 
1207 		if (meminfo->mem[i].idx == idx) {
1208 			/* Check if the region exists in @mem_type memory */
1209 			if (meminfo->mem[i].base < meminfo->avail[mc].base &&
1210 			    meminfo->mem[i].limit < meminfo->avail[mc].base)
1211 				return -EINVAL;
1212 
1213 			if (meminfo->mem[i].base > meminfo->avail[mc].limit)
1214 				return -EINVAL;
1215 
1216 			memcpy(mem_desc, &meminfo->mem[i],
1217 			       sizeof(struct cudbg_mem_desc));
1218 			found = 1;
1219 			break;
1220 		}
1221 	}
1222 	if (!found)
1223 		return -EINVAL;
1224 
1225 	return 0;
1226 }
1227 
1228 /* Fetch and update the start and end of the requested memory region w.r.t 0
1229  * in the corresponding EDC/MC/HMA.
1230  */
1231 static int cudbg_get_mem_relative(struct adapter *padap,
1232 				  struct cudbg_meminfo *meminfo,
1233 				  u8 mem_type, u32 *out_base, u32 *out_end)
1234 {
1235 	u8 mc_idx;
1236 	int rc;
1237 
1238 	rc = cudbg_meminfo_get_mem_index(padap, meminfo, mem_type, &mc_idx);
1239 	if (rc)
1240 		return rc;
1241 
1242 	if (*out_base < meminfo->avail[mc_idx].base)
1243 		*out_base = 0;
1244 	else
1245 		*out_base -= meminfo->avail[mc_idx].base;
1246 
1247 	if (*out_end > meminfo->avail[mc_idx].limit)
1248 		*out_end = meminfo->avail[mc_idx].limit;
1249 	else
1250 		*out_end -= meminfo->avail[mc_idx].base;
1251 
1252 	return 0;
1253 }
1254 
1255 /* Get TX and RX Payload region */
1256 static int cudbg_get_payload_range(struct adapter *padap, u8 mem_type,
1257 				   const char *region_name,
1258 				   struct cudbg_region_info *payload)
1259 {
1260 	struct cudbg_mem_desc mem_desc = { 0 };
1261 	struct cudbg_meminfo meminfo;
1262 	int rc;
1263 
1264 	rc = cudbg_fill_meminfo(padap, &meminfo);
1265 	if (rc)
1266 		return rc;
1267 
1268 	rc = cudbg_get_mem_region(padap, &meminfo, mem_type, region_name,
1269 				  &mem_desc);
1270 	if (rc) {
1271 		payload->exist = false;
1272 		return 0;
1273 	}
1274 
1275 	payload->exist = true;
1276 	payload->start = mem_desc.base;
1277 	payload->end = mem_desc.limit;
1278 
1279 	return cudbg_get_mem_relative(padap, &meminfo, mem_type,
1280 				      &payload->start, &payload->end);
1281 }
1282 
1283 static int cudbg_memory_read(struct cudbg_init *pdbg_init, int win,
1284 			     int mtype, u32 addr, u32 len, void *hbuf)
1285 {
1286 	u32 win_pf, memoffset, mem_aperture, mem_base;
1287 	struct adapter *adap = pdbg_init->adap;
1288 	u32 pos, offset, resid;
1289 	u32 *res_buf;
1290 	u64 *buf;
1291 	int ret;
1292 
1293 	/* Argument sanity checks ...
1294 	 */
1295 	if (addr & 0x3 || (uintptr_t)hbuf & 0x3)
1296 		return -EINVAL;
1297 
1298 	buf = (u64 *)hbuf;
1299 
1300 	/* Try to do 64-bit reads.  Residual will be handled later. */
1301 	resid = len & 0x7;
1302 	len -= resid;
1303 
1304 	ret = t4_memory_rw_init(adap, win, mtype, &memoffset, &mem_base,
1305 				&mem_aperture);
1306 	if (ret)
1307 		return ret;
1308 
1309 	addr = addr + memoffset;
1310 	win_pf = is_t4(adap->params.chip) ? 0 : PFNUM_V(adap->pf);
1311 
1312 	pos = addr & ~(mem_aperture - 1);
1313 	offset = addr - pos;
1314 
1315 	/* Set up initial PCI-E Memory Window to cover the start of our
1316 	 * transfer.
1317 	 */
1318 	t4_memory_update_win(adap, win, pos | win_pf);
1319 
1320 	/* Transfer data from the adapter */
1321 	while (len > 0) {
1322 		*buf++ = le64_to_cpu((__force __le64)
1323 				     t4_read_reg64(adap, mem_base + offset));
1324 		offset += sizeof(u64);
1325 		len -= sizeof(u64);
1326 
1327 		/* If we've reached the end of our current window aperture,
1328 		 * move the PCI-E Memory Window on to the next.
1329 		 */
1330 		if (offset == mem_aperture) {
1331 			pos += mem_aperture;
1332 			offset = 0;
1333 			t4_memory_update_win(adap, win, pos | win_pf);
1334 		}
1335 	}
1336 
1337 	res_buf = (u32 *)buf;
1338 	/* Read residual in 32-bit multiples */
1339 	while (resid > sizeof(u32)) {
1340 		*res_buf++ = le32_to_cpu((__force __le32)
1341 					 t4_read_reg(adap, mem_base + offset));
1342 		offset += sizeof(u32);
1343 		resid -= sizeof(u32);
1344 
1345 		/* If we've reached the end of our current window aperture,
1346 		 * move the PCI-E Memory Window on to the next.
1347 		 */
1348 		if (offset == mem_aperture) {
1349 			pos += mem_aperture;
1350 			offset = 0;
1351 			t4_memory_update_win(adap, win, pos | win_pf);
1352 		}
1353 	}
1354 
1355 	/* Transfer residual < 32-bits */
1356 	if (resid)
1357 		t4_memory_rw_residual(adap, resid, mem_base + offset,
1358 				      (u8 *)res_buf, T4_MEMORY_READ);
1359 
1360 	return 0;
1361 }
1362 
1363 #define CUDBG_YIELD_ITERATION 256
1364 
1365 static int cudbg_read_fw_mem(struct cudbg_init *pdbg_init,
1366 			     struct cudbg_buffer *dbg_buff, u8 mem_type,
1367 			     unsigned long tot_len,
1368 			     struct cudbg_error *cudbg_err)
1369 {
1370 	static const char * const region_name[] = { "Tx payload:",
1371 						    "Rx payload:" };
1372 	unsigned long bytes, bytes_left, bytes_read = 0;
1373 	struct adapter *padap = pdbg_init->adap;
1374 	struct cudbg_buffer temp_buff = { 0 };
1375 	struct cudbg_region_info payload[2];
1376 	u32 yield_count = 0;
1377 	int rc = 0;
1378 	u8 i;
1379 
1380 	/* Get TX/RX Payload region range if they exist */
1381 	memset(payload, 0, sizeof(payload));
1382 	for (i = 0; i < ARRAY_SIZE(region_name); i++) {
1383 		rc = cudbg_get_payload_range(padap, mem_type, region_name[i],
1384 					     &payload[i]);
1385 		if (rc)
1386 			return rc;
1387 
1388 		if (payload[i].exist) {
1389 			/* Align start and end to avoid wrap around */
1390 			payload[i].start = roundup(payload[i].start,
1391 						   CUDBG_CHUNK_SIZE);
1392 			payload[i].end = rounddown(payload[i].end,
1393 						   CUDBG_CHUNK_SIZE);
1394 		}
1395 	}
1396 
1397 	bytes_left = tot_len;
1398 	while (bytes_left > 0) {
1399 		/* As MC size is huge and read through PIO access, this
1400 		 * loop will hold cpu for a longer time. OS may think that
1401 		 * the process is hanged and will generate CPU stall traces.
1402 		 * So yield the cpu regularly.
1403 		 */
1404 		yield_count++;
1405 		if (!(yield_count % CUDBG_YIELD_ITERATION))
1406 			schedule();
1407 
1408 		bytes = min_t(unsigned long, bytes_left,
1409 			      (unsigned long)CUDBG_CHUNK_SIZE);
1410 		rc = cudbg_get_buff(pdbg_init, dbg_buff, bytes, &temp_buff);
1411 		if (rc)
1412 			return rc;
1413 
1414 		for (i = 0; i < ARRAY_SIZE(payload); i++)
1415 			if (payload[i].exist &&
1416 			    bytes_read >= payload[i].start &&
1417 			    bytes_read + bytes <= payload[i].end)
1418 				/* TX and RX Payload regions can't overlap */
1419 				goto skip_read;
1420 
1421 		spin_lock(&padap->win0_lock);
1422 		rc = cudbg_memory_read(pdbg_init, MEMWIN_NIC, mem_type,
1423 				       bytes_read, bytes, temp_buff.data);
1424 		spin_unlock(&padap->win0_lock);
1425 		if (rc) {
1426 			cudbg_err->sys_err = rc;
1427 			cudbg_put_buff(pdbg_init, &temp_buff);
1428 			return rc;
1429 		}
1430 
1431 skip_read:
1432 		bytes_left -= bytes;
1433 		bytes_read += bytes;
1434 		rc = cudbg_write_and_release_buff(pdbg_init, &temp_buff,
1435 						  dbg_buff);
1436 		if (rc) {
1437 			cudbg_put_buff(pdbg_init, &temp_buff);
1438 			return rc;
1439 		}
1440 	}
1441 	return rc;
1442 }
1443 
1444 static void cudbg_t4_fwcache(struct cudbg_init *pdbg_init,
1445 			     struct cudbg_error *cudbg_err)
1446 {
1447 	struct adapter *padap = pdbg_init->adap;
1448 	int rc;
1449 
1450 	if (is_fw_attached(pdbg_init)) {
1451 		/* Flush uP dcache before reading edcX/mcX  */
1452 		rc = t4_fwcache(padap, FW_PARAM_DEV_FWCACHE_FLUSH);
1453 		if (rc)
1454 			cudbg_err->sys_warn = rc;
1455 	}
1456 }
1457 
1458 static int cudbg_mem_region_size(struct cudbg_init *pdbg_init,
1459 				 struct cudbg_error *cudbg_err,
1460 				 u8 mem_type, unsigned long *region_size)
1461 {
1462 	struct adapter *padap = pdbg_init->adap;
1463 	struct cudbg_meminfo mem_info;
1464 	u8 mc_idx;
1465 	int rc;
1466 
1467 	memset(&mem_info, 0, sizeof(struct cudbg_meminfo));
1468 	rc = cudbg_fill_meminfo(padap, &mem_info);
1469 	if (rc) {
1470 		cudbg_err->sys_err = rc;
1471 		return rc;
1472 	}
1473 
1474 	cudbg_t4_fwcache(pdbg_init, cudbg_err);
1475 	rc = cudbg_meminfo_get_mem_index(padap, &mem_info, mem_type, &mc_idx);
1476 	if (rc) {
1477 		cudbg_err->sys_err = rc;
1478 		return rc;
1479 	}
1480 
1481 	if (region_size)
1482 		*region_size = mem_info.avail[mc_idx].limit -
1483 			       mem_info.avail[mc_idx].base;
1484 
1485 	return 0;
1486 }
1487 
1488 static int cudbg_collect_mem_region(struct cudbg_init *pdbg_init,
1489 				    struct cudbg_buffer *dbg_buff,
1490 				    struct cudbg_error *cudbg_err,
1491 				    u8 mem_type)
1492 {
1493 	unsigned long size = 0;
1494 	int rc;
1495 
1496 	rc = cudbg_mem_region_size(pdbg_init, cudbg_err, mem_type, &size);
1497 	if (rc)
1498 		return rc;
1499 
1500 	return cudbg_read_fw_mem(pdbg_init, dbg_buff, mem_type, size,
1501 				 cudbg_err);
1502 }
1503 
1504 int cudbg_collect_edc0_meminfo(struct cudbg_init *pdbg_init,
1505 			       struct cudbg_buffer *dbg_buff,
1506 			       struct cudbg_error *cudbg_err)
1507 {
1508 	return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1509 					MEM_EDC0);
1510 }
1511 
1512 int cudbg_collect_edc1_meminfo(struct cudbg_init *pdbg_init,
1513 			       struct cudbg_buffer *dbg_buff,
1514 			       struct cudbg_error *cudbg_err)
1515 {
1516 	return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1517 					MEM_EDC1);
1518 }
1519 
1520 int cudbg_collect_mc0_meminfo(struct cudbg_init *pdbg_init,
1521 			      struct cudbg_buffer *dbg_buff,
1522 			      struct cudbg_error *cudbg_err)
1523 {
1524 	return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1525 					MEM_MC0);
1526 }
1527 
1528 int cudbg_collect_mc1_meminfo(struct cudbg_init *pdbg_init,
1529 			      struct cudbg_buffer *dbg_buff,
1530 			      struct cudbg_error *cudbg_err)
1531 {
1532 	return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1533 					MEM_MC1);
1534 }
1535 
1536 int cudbg_collect_hma_meminfo(struct cudbg_init *pdbg_init,
1537 			      struct cudbg_buffer *dbg_buff,
1538 			      struct cudbg_error *cudbg_err)
1539 {
1540 	return cudbg_collect_mem_region(pdbg_init, dbg_buff, cudbg_err,
1541 					MEM_HMA);
1542 }
1543 
1544 int cudbg_collect_rss(struct cudbg_init *pdbg_init,
1545 		      struct cudbg_buffer *dbg_buff,
1546 		      struct cudbg_error *cudbg_err)
1547 {
1548 	struct adapter *padap = pdbg_init->adap;
1549 	struct cudbg_buffer temp_buff = { 0 };
1550 	int rc, nentries;
1551 
1552 	nentries = t4_chip_rss_size(padap);
1553 	rc = cudbg_get_buff(pdbg_init, dbg_buff, nentries * sizeof(u16),
1554 			    &temp_buff);
1555 	if (rc)
1556 		return rc;
1557 
1558 	rc = t4_read_rss(padap, (u16 *)temp_buff.data);
1559 	if (rc) {
1560 		cudbg_err->sys_err = rc;
1561 		cudbg_put_buff(pdbg_init, &temp_buff);
1562 		return rc;
1563 	}
1564 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1565 }
1566 
1567 int cudbg_collect_rss_vf_config(struct cudbg_init *pdbg_init,
1568 				struct cudbg_buffer *dbg_buff,
1569 				struct cudbg_error *cudbg_err)
1570 {
1571 	struct adapter *padap = pdbg_init->adap;
1572 	struct cudbg_buffer temp_buff = { 0 };
1573 	struct cudbg_rss_vf_conf *vfconf;
1574 	int vf, rc, vf_count;
1575 
1576 	vf_count = padap->params.arch.vfcount;
1577 	rc = cudbg_get_buff(pdbg_init, dbg_buff,
1578 			    vf_count * sizeof(struct cudbg_rss_vf_conf),
1579 			    &temp_buff);
1580 	if (rc)
1581 		return rc;
1582 
1583 	vfconf = (struct cudbg_rss_vf_conf *)temp_buff.data;
1584 	for (vf = 0; vf < vf_count; vf++)
1585 		t4_read_rss_vf_config(padap, vf, &vfconf[vf].rss_vf_vfl,
1586 				      &vfconf[vf].rss_vf_vfh, true);
1587 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1588 }
1589 
1590 int cudbg_collect_path_mtu(struct cudbg_init *pdbg_init,
1591 			   struct cudbg_buffer *dbg_buff,
1592 			   struct cudbg_error *cudbg_err)
1593 {
1594 	struct adapter *padap = pdbg_init->adap;
1595 	struct cudbg_buffer temp_buff = { 0 };
1596 	int rc;
1597 
1598 	rc = cudbg_get_buff(pdbg_init, dbg_buff, NMTUS * sizeof(u16),
1599 			    &temp_buff);
1600 	if (rc)
1601 		return rc;
1602 
1603 	t4_read_mtu_tbl(padap, (u16 *)temp_buff.data, NULL);
1604 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1605 }
1606 
1607 int cudbg_collect_pm_stats(struct cudbg_init *pdbg_init,
1608 			   struct cudbg_buffer *dbg_buff,
1609 			   struct cudbg_error *cudbg_err)
1610 {
1611 	struct adapter *padap = pdbg_init->adap;
1612 	struct cudbg_buffer temp_buff = { 0 };
1613 	struct cudbg_pm_stats *pm_stats_buff;
1614 	int rc;
1615 
1616 	rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_pm_stats),
1617 			    &temp_buff);
1618 	if (rc)
1619 		return rc;
1620 
1621 	pm_stats_buff = (struct cudbg_pm_stats *)temp_buff.data;
1622 	t4_pmtx_get_stats(padap, pm_stats_buff->tx_cnt, pm_stats_buff->tx_cyc);
1623 	t4_pmrx_get_stats(padap, pm_stats_buff->rx_cnt, pm_stats_buff->rx_cyc);
1624 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1625 }
1626 
1627 int cudbg_collect_hw_sched(struct cudbg_init *pdbg_init,
1628 			   struct cudbg_buffer *dbg_buff,
1629 			   struct cudbg_error *cudbg_err)
1630 {
1631 	struct adapter *padap = pdbg_init->adap;
1632 	struct cudbg_buffer temp_buff = { 0 };
1633 	struct cudbg_hw_sched *hw_sched_buff;
1634 	int i, rc = 0;
1635 
1636 	if (!padap->params.vpd.cclk)
1637 		return CUDBG_STATUS_CCLK_NOT_DEFINED;
1638 
1639 	rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_hw_sched),
1640 			    &temp_buff);
1641 
1642 	if (rc)
1643 		return rc;
1644 
1645 	hw_sched_buff = (struct cudbg_hw_sched *)temp_buff.data;
1646 	hw_sched_buff->map = t4_read_reg(padap, TP_TX_MOD_QUEUE_REQ_MAP_A);
1647 	hw_sched_buff->mode = TIMERMODE_G(t4_read_reg(padap, TP_MOD_CONFIG_A));
1648 	t4_read_pace_tbl(padap, hw_sched_buff->pace_tab);
1649 	for (i = 0; i < NTX_SCHED; ++i)
1650 		t4_get_tx_sched(padap, i, &hw_sched_buff->kbps[i],
1651 				&hw_sched_buff->ipg[i], true);
1652 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1653 }
1654 
1655 int cudbg_collect_tp_indirect(struct cudbg_init *pdbg_init,
1656 			      struct cudbg_buffer *dbg_buff,
1657 			      struct cudbg_error *cudbg_err)
1658 {
1659 	struct adapter *padap = pdbg_init->adap;
1660 	struct cudbg_buffer temp_buff = { 0 };
1661 	struct ireg_buf *ch_tp_pio;
1662 	int i, rc, n = 0;
1663 	u32 size;
1664 
1665 	if (is_t5(padap->params.chip))
1666 		n = sizeof(t5_tp_pio_array) +
1667 		    sizeof(t5_tp_tm_pio_array) +
1668 		    sizeof(t5_tp_mib_index_array);
1669 	else
1670 		n = sizeof(t6_tp_pio_array) +
1671 		    sizeof(t6_tp_tm_pio_array) +
1672 		    sizeof(t6_tp_mib_index_array);
1673 
1674 	n = n / (IREG_NUM_ELEM * sizeof(u32));
1675 	size = sizeof(struct ireg_buf) * n;
1676 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1677 	if (rc)
1678 		return rc;
1679 
1680 	ch_tp_pio = (struct ireg_buf *)temp_buff.data;
1681 
1682 	/* TP_PIO */
1683 	if (is_t5(padap->params.chip))
1684 		n = sizeof(t5_tp_pio_array) / (IREG_NUM_ELEM * sizeof(u32));
1685 	else if (is_t6(padap->params.chip))
1686 		n = sizeof(t6_tp_pio_array) / (IREG_NUM_ELEM * sizeof(u32));
1687 
1688 	for (i = 0; i < n; i++) {
1689 		struct ireg_field *tp_pio = &ch_tp_pio->tp_pio;
1690 		u32 *buff = ch_tp_pio->outbuf;
1691 
1692 		if (is_t5(padap->params.chip)) {
1693 			tp_pio->ireg_addr = t5_tp_pio_array[i][0];
1694 			tp_pio->ireg_data = t5_tp_pio_array[i][1];
1695 			tp_pio->ireg_local_offset = t5_tp_pio_array[i][2];
1696 			tp_pio->ireg_offset_range = t5_tp_pio_array[i][3];
1697 		} else if (is_t6(padap->params.chip)) {
1698 			tp_pio->ireg_addr = t6_tp_pio_array[i][0];
1699 			tp_pio->ireg_data = t6_tp_pio_array[i][1];
1700 			tp_pio->ireg_local_offset = t6_tp_pio_array[i][2];
1701 			tp_pio->ireg_offset_range = t6_tp_pio_array[i][3];
1702 		}
1703 		t4_tp_pio_read(padap, buff, tp_pio->ireg_offset_range,
1704 			       tp_pio->ireg_local_offset, true);
1705 		ch_tp_pio++;
1706 	}
1707 
1708 	/* TP_TM_PIO */
1709 	if (is_t5(padap->params.chip))
1710 		n = sizeof(t5_tp_tm_pio_array) / (IREG_NUM_ELEM * sizeof(u32));
1711 	else if (is_t6(padap->params.chip))
1712 		n = sizeof(t6_tp_tm_pio_array) / (IREG_NUM_ELEM * sizeof(u32));
1713 
1714 	for (i = 0; i < n; i++) {
1715 		struct ireg_field *tp_pio = &ch_tp_pio->tp_pio;
1716 		u32 *buff = ch_tp_pio->outbuf;
1717 
1718 		if (is_t5(padap->params.chip)) {
1719 			tp_pio->ireg_addr = t5_tp_tm_pio_array[i][0];
1720 			tp_pio->ireg_data = t5_tp_tm_pio_array[i][1];
1721 			tp_pio->ireg_local_offset = t5_tp_tm_pio_array[i][2];
1722 			tp_pio->ireg_offset_range = t5_tp_tm_pio_array[i][3];
1723 		} else if (is_t6(padap->params.chip)) {
1724 			tp_pio->ireg_addr = t6_tp_tm_pio_array[i][0];
1725 			tp_pio->ireg_data = t6_tp_tm_pio_array[i][1];
1726 			tp_pio->ireg_local_offset = t6_tp_tm_pio_array[i][2];
1727 			tp_pio->ireg_offset_range = t6_tp_tm_pio_array[i][3];
1728 		}
1729 		t4_tp_tm_pio_read(padap, buff, tp_pio->ireg_offset_range,
1730 				  tp_pio->ireg_local_offset, true);
1731 		ch_tp_pio++;
1732 	}
1733 
1734 	/* TP_MIB_INDEX */
1735 	if (is_t5(padap->params.chip))
1736 		n = sizeof(t5_tp_mib_index_array) /
1737 		    (IREG_NUM_ELEM * sizeof(u32));
1738 	else if (is_t6(padap->params.chip))
1739 		n = sizeof(t6_tp_mib_index_array) /
1740 		    (IREG_NUM_ELEM * sizeof(u32));
1741 
1742 	for (i = 0; i < n ; i++) {
1743 		struct ireg_field *tp_pio = &ch_tp_pio->tp_pio;
1744 		u32 *buff = ch_tp_pio->outbuf;
1745 
1746 		if (is_t5(padap->params.chip)) {
1747 			tp_pio->ireg_addr = t5_tp_mib_index_array[i][0];
1748 			tp_pio->ireg_data = t5_tp_mib_index_array[i][1];
1749 			tp_pio->ireg_local_offset =
1750 				t5_tp_mib_index_array[i][2];
1751 			tp_pio->ireg_offset_range =
1752 				t5_tp_mib_index_array[i][3];
1753 		} else if (is_t6(padap->params.chip)) {
1754 			tp_pio->ireg_addr = t6_tp_mib_index_array[i][0];
1755 			tp_pio->ireg_data = t6_tp_mib_index_array[i][1];
1756 			tp_pio->ireg_local_offset =
1757 				t6_tp_mib_index_array[i][2];
1758 			tp_pio->ireg_offset_range =
1759 				t6_tp_mib_index_array[i][3];
1760 		}
1761 		t4_tp_mib_read(padap, buff, tp_pio->ireg_offset_range,
1762 			       tp_pio->ireg_local_offset, true);
1763 		ch_tp_pio++;
1764 	}
1765 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1766 }
1767 
1768 static void cudbg_read_sge_qbase_indirect_reg(struct adapter *padap,
1769 					      struct sge_qbase_reg_field *qbase,
1770 					      u32 func, bool is_pf)
1771 {
1772 	u32 *buff, i;
1773 
1774 	if (is_pf) {
1775 		buff = qbase->pf_data_value[func];
1776 	} else {
1777 		buff = qbase->vf_data_value[func];
1778 		/* In SGE_QBASE_INDEX,
1779 		 * Entries 0->7 are PF0->7, Entries 8->263 are VFID0->256.
1780 		 */
1781 		func += 8;
1782 	}
1783 
1784 	t4_write_reg(padap, qbase->reg_addr, func);
1785 	for (i = 0; i < SGE_QBASE_DATA_REG_NUM; i++, buff++)
1786 		*buff = t4_read_reg(padap, qbase->reg_data[i]);
1787 }
1788 
1789 int cudbg_collect_sge_indirect(struct cudbg_init *pdbg_init,
1790 			       struct cudbg_buffer *dbg_buff,
1791 			       struct cudbg_error *cudbg_err)
1792 {
1793 	struct adapter *padap = pdbg_init->adap;
1794 	struct cudbg_buffer temp_buff = { 0 };
1795 	struct sge_qbase_reg_field *sge_qbase;
1796 	struct ireg_buf *ch_sge_dbg;
1797 	u8 padap_running = 0;
1798 	int i, rc;
1799 	u32 size;
1800 
1801 	/* Accessing SGE_QBASE_MAP[0-3] and SGE_QBASE_INDEX regs can
1802 	 * lead to SGE missing doorbells under heavy traffic. So, only
1803 	 * collect them when adapter is idle.
1804 	 */
1805 	for_each_port(padap, i) {
1806 		padap_running = netif_running(padap->port[i]);
1807 		if (padap_running)
1808 			break;
1809 	}
1810 
1811 	size = sizeof(*ch_sge_dbg) * 2;
1812 	if (!padap_running)
1813 		size += sizeof(*sge_qbase);
1814 
1815 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1816 	if (rc)
1817 		return rc;
1818 
1819 	ch_sge_dbg = (struct ireg_buf *)temp_buff.data;
1820 	for (i = 0; i < 2; i++) {
1821 		struct ireg_field *sge_pio = &ch_sge_dbg->tp_pio;
1822 		u32 *buff = ch_sge_dbg->outbuf;
1823 
1824 		sge_pio->ireg_addr = t5_sge_dbg_index_array[i][0];
1825 		sge_pio->ireg_data = t5_sge_dbg_index_array[i][1];
1826 		sge_pio->ireg_local_offset = t5_sge_dbg_index_array[i][2];
1827 		sge_pio->ireg_offset_range = t5_sge_dbg_index_array[i][3];
1828 		t4_read_indirect(padap,
1829 				 sge_pio->ireg_addr,
1830 				 sge_pio->ireg_data,
1831 				 buff,
1832 				 sge_pio->ireg_offset_range,
1833 				 sge_pio->ireg_local_offset);
1834 		ch_sge_dbg++;
1835 	}
1836 
1837 	if (CHELSIO_CHIP_VERSION(padap->params.chip) > CHELSIO_T5 &&
1838 	    !padap_running) {
1839 		sge_qbase = (struct sge_qbase_reg_field *)ch_sge_dbg;
1840 		/* 1 addr reg SGE_QBASE_INDEX and 4 data reg
1841 		 * SGE_QBASE_MAP[0-3]
1842 		 */
1843 		sge_qbase->reg_addr = t6_sge_qbase_index_array[0];
1844 		for (i = 0; i < SGE_QBASE_DATA_REG_NUM; i++)
1845 			sge_qbase->reg_data[i] =
1846 				t6_sge_qbase_index_array[i + 1];
1847 
1848 		for (i = 0; i <= PCIE_FW_MASTER_M; i++)
1849 			cudbg_read_sge_qbase_indirect_reg(padap, sge_qbase,
1850 							  i, true);
1851 
1852 		for (i = 0; i < padap->params.arch.vfcount; i++)
1853 			cudbg_read_sge_qbase_indirect_reg(padap, sge_qbase,
1854 							  i, false);
1855 
1856 		sge_qbase->vfcount = padap->params.arch.vfcount;
1857 	}
1858 
1859 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1860 }
1861 
1862 int cudbg_collect_ulprx_la(struct cudbg_init *pdbg_init,
1863 			   struct cudbg_buffer *dbg_buff,
1864 			   struct cudbg_error *cudbg_err)
1865 {
1866 	struct adapter *padap = pdbg_init->adap;
1867 	struct cudbg_buffer temp_buff = { 0 };
1868 	struct cudbg_ulprx_la *ulprx_la_buff;
1869 	int rc;
1870 
1871 	rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_ulprx_la),
1872 			    &temp_buff);
1873 	if (rc)
1874 		return rc;
1875 
1876 	ulprx_la_buff = (struct cudbg_ulprx_la *)temp_buff.data;
1877 	t4_ulprx_read_la(padap, (u32 *)ulprx_la_buff->data);
1878 	ulprx_la_buff->size = ULPRX_LA_SIZE;
1879 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1880 }
1881 
1882 int cudbg_collect_tp_la(struct cudbg_init *pdbg_init,
1883 			struct cudbg_buffer *dbg_buff,
1884 			struct cudbg_error *cudbg_err)
1885 {
1886 	struct adapter *padap = pdbg_init->adap;
1887 	struct cudbg_buffer temp_buff = { 0 };
1888 	struct cudbg_tp_la *tp_la_buff;
1889 	int size, rc;
1890 
1891 	size = sizeof(struct cudbg_tp_la) + TPLA_SIZE *  sizeof(u64);
1892 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1893 	if (rc)
1894 		return rc;
1895 
1896 	tp_la_buff = (struct cudbg_tp_la *)temp_buff.data;
1897 	tp_la_buff->mode = DBGLAMODE_G(t4_read_reg(padap, TP_DBG_LA_CONFIG_A));
1898 	t4_tp_read_la(padap, (u64 *)tp_la_buff->data, NULL);
1899 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1900 }
1901 
1902 int cudbg_collect_meminfo(struct cudbg_init *pdbg_init,
1903 			  struct cudbg_buffer *dbg_buff,
1904 			  struct cudbg_error *cudbg_err)
1905 {
1906 	struct adapter *padap = pdbg_init->adap;
1907 	struct cudbg_buffer temp_buff = { 0 };
1908 	struct cudbg_meminfo *meminfo_buff;
1909 	struct cudbg_ver_hdr *ver_hdr;
1910 	int rc;
1911 
1912 	rc = cudbg_get_buff(pdbg_init, dbg_buff,
1913 			    sizeof(struct cudbg_ver_hdr) +
1914 			    sizeof(struct cudbg_meminfo),
1915 			    &temp_buff);
1916 	if (rc)
1917 		return rc;
1918 
1919 	ver_hdr = (struct cudbg_ver_hdr *)temp_buff.data;
1920 	ver_hdr->signature = CUDBG_ENTITY_SIGNATURE;
1921 	ver_hdr->revision = CUDBG_MEMINFO_REV;
1922 	ver_hdr->size = sizeof(struct cudbg_meminfo);
1923 
1924 	meminfo_buff = (struct cudbg_meminfo *)(temp_buff.data +
1925 						sizeof(*ver_hdr));
1926 	rc = cudbg_fill_meminfo(padap, meminfo_buff);
1927 	if (rc) {
1928 		cudbg_err->sys_err = rc;
1929 		cudbg_put_buff(pdbg_init, &temp_buff);
1930 		return rc;
1931 	}
1932 
1933 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1934 }
1935 
1936 int cudbg_collect_cim_pif_la(struct cudbg_init *pdbg_init,
1937 			     struct cudbg_buffer *dbg_buff,
1938 			     struct cudbg_error *cudbg_err)
1939 {
1940 	struct cudbg_cim_pif_la *cim_pif_la_buff;
1941 	struct adapter *padap = pdbg_init->adap;
1942 	struct cudbg_buffer temp_buff = { 0 };
1943 	int size, rc;
1944 
1945 	size = sizeof(struct cudbg_cim_pif_la) +
1946 	       2 * CIM_PIFLA_SIZE * 6 * sizeof(u32);
1947 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
1948 	if (rc)
1949 		return rc;
1950 
1951 	cim_pif_la_buff = (struct cudbg_cim_pif_la *)temp_buff.data;
1952 	cim_pif_la_buff->size = CIM_PIFLA_SIZE;
1953 	t4_cim_read_pif_la(padap, (u32 *)cim_pif_la_buff->data,
1954 			   (u32 *)cim_pif_la_buff->data + 6 * CIM_PIFLA_SIZE,
1955 			   NULL, NULL);
1956 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
1957 }
1958 
1959 int cudbg_collect_clk_info(struct cudbg_init *pdbg_init,
1960 			   struct cudbg_buffer *dbg_buff,
1961 			   struct cudbg_error *cudbg_err)
1962 {
1963 	struct adapter *padap = pdbg_init->adap;
1964 	struct cudbg_buffer temp_buff = { 0 };
1965 	struct cudbg_clk_info *clk_info_buff;
1966 	u64 tp_tick_us;
1967 	int rc;
1968 
1969 	if (!padap->params.vpd.cclk)
1970 		return CUDBG_STATUS_CCLK_NOT_DEFINED;
1971 
1972 	rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_clk_info),
1973 			    &temp_buff);
1974 	if (rc)
1975 		return rc;
1976 
1977 	clk_info_buff = (struct cudbg_clk_info *)temp_buff.data;
1978 	clk_info_buff->cclk_ps = 1000000000 / padap->params.vpd.cclk; /* psec */
1979 	clk_info_buff->res = t4_read_reg(padap, TP_TIMER_RESOLUTION_A);
1980 	clk_info_buff->tre = TIMERRESOLUTION_G(clk_info_buff->res);
1981 	clk_info_buff->dack_re = DELAYEDACKRESOLUTION_G(clk_info_buff->res);
1982 	tp_tick_us = (clk_info_buff->cclk_ps << clk_info_buff->tre) / 1000000;
1983 
1984 	clk_info_buff->dack_timer =
1985 		(clk_info_buff->cclk_ps << clk_info_buff->dack_re) / 1000000 *
1986 		t4_read_reg(padap, TP_DACK_TIMER_A);
1987 	clk_info_buff->retransmit_min =
1988 		tp_tick_us * t4_read_reg(padap, TP_RXT_MIN_A);
1989 	clk_info_buff->retransmit_max =
1990 		tp_tick_us * t4_read_reg(padap, TP_RXT_MAX_A);
1991 	clk_info_buff->persist_timer_min =
1992 		tp_tick_us * t4_read_reg(padap, TP_PERS_MIN_A);
1993 	clk_info_buff->persist_timer_max =
1994 		tp_tick_us * t4_read_reg(padap, TP_PERS_MAX_A);
1995 	clk_info_buff->keepalive_idle_timer =
1996 		tp_tick_us * t4_read_reg(padap, TP_KEEP_IDLE_A);
1997 	clk_info_buff->keepalive_interval =
1998 		tp_tick_us * t4_read_reg(padap, TP_KEEP_INTVL_A);
1999 	clk_info_buff->initial_srtt =
2000 		tp_tick_us * INITSRTT_G(t4_read_reg(padap, TP_INIT_SRTT_A));
2001 	clk_info_buff->finwait2_timer =
2002 		tp_tick_us * t4_read_reg(padap, TP_FINWAIT2_TIMER_A);
2003 
2004 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2005 }
2006 
2007 int cudbg_collect_pcie_indirect(struct cudbg_init *pdbg_init,
2008 				struct cudbg_buffer *dbg_buff,
2009 				struct cudbg_error *cudbg_err)
2010 {
2011 	struct adapter *padap = pdbg_init->adap;
2012 	struct cudbg_buffer temp_buff = { 0 };
2013 	struct ireg_buf *ch_pcie;
2014 	int i, rc, n;
2015 	u32 size;
2016 
2017 	n = sizeof(t5_pcie_pdbg_array) / (IREG_NUM_ELEM * sizeof(u32));
2018 	size = sizeof(struct ireg_buf) * n * 2;
2019 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2020 	if (rc)
2021 		return rc;
2022 
2023 	ch_pcie = (struct ireg_buf *)temp_buff.data;
2024 	/* PCIE_PDBG */
2025 	for (i = 0; i < n; i++) {
2026 		struct ireg_field *pcie_pio = &ch_pcie->tp_pio;
2027 		u32 *buff = ch_pcie->outbuf;
2028 
2029 		pcie_pio->ireg_addr = t5_pcie_pdbg_array[i][0];
2030 		pcie_pio->ireg_data = t5_pcie_pdbg_array[i][1];
2031 		pcie_pio->ireg_local_offset = t5_pcie_pdbg_array[i][2];
2032 		pcie_pio->ireg_offset_range = t5_pcie_pdbg_array[i][3];
2033 		t4_read_indirect(padap,
2034 				 pcie_pio->ireg_addr,
2035 				 pcie_pio->ireg_data,
2036 				 buff,
2037 				 pcie_pio->ireg_offset_range,
2038 				 pcie_pio->ireg_local_offset);
2039 		ch_pcie++;
2040 	}
2041 
2042 	/* PCIE_CDBG */
2043 	n = sizeof(t5_pcie_cdbg_array) / (IREG_NUM_ELEM * sizeof(u32));
2044 	for (i = 0; i < n; i++) {
2045 		struct ireg_field *pcie_pio = &ch_pcie->tp_pio;
2046 		u32 *buff = ch_pcie->outbuf;
2047 
2048 		pcie_pio->ireg_addr = t5_pcie_cdbg_array[i][0];
2049 		pcie_pio->ireg_data = t5_pcie_cdbg_array[i][1];
2050 		pcie_pio->ireg_local_offset = t5_pcie_cdbg_array[i][2];
2051 		pcie_pio->ireg_offset_range = t5_pcie_cdbg_array[i][3];
2052 		t4_read_indirect(padap,
2053 				 pcie_pio->ireg_addr,
2054 				 pcie_pio->ireg_data,
2055 				 buff,
2056 				 pcie_pio->ireg_offset_range,
2057 				 pcie_pio->ireg_local_offset);
2058 		ch_pcie++;
2059 	}
2060 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2061 }
2062 
2063 int cudbg_collect_pm_indirect(struct cudbg_init *pdbg_init,
2064 			      struct cudbg_buffer *dbg_buff,
2065 			      struct cudbg_error *cudbg_err)
2066 {
2067 	struct adapter *padap = pdbg_init->adap;
2068 	struct cudbg_buffer temp_buff = { 0 };
2069 	struct ireg_buf *ch_pm;
2070 	int i, rc, n;
2071 	u32 size;
2072 
2073 	n = sizeof(t5_pm_rx_array) / (IREG_NUM_ELEM * sizeof(u32));
2074 	size = sizeof(struct ireg_buf) * n * 2;
2075 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2076 	if (rc)
2077 		return rc;
2078 
2079 	ch_pm = (struct ireg_buf *)temp_buff.data;
2080 	/* PM_RX */
2081 	for (i = 0; i < n; i++) {
2082 		struct ireg_field *pm_pio = &ch_pm->tp_pio;
2083 		u32 *buff = ch_pm->outbuf;
2084 
2085 		pm_pio->ireg_addr = t5_pm_rx_array[i][0];
2086 		pm_pio->ireg_data = t5_pm_rx_array[i][1];
2087 		pm_pio->ireg_local_offset = t5_pm_rx_array[i][2];
2088 		pm_pio->ireg_offset_range = t5_pm_rx_array[i][3];
2089 		t4_read_indirect(padap,
2090 				 pm_pio->ireg_addr,
2091 				 pm_pio->ireg_data,
2092 				 buff,
2093 				 pm_pio->ireg_offset_range,
2094 				 pm_pio->ireg_local_offset);
2095 		ch_pm++;
2096 	}
2097 
2098 	/* PM_TX */
2099 	n = sizeof(t5_pm_tx_array) / (IREG_NUM_ELEM * sizeof(u32));
2100 	for (i = 0; i < n; i++) {
2101 		struct ireg_field *pm_pio = &ch_pm->tp_pio;
2102 		u32 *buff = ch_pm->outbuf;
2103 
2104 		pm_pio->ireg_addr = t5_pm_tx_array[i][0];
2105 		pm_pio->ireg_data = t5_pm_tx_array[i][1];
2106 		pm_pio->ireg_local_offset = t5_pm_tx_array[i][2];
2107 		pm_pio->ireg_offset_range = t5_pm_tx_array[i][3];
2108 		t4_read_indirect(padap,
2109 				 pm_pio->ireg_addr,
2110 				 pm_pio->ireg_data,
2111 				 buff,
2112 				 pm_pio->ireg_offset_range,
2113 				 pm_pio->ireg_local_offset);
2114 		ch_pm++;
2115 	}
2116 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2117 }
2118 
2119 int cudbg_collect_tid(struct cudbg_init *pdbg_init,
2120 		      struct cudbg_buffer *dbg_buff,
2121 		      struct cudbg_error *cudbg_err)
2122 {
2123 	struct adapter *padap = pdbg_init->adap;
2124 	struct cudbg_tid_info_region_rev1 *tid1;
2125 	struct cudbg_buffer temp_buff = { 0 };
2126 	struct cudbg_tid_info_region *tid;
2127 	u32 para[2], val[2];
2128 	int rc;
2129 
2130 	rc = cudbg_get_buff(pdbg_init, dbg_buff,
2131 			    sizeof(struct cudbg_tid_info_region_rev1),
2132 			    &temp_buff);
2133 	if (rc)
2134 		return rc;
2135 
2136 	tid1 = (struct cudbg_tid_info_region_rev1 *)temp_buff.data;
2137 	tid = &tid1->tid;
2138 	tid1->ver_hdr.signature = CUDBG_ENTITY_SIGNATURE;
2139 	tid1->ver_hdr.revision = CUDBG_TID_INFO_REV;
2140 	tid1->ver_hdr.size = sizeof(struct cudbg_tid_info_region_rev1) -
2141 			     sizeof(struct cudbg_ver_hdr);
2142 
2143 	/* If firmware is not attached/alive, use backdoor register
2144 	 * access to collect dump.
2145 	 */
2146 	if (!is_fw_attached(pdbg_init))
2147 		goto fill_tid;
2148 
2149 #define FW_PARAM_PFVF_A(param) \
2150 	(FW_PARAMS_MNEM_V(FW_PARAMS_MNEM_PFVF) | \
2151 	 FW_PARAMS_PARAM_X_V(FW_PARAMS_PARAM_PFVF_##param) | \
2152 	 FW_PARAMS_PARAM_Y_V(0) | \
2153 	 FW_PARAMS_PARAM_Z_V(0))
2154 
2155 	para[0] = FW_PARAM_PFVF_A(ETHOFLD_START);
2156 	para[1] = FW_PARAM_PFVF_A(ETHOFLD_END);
2157 	rc = t4_query_params(padap, padap->mbox, padap->pf, 0, 2, para, val);
2158 	if (rc <  0) {
2159 		cudbg_err->sys_err = rc;
2160 		cudbg_put_buff(pdbg_init, &temp_buff);
2161 		return rc;
2162 	}
2163 	tid->uotid_base = val[0];
2164 	tid->nuotids = val[1] - val[0] + 1;
2165 
2166 	if (is_t5(padap->params.chip)) {
2167 		tid->sb = t4_read_reg(padap, LE_DB_SERVER_INDEX_A) / 4;
2168 	} else if (is_t6(padap->params.chip)) {
2169 		tid1->tid_start =
2170 			t4_read_reg(padap, LE_DB_ACTIVE_TABLE_START_INDEX_A);
2171 		tid->sb = t4_read_reg(padap, LE_DB_SRVR_START_INDEX_A);
2172 
2173 		para[0] = FW_PARAM_PFVF_A(HPFILTER_START);
2174 		para[1] = FW_PARAM_PFVF_A(HPFILTER_END);
2175 		rc = t4_query_params(padap, padap->mbox, padap->pf, 0, 2,
2176 				     para, val);
2177 		if (rc < 0) {
2178 			cudbg_err->sys_err = rc;
2179 			cudbg_put_buff(pdbg_init, &temp_buff);
2180 			return rc;
2181 		}
2182 		tid->hpftid_base = val[0];
2183 		tid->nhpftids = val[1] - val[0] + 1;
2184 	}
2185 
2186 #undef FW_PARAM_PFVF_A
2187 
2188 fill_tid:
2189 	tid->ntids = padap->tids.ntids;
2190 	tid->nstids = padap->tids.nstids;
2191 	tid->stid_base = padap->tids.stid_base;
2192 	tid->hash_base = padap->tids.hash_base;
2193 
2194 	tid->natids = padap->tids.natids;
2195 	tid->nftids = padap->tids.nftids;
2196 	tid->ftid_base = padap->tids.ftid_base;
2197 	tid->aftid_base = padap->tids.aftid_base;
2198 	tid->aftid_end = padap->tids.aftid_end;
2199 
2200 	tid->sftid_base = padap->tids.sftid_base;
2201 	tid->nsftids = padap->tids.nsftids;
2202 
2203 	tid->flags = padap->flags;
2204 	tid->le_db_conf = t4_read_reg(padap, LE_DB_CONFIG_A);
2205 	tid->ip_users = t4_read_reg(padap, LE_DB_ACT_CNT_IPV4_A);
2206 	tid->ipv6_users = t4_read_reg(padap, LE_DB_ACT_CNT_IPV6_A);
2207 
2208 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2209 }
2210 
2211 int cudbg_collect_pcie_config(struct cudbg_init *pdbg_init,
2212 			      struct cudbg_buffer *dbg_buff,
2213 			      struct cudbg_error *cudbg_err)
2214 {
2215 	struct adapter *padap = pdbg_init->adap;
2216 	struct cudbg_buffer temp_buff = { 0 };
2217 	u32 size, *value, j;
2218 	int i, rc, n;
2219 
2220 	size = sizeof(u32) * CUDBG_NUM_PCIE_CONFIG_REGS;
2221 	n = sizeof(t5_pcie_config_array) / (2 * sizeof(u32));
2222 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2223 	if (rc)
2224 		return rc;
2225 
2226 	value = (u32 *)temp_buff.data;
2227 	for (i = 0; i < n; i++) {
2228 		for (j = t5_pcie_config_array[i][0];
2229 		     j <= t5_pcie_config_array[i][1]; j += 4) {
2230 			t4_hw_pci_read_cfg4(padap, j, value);
2231 			value++;
2232 		}
2233 	}
2234 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2235 }
2236 
2237 static int cudbg_sge_ctxt_check_valid(u32 *buf, int type)
2238 {
2239 	int index, bit, bit_pos = 0;
2240 
2241 	switch (type) {
2242 	case CTXT_EGRESS:
2243 		bit_pos = 176;
2244 		break;
2245 	case CTXT_INGRESS:
2246 		bit_pos = 141;
2247 		break;
2248 	case CTXT_FLM:
2249 		bit_pos = 89;
2250 		break;
2251 	}
2252 	index = bit_pos / 32;
2253 	bit =  bit_pos % 32;
2254 	return buf[index] & (1U << bit);
2255 }
2256 
2257 static int cudbg_get_ctxt_region_info(struct adapter *padap,
2258 				      struct cudbg_region_info *ctx_info,
2259 				      u8 *mem_type)
2260 {
2261 	struct cudbg_mem_desc mem_desc;
2262 	struct cudbg_meminfo meminfo;
2263 	u32 i, j, value, found;
2264 	u8 flq;
2265 	int rc;
2266 
2267 	rc = cudbg_fill_meminfo(padap, &meminfo);
2268 	if (rc)
2269 		return rc;
2270 
2271 	/* Get EGRESS and INGRESS context region size */
2272 	for (i = CTXT_EGRESS; i <= CTXT_INGRESS; i++) {
2273 		found = 0;
2274 		memset(&mem_desc, 0, sizeof(struct cudbg_mem_desc));
2275 		for (j = 0; j < ARRAY_SIZE(meminfo.avail); j++) {
2276 			rc = cudbg_get_mem_region(padap, &meminfo, j,
2277 						  cudbg_region[i],
2278 						  &mem_desc);
2279 			if (!rc) {
2280 				found = 1;
2281 				rc = cudbg_get_mem_relative(padap, &meminfo, j,
2282 							    &mem_desc.base,
2283 							    &mem_desc.limit);
2284 				if (rc) {
2285 					ctx_info[i].exist = false;
2286 					break;
2287 				}
2288 				ctx_info[i].exist = true;
2289 				ctx_info[i].start = mem_desc.base;
2290 				ctx_info[i].end = mem_desc.limit;
2291 				mem_type[i] = j;
2292 				break;
2293 			}
2294 		}
2295 		if (!found)
2296 			ctx_info[i].exist = false;
2297 	}
2298 
2299 	/* Get FLM and CNM max qid. */
2300 	value = t4_read_reg(padap, SGE_FLM_CFG_A);
2301 
2302 	/* Get number of data freelist queues */
2303 	flq = HDRSTARTFLQ_G(value);
2304 	ctx_info[CTXT_FLM].exist = true;
2305 	ctx_info[CTXT_FLM].end = (CUDBG_MAX_FL_QIDS >> flq) * SGE_CTXT_SIZE;
2306 
2307 	/* The number of CONM contexts are same as number of freelist
2308 	 * queues.
2309 	 */
2310 	ctx_info[CTXT_CNM].exist = true;
2311 	ctx_info[CTXT_CNM].end = ctx_info[CTXT_FLM].end;
2312 
2313 	return 0;
2314 }
2315 
2316 int cudbg_dump_context_size(struct adapter *padap)
2317 {
2318 	struct cudbg_region_info region_info[CTXT_CNM + 1] = { {0} };
2319 	u8 mem_type[CTXT_INGRESS + 1] = { 0 };
2320 	u32 i, size = 0;
2321 	int rc;
2322 
2323 	/* Get max valid qid for each type of queue */
2324 	rc = cudbg_get_ctxt_region_info(padap, region_info, mem_type);
2325 	if (rc)
2326 		return rc;
2327 
2328 	for (i = 0; i < CTXT_CNM; i++) {
2329 		if (!region_info[i].exist) {
2330 			if (i == CTXT_EGRESS || i == CTXT_INGRESS)
2331 				size += CUDBG_LOWMEM_MAX_CTXT_QIDS *
2332 					SGE_CTXT_SIZE;
2333 			continue;
2334 		}
2335 
2336 		size += (region_info[i].end - region_info[i].start + 1) /
2337 			SGE_CTXT_SIZE;
2338 	}
2339 	return size * sizeof(struct cudbg_ch_cntxt);
2340 }
2341 
2342 static void cudbg_read_sge_ctxt(struct cudbg_init *pdbg_init, u32 cid,
2343 				enum ctxt_type ctype, u32 *data)
2344 {
2345 	struct adapter *padap = pdbg_init->adap;
2346 	int rc = -1;
2347 
2348 	/* Under heavy traffic, the SGE Queue contexts registers will be
2349 	 * frequently accessed by firmware.
2350 	 *
2351 	 * To avoid conflicts with firmware, always ask firmware to fetch
2352 	 * the SGE Queue contexts via mailbox. On failure, fallback to
2353 	 * accessing hardware registers directly.
2354 	 */
2355 	if (is_fw_attached(pdbg_init))
2356 		rc = t4_sge_ctxt_rd(padap, padap->mbox, cid, ctype, data);
2357 	if (rc)
2358 		t4_sge_ctxt_rd_bd(padap, cid, ctype, data);
2359 }
2360 
2361 static void cudbg_get_sge_ctxt_fw(struct cudbg_init *pdbg_init, u32 max_qid,
2362 				  u8 ctxt_type,
2363 				  struct cudbg_ch_cntxt **out_buff)
2364 {
2365 	struct cudbg_ch_cntxt *buff = *out_buff;
2366 	int rc;
2367 	u32 j;
2368 
2369 	for (j = 0; j < max_qid; j++) {
2370 		cudbg_read_sge_ctxt(pdbg_init, j, ctxt_type, buff->data);
2371 		rc = cudbg_sge_ctxt_check_valid(buff->data, ctxt_type);
2372 		if (!rc)
2373 			continue;
2374 
2375 		buff->cntxt_type = ctxt_type;
2376 		buff->cntxt_id = j;
2377 		buff++;
2378 		if (ctxt_type == CTXT_FLM) {
2379 			cudbg_read_sge_ctxt(pdbg_init, j, CTXT_CNM, buff->data);
2380 			buff->cntxt_type = CTXT_CNM;
2381 			buff->cntxt_id = j;
2382 			buff++;
2383 		}
2384 	}
2385 
2386 	*out_buff = buff;
2387 }
2388 
2389 int cudbg_collect_dump_context(struct cudbg_init *pdbg_init,
2390 			       struct cudbg_buffer *dbg_buff,
2391 			       struct cudbg_error *cudbg_err)
2392 {
2393 	struct cudbg_region_info region_info[CTXT_CNM + 1] = { {0} };
2394 	struct adapter *padap = pdbg_init->adap;
2395 	u32 j, size, max_ctx_size, max_ctx_qid;
2396 	u8 mem_type[CTXT_INGRESS + 1] = { 0 };
2397 	struct cudbg_buffer temp_buff = { 0 };
2398 	struct cudbg_ch_cntxt *buff;
2399 	u8 *ctx_buf;
2400 	u8 i, k;
2401 	int rc;
2402 
2403 	/* Get max valid qid for each type of queue */
2404 	rc = cudbg_get_ctxt_region_info(padap, region_info, mem_type);
2405 	if (rc)
2406 		return rc;
2407 
2408 	rc = cudbg_dump_context_size(padap);
2409 	if (rc <= 0)
2410 		return CUDBG_STATUS_ENTITY_NOT_FOUND;
2411 
2412 	size = rc;
2413 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2414 	if (rc)
2415 		return rc;
2416 
2417 	/* Get buffer with enough space to read the biggest context
2418 	 * region in memory.
2419 	 */
2420 	max_ctx_size = max(region_info[CTXT_EGRESS].end -
2421 			   region_info[CTXT_EGRESS].start + 1,
2422 			   region_info[CTXT_INGRESS].end -
2423 			   region_info[CTXT_INGRESS].start + 1);
2424 
2425 	ctx_buf = kvzalloc(max_ctx_size, GFP_KERNEL);
2426 	if (!ctx_buf) {
2427 		cudbg_put_buff(pdbg_init, &temp_buff);
2428 		return -ENOMEM;
2429 	}
2430 
2431 	buff = (struct cudbg_ch_cntxt *)temp_buff.data;
2432 
2433 	/* Collect EGRESS and INGRESS context data.
2434 	 * In case of failures, fallback to collecting via FW or
2435 	 * backdoor access.
2436 	 */
2437 	for (i = CTXT_EGRESS; i <= CTXT_INGRESS; i++) {
2438 		if (!region_info[i].exist) {
2439 			max_ctx_qid = CUDBG_LOWMEM_MAX_CTXT_QIDS;
2440 			cudbg_get_sge_ctxt_fw(pdbg_init, max_ctx_qid, i,
2441 					      &buff);
2442 			continue;
2443 		}
2444 
2445 		max_ctx_size = region_info[i].end - region_info[i].start + 1;
2446 		max_ctx_qid = max_ctx_size / SGE_CTXT_SIZE;
2447 
2448 		/* If firmware is not attached/alive, use backdoor register
2449 		 * access to collect dump.
2450 		 */
2451 		if (is_fw_attached(pdbg_init)) {
2452 			t4_sge_ctxt_flush(padap, padap->mbox, i);
2453 
2454 			rc = t4_memory_rw(padap, MEMWIN_NIC, mem_type[i],
2455 					  region_info[i].start, max_ctx_size,
2456 					  (__be32 *)ctx_buf, 1);
2457 		}
2458 
2459 		if (rc || !is_fw_attached(pdbg_init)) {
2460 			max_ctx_qid = CUDBG_LOWMEM_MAX_CTXT_QIDS;
2461 			cudbg_get_sge_ctxt_fw(pdbg_init, max_ctx_qid, i,
2462 					      &buff);
2463 			continue;
2464 		}
2465 
2466 		for (j = 0; j < max_ctx_qid; j++) {
2467 			__be64 *dst_off;
2468 			u64 *src_off;
2469 
2470 			src_off = (u64 *)(ctx_buf + j * SGE_CTXT_SIZE);
2471 			dst_off = (__be64 *)buff->data;
2472 
2473 			/* The data is stored in 64-bit cpu order.  Convert it
2474 			 * to big endian before parsing.
2475 			 */
2476 			for (k = 0; k < SGE_CTXT_SIZE / sizeof(u64); k++)
2477 				dst_off[k] = cpu_to_be64(src_off[k]);
2478 
2479 			rc = cudbg_sge_ctxt_check_valid(buff->data, i);
2480 			if (!rc)
2481 				continue;
2482 
2483 			buff->cntxt_type = i;
2484 			buff->cntxt_id = j;
2485 			buff++;
2486 		}
2487 	}
2488 
2489 	kvfree(ctx_buf);
2490 
2491 	/* Collect FREELIST and CONGESTION MANAGER contexts */
2492 	max_ctx_size = region_info[CTXT_FLM].end -
2493 		       region_info[CTXT_FLM].start + 1;
2494 	max_ctx_qid = max_ctx_size / SGE_CTXT_SIZE;
2495 	/* Since FLM and CONM are 1-to-1 mapped, the below function
2496 	 * will fetch both FLM and CONM contexts.
2497 	 */
2498 	cudbg_get_sge_ctxt_fw(pdbg_init, max_ctx_qid, CTXT_FLM, &buff);
2499 
2500 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2501 }
2502 
2503 static inline void cudbg_tcamxy2valmask(u64 x, u64 y, u8 *addr, u64 *mask)
2504 {
2505 	*mask = x | y;
2506 	y = (__force u64)cpu_to_be64(y);
2507 	memcpy(addr, (char *)&y + 2, ETH_ALEN);
2508 }
2509 
2510 static void cudbg_mps_rpl_backdoor(struct adapter *padap,
2511 				   struct fw_ldst_mps_rplc *mps_rplc)
2512 {
2513 	if (is_t5(padap->params.chip)) {
2514 		mps_rplc->rplc255_224 = htonl(t4_read_reg(padap,
2515 							  MPS_VF_RPLCT_MAP3_A));
2516 		mps_rplc->rplc223_192 = htonl(t4_read_reg(padap,
2517 							  MPS_VF_RPLCT_MAP2_A));
2518 		mps_rplc->rplc191_160 = htonl(t4_read_reg(padap,
2519 							  MPS_VF_RPLCT_MAP1_A));
2520 		mps_rplc->rplc159_128 = htonl(t4_read_reg(padap,
2521 							  MPS_VF_RPLCT_MAP0_A));
2522 	} else {
2523 		mps_rplc->rplc255_224 = htonl(t4_read_reg(padap,
2524 							  MPS_VF_RPLCT_MAP7_A));
2525 		mps_rplc->rplc223_192 = htonl(t4_read_reg(padap,
2526 							  MPS_VF_RPLCT_MAP6_A));
2527 		mps_rplc->rplc191_160 = htonl(t4_read_reg(padap,
2528 							  MPS_VF_RPLCT_MAP5_A));
2529 		mps_rplc->rplc159_128 = htonl(t4_read_reg(padap,
2530 							  MPS_VF_RPLCT_MAP4_A));
2531 	}
2532 	mps_rplc->rplc127_96 = htonl(t4_read_reg(padap, MPS_VF_RPLCT_MAP3_A));
2533 	mps_rplc->rplc95_64 = htonl(t4_read_reg(padap, MPS_VF_RPLCT_MAP2_A));
2534 	mps_rplc->rplc63_32 = htonl(t4_read_reg(padap, MPS_VF_RPLCT_MAP1_A));
2535 	mps_rplc->rplc31_0 = htonl(t4_read_reg(padap, MPS_VF_RPLCT_MAP0_A));
2536 }
2537 
2538 static int cudbg_collect_tcam_index(struct cudbg_init *pdbg_init,
2539 				    struct cudbg_mps_tcam *tcam, u32 idx)
2540 {
2541 	struct adapter *padap = pdbg_init->adap;
2542 	u64 tcamy, tcamx, val;
2543 	u32 ctl, data2;
2544 	int rc = 0;
2545 
2546 	if (CHELSIO_CHIP_VERSION(padap->params.chip) >= CHELSIO_T6) {
2547 		/* CtlReqID   - 1: use Host Driver Requester ID
2548 		 * CtlCmdType - 0: Read, 1: Write
2549 		 * CtlTcamSel - 0: TCAM0, 1: TCAM1
2550 		 * CtlXYBitSel- 0: Y bit, 1: X bit
2551 		 */
2552 
2553 		/* Read tcamy */
2554 		ctl = CTLREQID_V(1) | CTLCMDTYPE_V(0) | CTLXYBITSEL_V(0);
2555 		if (idx < 256)
2556 			ctl |= CTLTCAMINDEX_V(idx) | CTLTCAMSEL_V(0);
2557 		else
2558 			ctl |= CTLTCAMINDEX_V(idx - 256) | CTLTCAMSEL_V(1);
2559 
2560 		t4_write_reg(padap, MPS_CLS_TCAM_DATA2_CTL_A, ctl);
2561 		val = t4_read_reg(padap, MPS_CLS_TCAM_RDATA1_REQ_ID1_A);
2562 		tcamy = DMACH_G(val) << 32;
2563 		tcamy |= t4_read_reg(padap, MPS_CLS_TCAM_RDATA0_REQ_ID1_A);
2564 		data2 = t4_read_reg(padap, MPS_CLS_TCAM_RDATA2_REQ_ID1_A);
2565 		tcam->lookup_type = DATALKPTYPE_G(data2);
2566 
2567 		/* 0 - Outer header, 1 - Inner header
2568 		 * [71:48] bit locations are overloaded for
2569 		 * outer vs. inner lookup types.
2570 		 */
2571 		if (tcam->lookup_type && tcam->lookup_type != DATALKPTYPE_M) {
2572 			/* Inner header VNI */
2573 			tcam->vniy = (data2 & DATAVIDH2_F) | DATAVIDH1_G(data2);
2574 			tcam->vniy = (tcam->vniy << 16) | VIDL_G(val);
2575 			tcam->dip_hit = data2 & DATADIPHIT_F;
2576 		} else {
2577 			tcam->vlan_vld = data2 & DATAVIDH2_F;
2578 			tcam->ivlan = VIDL_G(val);
2579 		}
2580 
2581 		tcam->port_num = DATAPORTNUM_G(data2);
2582 
2583 		/* Read tcamx. Change the control param */
2584 		ctl |= CTLXYBITSEL_V(1);
2585 		t4_write_reg(padap, MPS_CLS_TCAM_DATA2_CTL_A, ctl);
2586 		val = t4_read_reg(padap, MPS_CLS_TCAM_RDATA1_REQ_ID1_A);
2587 		tcamx = DMACH_G(val) << 32;
2588 		tcamx |= t4_read_reg(padap, MPS_CLS_TCAM_RDATA0_REQ_ID1_A);
2589 		data2 = t4_read_reg(padap, MPS_CLS_TCAM_RDATA2_REQ_ID1_A);
2590 		if (tcam->lookup_type && tcam->lookup_type != DATALKPTYPE_M) {
2591 			/* Inner header VNI mask */
2592 			tcam->vnix = (data2 & DATAVIDH2_F) | DATAVIDH1_G(data2);
2593 			tcam->vnix = (tcam->vnix << 16) | VIDL_G(val);
2594 		}
2595 	} else {
2596 		tcamy = t4_read_reg64(padap, MPS_CLS_TCAM_Y_L(idx));
2597 		tcamx = t4_read_reg64(padap, MPS_CLS_TCAM_X_L(idx));
2598 	}
2599 
2600 	/* If no entry, return */
2601 	if (tcamx & tcamy)
2602 		return rc;
2603 
2604 	tcam->cls_lo = t4_read_reg(padap, MPS_CLS_SRAM_L(idx));
2605 	tcam->cls_hi = t4_read_reg(padap, MPS_CLS_SRAM_H(idx));
2606 
2607 	if (is_t5(padap->params.chip))
2608 		tcam->repli = (tcam->cls_lo & REPLICATE_F);
2609 	else if (is_t6(padap->params.chip))
2610 		tcam->repli = (tcam->cls_lo & T6_REPLICATE_F);
2611 
2612 	if (tcam->repli) {
2613 		struct fw_ldst_cmd ldst_cmd;
2614 		struct fw_ldst_mps_rplc mps_rplc;
2615 
2616 		memset(&ldst_cmd, 0, sizeof(ldst_cmd));
2617 		ldst_cmd.op_to_addrspace =
2618 			htonl(FW_CMD_OP_V(FW_LDST_CMD) |
2619 			      FW_CMD_REQUEST_F | FW_CMD_READ_F |
2620 			      FW_LDST_CMD_ADDRSPACE_V(FW_LDST_ADDRSPC_MPS));
2621 		ldst_cmd.cycles_to_len16 = htonl(FW_LEN16(ldst_cmd));
2622 		ldst_cmd.u.mps.rplc.fid_idx =
2623 			htons(FW_LDST_CMD_FID_V(FW_LDST_MPS_RPLC) |
2624 			      FW_LDST_CMD_IDX_V(idx));
2625 
2626 		/* If firmware is not attached/alive, use backdoor register
2627 		 * access to collect dump.
2628 		 */
2629 		if (is_fw_attached(pdbg_init))
2630 			rc = t4_wr_mbox(padap, padap->mbox, &ldst_cmd,
2631 					sizeof(ldst_cmd), &ldst_cmd);
2632 
2633 		if (rc || !is_fw_attached(pdbg_init)) {
2634 			cudbg_mps_rpl_backdoor(padap, &mps_rplc);
2635 			/* Ignore error since we collected directly from
2636 			 * reading registers.
2637 			 */
2638 			rc = 0;
2639 		} else {
2640 			mps_rplc = ldst_cmd.u.mps.rplc;
2641 		}
2642 
2643 		tcam->rplc[0] = ntohl(mps_rplc.rplc31_0);
2644 		tcam->rplc[1] = ntohl(mps_rplc.rplc63_32);
2645 		tcam->rplc[2] = ntohl(mps_rplc.rplc95_64);
2646 		tcam->rplc[3] = ntohl(mps_rplc.rplc127_96);
2647 		if (padap->params.arch.mps_rplc_size > CUDBG_MAX_RPLC_SIZE) {
2648 			tcam->rplc[4] = ntohl(mps_rplc.rplc159_128);
2649 			tcam->rplc[5] = ntohl(mps_rplc.rplc191_160);
2650 			tcam->rplc[6] = ntohl(mps_rplc.rplc223_192);
2651 			tcam->rplc[7] = ntohl(mps_rplc.rplc255_224);
2652 		}
2653 	}
2654 	cudbg_tcamxy2valmask(tcamx, tcamy, tcam->addr, &tcam->mask);
2655 	tcam->idx = idx;
2656 	tcam->rplc_size = padap->params.arch.mps_rplc_size;
2657 	return rc;
2658 }
2659 
2660 int cudbg_collect_mps_tcam(struct cudbg_init *pdbg_init,
2661 			   struct cudbg_buffer *dbg_buff,
2662 			   struct cudbg_error *cudbg_err)
2663 {
2664 	struct adapter *padap = pdbg_init->adap;
2665 	struct cudbg_buffer temp_buff = { 0 };
2666 	u32 size = 0, i, n, total_size = 0;
2667 	struct cudbg_mps_tcam *tcam;
2668 	int rc;
2669 
2670 	n = padap->params.arch.mps_tcam_size;
2671 	size = sizeof(struct cudbg_mps_tcam) * n;
2672 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2673 	if (rc)
2674 		return rc;
2675 
2676 	tcam = (struct cudbg_mps_tcam *)temp_buff.data;
2677 	for (i = 0; i < n; i++) {
2678 		rc = cudbg_collect_tcam_index(pdbg_init, tcam, i);
2679 		if (rc) {
2680 			cudbg_err->sys_err = rc;
2681 			cudbg_put_buff(pdbg_init, &temp_buff);
2682 			return rc;
2683 		}
2684 		total_size += sizeof(struct cudbg_mps_tcam);
2685 		tcam++;
2686 	}
2687 
2688 	if (!total_size) {
2689 		rc = CUDBG_SYSTEM_ERROR;
2690 		cudbg_err->sys_err = rc;
2691 		cudbg_put_buff(pdbg_init, &temp_buff);
2692 		return rc;
2693 	}
2694 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2695 }
2696 
2697 int cudbg_collect_vpd_data(struct cudbg_init *pdbg_init,
2698 			   struct cudbg_buffer *dbg_buff,
2699 			   struct cudbg_error *cudbg_err)
2700 {
2701 	struct adapter *padap = pdbg_init->adap;
2702 	struct cudbg_buffer temp_buff = { 0 };
2703 	char vpd_str[CUDBG_VPD_VER_LEN + 1];
2704 	struct cudbg_vpd_data *vpd_data;
2705 	struct vpd_params vpd = { 0 };
2706 	u32 vpd_vers, fw_vers;
2707 	int rc;
2708 
2709 	rc = t4_get_raw_vpd_params(padap, &vpd);
2710 	if (rc)
2711 		return rc;
2712 
2713 	rc = t4_get_fw_version(padap, &fw_vers);
2714 	if (rc)
2715 		return rc;
2716 
2717 	rc = cudbg_read_vpd_reg(padap, CUDBG_VPD_VER_ADDR, CUDBG_VPD_VER_LEN,
2718 				vpd_str);
2719 	if (rc)
2720 		return rc;
2721 
2722 	vpd_str[CUDBG_VPD_VER_LEN] = '\0';
2723 	rc = kstrtouint(vpd_str, 0, &vpd_vers);
2724 	if (rc)
2725 		return rc;
2726 
2727 	rc = cudbg_get_buff(pdbg_init, dbg_buff, sizeof(struct cudbg_vpd_data),
2728 			    &temp_buff);
2729 	if (rc)
2730 		return rc;
2731 
2732 	vpd_data = (struct cudbg_vpd_data *)temp_buff.data;
2733 	memcpy(vpd_data->sn, vpd.sn, SERNUM_LEN + 1);
2734 	memcpy(vpd_data->bn, vpd.pn, PN_LEN + 1);
2735 	memcpy(vpd_data->na, vpd.na, MACADDR_LEN + 1);
2736 	memcpy(vpd_data->mn, vpd.id, ID_LEN + 1);
2737 	vpd_data->scfg_vers = t4_read_reg(padap, PCIE_STATIC_SPARE2_A);
2738 	vpd_data->vpd_vers = vpd_vers;
2739 	vpd_data->fw_major = FW_HDR_FW_VER_MAJOR_G(fw_vers);
2740 	vpd_data->fw_minor = FW_HDR_FW_VER_MINOR_G(fw_vers);
2741 	vpd_data->fw_micro = FW_HDR_FW_VER_MICRO_G(fw_vers);
2742 	vpd_data->fw_build = FW_HDR_FW_VER_BUILD_G(fw_vers);
2743 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2744 }
2745 
2746 static int cudbg_read_tid(struct cudbg_init *pdbg_init, u32 tid,
2747 			  struct cudbg_tid_data *tid_data)
2748 {
2749 	struct adapter *padap = pdbg_init->adap;
2750 	int i, cmd_retry = 8;
2751 	u32 val;
2752 
2753 	/* Fill REQ_DATA regs with 0's */
2754 	for (i = 0; i < NUM_LE_DB_DBGI_REQ_DATA_INSTANCES; i++)
2755 		t4_write_reg(padap, LE_DB_DBGI_REQ_DATA_A + (i << 2), 0);
2756 
2757 	/* Write DBIG command */
2758 	val = DBGICMD_V(4) | DBGITID_V(tid);
2759 	t4_write_reg(padap, LE_DB_DBGI_REQ_TCAM_CMD_A, val);
2760 	tid_data->dbig_cmd = val;
2761 
2762 	val = DBGICMDSTRT_F | DBGICMDMODE_V(1); /* LE mode */
2763 	t4_write_reg(padap, LE_DB_DBGI_CONFIG_A, val);
2764 	tid_data->dbig_conf = val;
2765 
2766 	/* Poll the DBGICMDBUSY bit */
2767 	val = 1;
2768 	while (val) {
2769 		val = t4_read_reg(padap, LE_DB_DBGI_CONFIG_A);
2770 		val = val & DBGICMDBUSY_F;
2771 		cmd_retry--;
2772 		if (!cmd_retry)
2773 			return CUDBG_SYSTEM_ERROR;
2774 	}
2775 
2776 	/* Check RESP status */
2777 	val = t4_read_reg(padap, LE_DB_DBGI_RSP_STATUS_A);
2778 	tid_data->dbig_rsp_stat = val;
2779 	if (!(val & 1))
2780 		return CUDBG_SYSTEM_ERROR;
2781 
2782 	/* Read RESP data */
2783 	for (i = 0; i < NUM_LE_DB_DBGI_RSP_DATA_INSTANCES; i++)
2784 		tid_data->data[i] = t4_read_reg(padap,
2785 						LE_DB_DBGI_RSP_DATA_A +
2786 						(i << 2));
2787 	tid_data->tid = tid;
2788 	return 0;
2789 }
2790 
2791 static int cudbg_get_le_type(u32 tid, struct cudbg_tcam tcam_region)
2792 {
2793 	int type = LE_ET_UNKNOWN;
2794 
2795 	if (tid < tcam_region.server_start)
2796 		type = LE_ET_TCAM_CON;
2797 	else if (tid < tcam_region.filter_start)
2798 		type = LE_ET_TCAM_SERVER;
2799 	else if (tid < tcam_region.clip_start)
2800 		type = LE_ET_TCAM_FILTER;
2801 	else if (tid < tcam_region.routing_start)
2802 		type = LE_ET_TCAM_CLIP;
2803 	else if (tid < tcam_region.tid_hash_base)
2804 		type = LE_ET_TCAM_ROUTING;
2805 	else if (tid < tcam_region.max_tid)
2806 		type = LE_ET_HASH_CON;
2807 	else
2808 		type = LE_ET_INVALID_TID;
2809 
2810 	return type;
2811 }
2812 
2813 static int cudbg_is_ipv6_entry(struct cudbg_tid_data *tid_data,
2814 			       struct cudbg_tcam tcam_region)
2815 {
2816 	int ipv6 = 0;
2817 	int le_type;
2818 
2819 	le_type = cudbg_get_le_type(tid_data->tid, tcam_region);
2820 	if (tid_data->tid & 1)
2821 		return 0;
2822 
2823 	if (le_type == LE_ET_HASH_CON) {
2824 		ipv6 = tid_data->data[16] & 0x8000;
2825 	} else if (le_type == LE_ET_TCAM_CON) {
2826 		ipv6 = tid_data->data[16] & 0x8000;
2827 		if (ipv6)
2828 			ipv6 = tid_data->data[9] == 0x00C00000;
2829 	} else {
2830 		ipv6 = 0;
2831 	}
2832 	return ipv6;
2833 }
2834 
2835 void cudbg_fill_le_tcam_info(struct adapter *padap,
2836 			     struct cudbg_tcam *tcam_region)
2837 {
2838 	u32 value;
2839 
2840 	/* Get the LE regions */
2841 	value = t4_read_reg(padap, LE_DB_TID_HASHBASE_A); /* hash base index */
2842 	tcam_region->tid_hash_base = value;
2843 
2844 	/* Get routing table index */
2845 	value = t4_read_reg(padap, LE_DB_ROUTING_TABLE_INDEX_A);
2846 	tcam_region->routing_start = value;
2847 
2848 	/* Get clip table index. For T6 there is separate CLIP TCAM */
2849 	if (is_t6(padap->params.chip))
2850 		value = t4_read_reg(padap, LE_DB_CLCAM_TID_BASE_A);
2851 	else
2852 		value = t4_read_reg(padap, LE_DB_CLIP_TABLE_INDEX_A);
2853 	tcam_region->clip_start = value;
2854 
2855 	/* Get filter table index */
2856 	value = t4_read_reg(padap, LE_DB_FILTER_TABLE_INDEX_A);
2857 	tcam_region->filter_start = value;
2858 
2859 	/* Get server table index */
2860 	value = t4_read_reg(padap, LE_DB_SERVER_INDEX_A);
2861 	tcam_region->server_start = value;
2862 
2863 	/* Check whether hash is enabled and calculate the max tids */
2864 	value = t4_read_reg(padap, LE_DB_CONFIG_A);
2865 	if ((value >> HASHEN_S) & 1) {
2866 		value = t4_read_reg(padap, LE_DB_HASH_CONFIG_A);
2867 		if (CHELSIO_CHIP_VERSION(padap->params.chip) > CHELSIO_T5) {
2868 			tcam_region->max_tid = (value & 0xFFFFF) +
2869 					       tcam_region->tid_hash_base;
2870 		} else {
2871 			value = HASHTIDSIZE_G(value);
2872 			value = 1 << value;
2873 			tcam_region->max_tid = value +
2874 					       tcam_region->tid_hash_base;
2875 		}
2876 	} else { /* hash not enabled */
2877 		if (is_t6(padap->params.chip))
2878 			tcam_region->max_tid = (value & ASLIPCOMPEN_F) ?
2879 					       CUDBG_MAX_TID_COMP_EN :
2880 					       CUDBG_MAX_TID_COMP_DIS;
2881 		else
2882 			tcam_region->max_tid = CUDBG_MAX_TCAM_TID;
2883 	}
2884 
2885 	if (is_t6(padap->params.chip))
2886 		tcam_region->max_tid += CUDBG_T6_CLIP;
2887 }
2888 
2889 int cudbg_collect_le_tcam(struct cudbg_init *pdbg_init,
2890 			  struct cudbg_buffer *dbg_buff,
2891 			  struct cudbg_error *cudbg_err)
2892 {
2893 	struct adapter *padap = pdbg_init->adap;
2894 	struct cudbg_buffer temp_buff = { 0 };
2895 	struct cudbg_tcam tcam_region = { 0 };
2896 	struct cudbg_tid_data *tid_data;
2897 	u32 bytes = 0;
2898 	int rc, size;
2899 	u32 i;
2900 
2901 	cudbg_fill_le_tcam_info(padap, &tcam_region);
2902 
2903 	size = sizeof(struct cudbg_tid_data) * tcam_region.max_tid;
2904 	size += sizeof(struct cudbg_tcam);
2905 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2906 	if (rc)
2907 		return rc;
2908 
2909 	memcpy(temp_buff.data, &tcam_region, sizeof(struct cudbg_tcam));
2910 	bytes = sizeof(struct cudbg_tcam);
2911 	tid_data = (struct cudbg_tid_data *)(temp_buff.data + bytes);
2912 	/* read all tid */
2913 	for (i = 0; i < tcam_region.max_tid; ) {
2914 		rc = cudbg_read_tid(pdbg_init, i, tid_data);
2915 		if (rc) {
2916 			cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
2917 			/* Update tcam header and exit */
2918 			tcam_region.max_tid = i;
2919 			memcpy(temp_buff.data, &tcam_region,
2920 			       sizeof(struct cudbg_tcam));
2921 			goto out;
2922 		}
2923 
2924 		if (cudbg_is_ipv6_entry(tid_data, tcam_region)) {
2925 			/* T6 CLIP TCAM: ipv6 takes 4 entries */
2926 			if (is_t6(padap->params.chip) &&
2927 			    i >= tcam_region.clip_start &&
2928 			    i < tcam_region.clip_start + CUDBG_T6_CLIP)
2929 				i += 4;
2930 			else /* Main TCAM: ipv6 takes two tids */
2931 				i += 2;
2932 		} else {
2933 			i++;
2934 		}
2935 
2936 		tid_data++;
2937 		bytes += sizeof(struct cudbg_tid_data);
2938 	}
2939 
2940 out:
2941 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2942 }
2943 
2944 int cudbg_collect_cctrl(struct cudbg_init *pdbg_init,
2945 			struct cudbg_buffer *dbg_buff,
2946 			struct cudbg_error *cudbg_err)
2947 {
2948 	struct adapter *padap = pdbg_init->adap;
2949 	struct cudbg_buffer temp_buff = { 0 };
2950 	u32 size;
2951 	int rc;
2952 
2953 	size = sizeof(u16) * NMTUS * NCCTRL_WIN;
2954 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2955 	if (rc)
2956 		return rc;
2957 
2958 	t4_read_cong_tbl(padap, (void *)temp_buff.data);
2959 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
2960 }
2961 
2962 int cudbg_collect_ma_indirect(struct cudbg_init *pdbg_init,
2963 			      struct cudbg_buffer *dbg_buff,
2964 			      struct cudbg_error *cudbg_err)
2965 {
2966 	struct adapter *padap = pdbg_init->adap;
2967 	struct cudbg_buffer temp_buff = { 0 };
2968 	struct ireg_buf *ma_indr;
2969 	int i, rc, n;
2970 	u32 size, j;
2971 
2972 	if (CHELSIO_CHIP_VERSION(padap->params.chip) < CHELSIO_T6)
2973 		return CUDBG_STATUS_ENTITY_NOT_FOUND;
2974 
2975 	n = sizeof(t6_ma_ireg_array) / (IREG_NUM_ELEM * sizeof(u32));
2976 	size = sizeof(struct ireg_buf) * n * 2;
2977 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
2978 	if (rc)
2979 		return rc;
2980 
2981 	ma_indr = (struct ireg_buf *)temp_buff.data;
2982 	for (i = 0; i < n; i++) {
2983 		struct ireg_field *ma_fli = &ma_indr->tp_pio;
2984 		u32 *buff = ma_indr->outbuf;
2985 
2986 		ma_fli->ireg_addr = t6_ma_ireg_array[i][0];
2987 		ma_fli->ireg_data = t6_ma_ireg_array[i][1];
2988 		ma_fli->ireg_local_offset = t6_ma_ireg_array[i][2];
2989 		ma_fli->ireg_offset_range = t6_ma_ireg_array[i][3];
2990 		t4_read_indirect(padap, ma_fli->ireg_addr, ma_fli->ireg_data,
2991 				 buff, ma_fli->ireg_offset_range,
2992 				 ma_fli->ireg_local_offset);
2993 		ma_indr++;
2994 	}
2995 
2996 	n = sizeof(t6_ma_ireg_array2) / (IREG_NUM_ELEM * sizeof(u32));
2997 	for (i = 0; i < n; i++) {
2998 		struct ireg_field *ma_fli = &ma_indr->tp_pio;
2999 		u32 *buff = ma_indr->outbuf;
3000 
3001 		ma_fli->ireg_addr = t6_ma_ireg_array2[i][0];
3002 		ma_fli->ireg_data = t6_ma_ireg_array2[i][1];
3003 		ma_fli->ireg_local_offset = t6_ma_ireg_array2[i][2];
3004 		for (j = 0; j < t6_ma_ireg_array2[i][3]; j++) {
3005 			t4_read_indirect(padap, ma_fli->ireg_addr,
3006 					 ma_fli->ireg_data, buff, 1,
3007 					 ma_fli->ireg_local_offset);
3008 			buff++;
3009 			ma_fli->ireg_local_offset += 0x20;
3010 		}
3011 		ma_indr++;
3012 	}
3013 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
3014 }
3015 
3016 int cudbg_collect_ulptx_la(struct cudbg_init *pdbg_init,
3017 			   struct cudbg_buffer *dbg_buff,
3018 			   struct cudbg_error *cudbg_err)
3019 {
3020 	struct adapter *padap = pdbg_init->adap;
3021 	struct cudbg_buffer temp_buff = { 0 };
3022 	struct cudbg_ulptx_la *ulptx_la_buff;
3023 	struct cudbg_ver_hdr *ver_hdr;
3024 	u32 i, j;
3025 	int rc;
3026 
3027 	rc = cudbg_get_buff(pdbg_init, dbg_buff,
3028 			    sizeof(struct cudbg_ver_hdr) +
3029 			    sizeof(struct cudbg_ulptx_la),
3030 			    &temp_buff);
3031 	if (rc)
3032 		return rc;
3033 
3034 	ver_hdr = (struct cudbg_ver_hdr *)temp_buff.data;
3035 	ver_hdr->signature = CUDBG_ENTITY_SIGNATURE;
3036 	ver_hdr->revision = CUDBG_ULPTX_LA_REV;
3037 	ver_hdr->size = sizeof(struct cudbg_ulptx_la);
3038 
3039 	ulptx_la_buff = (struct cudbg_ulptx_la *)(temp_buff.data +
3040 						  sizeof(*ver_hdr));
3041 	for (i = 0; i < CUDBG_NUM_ULPTX; i++) {
3042 		ulptx_la_buff->rdptr[i] = t4_read_reg(padap,
3043 						      ULP_TX_LA_RDPTR_0_A +
3044 						      0x10 * i);
3045 		ulptx_la_buff->wrptr[i] = t4_read_reg(padap,
3046 						      ULP_TX_LA_WRPTR_0_A +
3047 						      0x10 * i);
3048 		ulptx_la_buff->rddata[i] = t4_read_reg(padap,
3049 						       ULP_TX_LA_RDDATA_0_A +
3050 						       0x10 * i);
3051 		for (j = 0; j < CUDBG_NUM_ULPTX_READ; j++)
3052 			ulptx_la_buff->rd_data[i][j] =
3053 				t4_read_reg(padap,
3054 					    ULP_TX_LA_RDDATA_0_A + 0x10 * i);
3055 	}
3056 
3057 	for (i = 0; i < CUDBG_NUM_ULPTX_ASIC_READ; i++) {
3058 		t4_write_reg(padap, ULP_TX_ASIC_DEBUG_CTRL_A, 0x1);
3059 		ulptx_la_buff->rdptr_asic[i] =
3060 				t4_read_reg(padap, ULP_TX_ASIC_DEBUG_CTRL_A);
3061 		ulptx_la_buff->rddata_asic[i][0] =
3062 				t4_read_reg(padap, ULP_TX_ASIC_DEBUG_0_A);
3063 		ulptx_la_buff->rddata_asic[i][1] =
3064 				t4_read_reg(padap, ULP_TX_ASIC_DEBUG_1_A);
3065 		ulptx_la_buff->rddata_asic[i][2] =
3066 				t4_read_reg(padap, ULP_TX_ASIC_DEBUG_2_A);
3067 		ulptx_la_buff->rddata_asic[i][3] =
3068 				t4_read_reg(padap, ULP_TX_ASIC_DEBUG_3_A);
3069 		ulptx_la_buff->rddata_asic[i][4] =
3070 				t4_read_reg(padap, ULP_TX_ASIC_DEBUG_4_A);
3071 		ulptx_la_buff->rddata_asic[i][5] =
3072 				t4_read_reg(padap, PM_RX_BASE_ADDR);
3073 	}
3074 
3075 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
3076 }
3077 
3078 int cudbg_collect_up_cim_indirect(struct cudbg_init *pdbg_init,
3079 				  struct cudbg_buffer *dbg_buff,
3080 				  struct cudbg_error *cudbg_err)
3081 {
3082 	struct adapter *padap = pdbg_init->adap;
3083 	struct cudbg_buffer temp_buff = { 0 };
3084 	u32 local_offset, local_range;
3085 	struct ireg_buf *up_cim;
3086 	u32 size, j, iter;
3087 	u32 instance = 0;
3088 	int i, rc, n;
3089 
3090 	if (is_t5(padap->params.chip))
3091 		n = sizeof(t5_up_cim_reg_array) /
3092 		    ((IREG_NUM_ELEM + 1) * sizeof(u32));
3093 	else if (is_t6(padap->params.chip))
3094 		n = sizeof(t6_up_cim_reg_array) /
3095 		    ((IREG_NUM_ELEM + 1) * sizeof(u32));
3096 	else
3097 		return CUDBG_STATUS_NOT_IMPLEMENTED;
3098 
3099 	size = sizeof(struct ireg_buf) * n;
3100 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
3101 	if (rc)
3102 		return rc;
3103 
3104 	up_cim = (struct ireg_buf *)temp_buff.data;
3105 	for (i = 0; i < n; i++) {
3106 		struct ireg_field *up_cim_reg = &up_cim->tp_pio;
3107 		u32 *buff = up_cim->outbuf;
3108 
3109 		if (is_t5(padap->params.chip)) {
3110 			up_cim_reg->ireg_addr = t5_up_cim_reg_array[i][0];
3111 			up_cim_reg->ireg_data = t5_up_cim_reg_array[i][1];
3112 			up_cim_reg->ireg_local_offset =
3113 						t5_up_cim_reg_array[i][2];
3114 			up_cim_reg->ireg_offset_range =
3115 						t5_up_cim_reg_array[i][3];
3116 			instance = t5_up_cim_reg_array[i][4];
3117 		} else if (is_t6(padap->params.chip)) {
3118 			up_cim_reg->ireg_addr = t6_up_cim_reg_array[i][0];
3119 			up_cim_reg->ireg_data = t6_up_cim_reg_array[i][1];
3120 			up_cim_reg->ireg_local_offset =
3121 						t6_up_cim_reg_array[i][2];
3122 			up_cim_reg->ireg_offset_range =
3123 						t6_up_cim_reg_array[i][3];
3124 			instance = t6_up_cim_reg_array[i][4];
3125 		}
3126 
3127 		switch (instance) {
3128 		case NUM_CIM_CTL_TSCH_CHANNEL_INSTANCES:
3129 			iter = up_cim_reg->ireg_offset_range;
3130 			local_offset = 0x120;
3131 			local_range = 1;
3132 			break;
3133 		case NUM_CIM_CTL_TSCH_CHANNEL_TSCH_CLASS_INSTANCES:
3134 			iter = up_cim_reg->ireg_offset_range;
3135 			local_offset = 0x10;
3136 			local_range = 1;
3137 			break;
3138 		default:
3139 			iter = 1;
3140 			local_offset = 0;
3141 			local_range = up_cim_reg->ireg_offset_range;
3142 			break;
3143 		}
3144 
3145 		for (j = 0; j < iter; j++, buff++) {
3146 			rc = t4_cim_read(padap,
3147 					 up_cim_reg->ireg_local_offset +
3148 					 (j * local_offset), local_range, buff);
3149 			if (rc) {
3150 				cudbg_put_buff(pdbg_init, &temp_buff);
3151 				return rc;
3152 			}
3153 		}
3154 		up_cim++;
3155 	}
3156 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
3157 }
3158 
3159 int cudbg_collect_pbt_tables(struct cudbg_init *pdbg_init,
3160 			     struct cudbg_buffer *dbg_buff,
3161 			     struct cudbg_error *cudbg_err)
3162 {
3163 	struct adapter *padap = pdbg_init->adap;
3164 	struct cudbg_buffer temp_buff = { 0 };
3165 	struct cudbg_pbt_tables *pbt;
3166 	int i, rc;
3167 	u32 addr;
3168 
3169 	rc = cudbg_get_buff(pdbg_init, dbg_buff,
3170 			    sizeof(struct cudbg_pbt_tables),
3171 			    &temp_buff);
3172 	if (rc)
3173 		return rc;
3174 
3175 	pbt = (struct cudbg_pbt_tables *)temp_buff.data;
3176 	/* PBT dynamic entries */
3177 	addr = CUDBG_CHAC_PBT_ADDR;
3178 	for (i = 0; i < CUDBG_PBT_DYNAMIC_ENTRIES; i++) {
3179 		rc = t4_cim_read(padap, addr + (i * 4), 1,
3180 				 &pbt->pbt_dynamic[i]);
3181 		if (rc) {
3182 			cudbg_err->sys_err = rc;
3183 			cudbg_put_buff(pdbg_init, &temp_buff);
3184 			return rc;
3185 		}
3186 	}
3187 
3188 	/* PBT static entries */
3189 	/* static entries start when bit 6 is set */
3190 	addr = CUDBG_CHAC_PBT_ADDR + (1 << 6);
3191 	for (i = 0; i < CUDBG_PBT_STATIC_ENTRIES; i++) {
3192 		rc = t4_cim_read(padap, addr + (i * 4), 1,
3193 				 &pbt->pbt_static[i]);
3194 		if (rc) {
3195 			cudbg_err->sys_err = rc;
3196 			cudbg_put_buff(pdbg_init, &temp_buff);
3197 			return rc;
3198 		}
3199 	}
3200 
3201 	/* LRF entries */
3202 	addr = CUDBG_CHAC_PBT_LRF;
3203 	for (i = 0; i < CUDBG_LRF_ENTRIES; i++) {
3204 		rc = t4_cim_read(padap, addr + (i * 4), 1,
3205 				 &pbt->lrf_table[i]);
3206 		if (rc) {
3207 			cudbg_err->sys_err = rc;
3208 			cudbg_put_buff(pdbg_init, &temp_buff);
3209 			return rc;
3210 		}
3211 	}
3212 
3213 	/* PBT data entries */
3214 	addr = CUDBG_CHAC_PBT_DATA;
3215 	for (i = 0; i < CUDBG_PBT_DATA_ENTRIES; i++) {
3216 		rc = t4_cim_read(padap, addr + (i * 4), 1,
3217 				 &pbt->pbt_data[i]);
3218 		if (rc) {
3219 			cudbg_err->sys_err = rc;
3220 			cudbg_put_buff(pdbg_init, &temp_buff);
3221 			return rc;
3222 		}
3223 	}
3224 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
3225 }
3226 
3227 int cudbg_collect_mbox_log(struct cudbg_init *pdbg_init,
3228 			   struct cudbg_buffer *dbg_buff,
3229 			   struct cudbg_error *cudbg_err)
3230 {
3231 	struct adapter *padap = pdbg_init->adap;
3232 	struct cudbg_mbox_log *mboxlog = NULL;
3233 	struct cudbg_buffer temp_buff = { 0 };
3234 	struct mbox_cmd_log *log = NULL;
3235 	struct mbox_cmd *entry;
3236 	unsigned int entry_idx;
3237 	u16 mbox_cmds;
3238 	int i, k, rc;
3239 	u64 flit;
3240 	u32 size;
3241 
3242 	log = padap->mbox_log;
3243 	mbox_cmds = padap->mbox_log->size;
3244 	size = sizeof(struct cudbg_mbox_log) * mbox_cmds;
3245 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
3246 	if (rc)
3247 		return rc;
3248 
3249 	mboxlog = (struct cudbg_mbox_log *)temp_buff.data;
3250 	for (k = 0; k < mbox_cmds; k++) {
3251 		entry_idx = log->cursor + k;
3252 		if (entry_idx >= log->size)
3253 			entry_idx -= log->size;
3254 
3255 		entry = mbox_cmd_log_entry(log, entry_idx);
3256 		/* skip over unused entries */
3257 		if (entry->timestamp == 0)
3258 			continue;
3259 
3260 		memcpy(&mboxlog->entry, entry, sizeof(struct mbox_cmd));
3261 		for (i = 0; i < MBOX_LEN / 8; i++) {
3262 			flit = entry->cmd[i];
3263 			mboxlog->hi[i] = (u32)(flit >> 32);
3264 			mboxlog->lo[i] = (u32)flit;
3265 		}
3266 		mboxlog++;
3267 	}
3268 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
3269 }
3270 
3271 int cudbg_collect_hma_indirect(struct cudbg_init *pdbg_init,
3272 			       struct cudbg_buffer *dbg_buff,
3273 			       struct cudbg_error *cudbg_err)
3274 {
3275 	struct adapter *padap = pdbg_init->adap;
3276 	struct cudbg_buffer temp_buff = { 0 };
3277 	struct ireg_buf *hma_indr;
3278 	int i, rc, n;
3279 	u32 size;
3280 
3281 	if (CHELSIO_CHIP_VERSION(padap->params.chip) < CHELSIO_T6)
3282 		return CUDBG_STATUS_ENTITY_NOT_FOUND;
3283 
3284 	n = sizeof(t6_hma_ireg_array) / (IREG_NUM_ELEM * sizeof(u32));
3285 	size = sizeof(struct ireg_buf) * n;
3286 	rc = cudbg_get_buff(pdbg_init, dbg_buff, size, &temp_buff);
3287 	if (rc)
3288 		return rc;
3289 
3290 	hma_indr = (struct ireg_buf *)temp_buff.data;
3291 	for (i = 0; i < n; i++) {
3292 		struct ireg_field *hma_fli = &hma_indr->tp_pio;
3293 		u32 *buff = hma_indr->outbuf;
3294 
3295 		hma_fli->ireg_addr = t6_hma_ireg_array[i][0];
3296 		hma_fli->ireg_data = t6_hma_ireg_array[i][1];
3297 		hma_fli->ireg_local_offset = t6_hma_ireg_array[i][2];
3298 		hma_fli->ireg_offset_range = t6_hma_ireg_array[i][3];
3299 		t4_read_indirect(padap, hma_fli->ireg_addr, hma_fli->ireg_data,
3300 				 buff, hma_fli->ireg_offset_range,
3301 				 hma_fli->ireg_local_offset);
3302 		hma_indr++;
3303 	}
3304 	return cudbg_write_and_release_buff(pdbg_init, &temp_buff, dbg_buff);
3305 }
3306 
3307 void cudbg_fill_qdesc_num_and_size(const struct adapter *padap,
3308 				   u32 *num, u32 *size)
3309 {
3310 	u32 tot_entries = 0, tot_size = 0;
3311 
3312 	/* NIC TXQ, RXQ, FLQ, and CTRLQ */
3313 	tot_entries += MAX_ETH_QSETS * 3;
3314 	tot_entries += MAX_CTRL_QUEUES;
3315 
3316 	tot_size += MAX_ETH_QSETS * MAX_TXQ_ENTRIES * MAX_TXQ_DESC_SIZE;
3317 	tot_size += MAX_ETH_QSETS * MAX_RSPQ_ENTRIES * MAX_RXQ_DESC_SIZE;
3318 	tot_size += MAX_ETH_QSETS * MAX_RX_BUFFERS * MAX_FL_DESC_SIZE;
3319 	tot_size += MAX_CTRL_QUEUES * MAX_CTRL_TXQ_ENTRIES *
3320 		    MAX_CTRL_TXQ_DESC_SIZE;
3321 
3322 	/* FW_EVTQ and INTRQ */
3323 	tot_entries += INGQ_EXTRAS;
3324 	tot_size += INGQ_EXTRAS * MAX_RSPQ_ENTRIES * MAX_RXQ_DESC_SIZE;
3325 
3326 	/* PTP_TXQ */
3327 	tot_entries += 1;
3328 	tot_size += MAX_TXQ_ENTRIES * MAX_TXQ_DESC_SIZE;
3329 
3330 	/* ULD TXQ, RXQ, and FLQ */
3331 	tot_entries += CXGB4_TX_MAX * MAX_OFLD_QSETS;
3332 	tot_entries += CXGB4_ULD_MAX * MAX_ULD_QSETS * 2;
3333 
3334 	tot_size += CXGB4_TX_MAX * MAX_OFLD_QSETS * MAX_TXQ_ENTRIES *
3335 		    MAX_TXQ_DESC_SIZE;
3336 	tot_size += CXGB4_ULD_MAX * MAX_ULD_QSETS * MAX_RSPQ_ENTRIES *
3337 		    MAX_RXQ_DESC_SIZE;
3338 	tot_size += CXGB4_ULD_MAX * MAX_ULD_QSETS * MAX_RX_BUFFERS *
3339 		    MAX_FL_DESC_SIZE;
3340 
3341 	/* ULD CIQ */
3342 	tot_entries += CXGB4_ULD_MAX * MAX_ULD_QSETS;
3343 	tot_size += CXGB4_ULD_MAX * MAX_ULD_QSETS * SGE_MAX_IQ_SIZE *
3344 		    MAX_RXQ_DESC_SIZE;
3345 
3346 	/* ETHOFLD TXQ, RXQ, and FLQ */
3347 	tot_entries += MAX_OFLD_QSETS * 3;
3348 	tot_size += MAX_OFLD_QSETS * MAX_TXQ_ENTRIES * MAX_TXQ_DESC_SIZE;
3349 
3350 	tot_size += sizeof(struct cudbg_ver_hdr) +
3351 		    sizeof(struct cudbg_qdesc_info) +
3352 		    sizeof(struct cudbg_qdesc_entry) * tot_entries;
3353 
3354 	if (num)
3355 		*num = tot_entries;
3356 
3357 	if (size)
3358 		*size = tot_size;
3359 }
3360 
3361 int cudbg_collect_qdesc(struct cudbg_init *pdbg_init,
3362 			struct cudbg_buffer *dbg_buff,
3363 			struct cudbg_error *cudbg_err)
3364 {
3365 	u32 num_queues = 0, tot_entries = 0, size = 0;
3366 	struct adapter *padap = pdbg_init->adap;
3367 	struct cudbg_buffer temp_buff = { 0 };
3368 	struct cudbg_qdesc_entry *qdesc_entry;
3369 	struct cudbg_qdesc_info *qdesc_info;
3370 	struct cudbg_ver_hdr *ver_hdr;
3371 	struct sge *s = &padap->sge;
3372 	u32 i, j, cur_off, tot_len;
3373 	u8 *data;
3374 	int rc;
3375 
3376 	cudbg_fill_qdesc_num_and_size(padap, &tot_entries, &size);
3377 	size = min_t(u32, size, CUDBG_DUMP_BUFF_SIZE);
3378 	tot_len = size;
3379 	data = kvzalloc(size, GFP_KERNEL);
3380 	if (!data)
3381 		return -ENOMEM;
3382 
3383 	ver_hdr = (struct cudbg_ver_hdr *)data;
3384 	ver_hdr->signature = CUDBG_ENTITY_SIGNATURE;
3385 	ver_hdr->revision = CUDBG_QDESC_REV;
3386 	ver_hdr->size = sizeof(struct cudbg_qdesc_info);
3387 	size -= sizeof(*ver_hdr);
3388 
3389 	qdesc_info = (struct cudbg_qdesc_info *)(data +
3390 						 sizeof(*ver_hdr));
3391 	size -= sizeof(*qdesc_info);
3392 	qdesc_entry = (struct cudbg_qdesc_entry *)qdesc_info->data;
3393 
3394 #define QDESC_GET(q, desc, type, label) do { \
3395 	if (size <= 0) { \
3396 		goto label; \
3397 	} \
3398 	if (desc) { \
3399 		cudbg_fill_qdesc_##q(q, type, qdesc_entry); \
3400 		size -= sizeof(*qdesc_entry) + qdesc_entry->data_size; \
3401 		num_queues++; \
3402 		qdesc_entry = cudbg_next_qdesc(qdesc_entry); \
3403 	} \
3404 } while (0)
3405 
3406 #define QDESC_GET_TXQ(q, type, label) do { \
3407 	struct sge_txq *txq = (struct sge_txq *)q; \
3408 	QDESC_GET(txq, txq->desc, type, label); \
3409 } while (0)
3410 
3411 #define QDESC_GET_RXQ(q, type, label) do { \
3412 	struct sge_rspq *rxq = (struct sge_rspq *)q; \
3413 	QDESC_GET(rxq, rxq->desc, type, label); \
3414 } while (0)
3415 
3416 #define QDESC_GET_FLQ(q, type, label) do { \
3417 	struct sge_fl *flq = (struct sge_fl *)q; \
3418 	QDESC_GET(flq, flq->desc, type, label); \
3419 } while (0)
3420 
3421 	/* NIC TXQ */
3422 	for (i = 0; i < s->ethqsets; i++)
3423 		QDESC_GET_TXQ(&s->ethtxq[i].q, CUDBG_QTYPE_NIC_TXQ, out);
3424 
3425 	/* NIC RXQ */
3426 	for (i = 0; i < s->ethqsets; i++)
3427 		QDESC_GET_RXQ(&s->ethrxq[i].rspq, CUDBG_QTYPE_NIC_RXQ, out);
3428 
3429 	/* NIC FLQ */
3430 	for (i = 0; i < s->ethqsets; i++)
3431 		QDESC_GET_FLQ(&s->ethrxq[i].fl, CUDBG_QTYPE_NIC_FLQ, out);
3432 
3433 	/* NIC CTRLQ */
3434 	for (i = 0; i < padap->params.nports; i++)
3435 		QDESC_GET_TXQ(&s->ctrlq[i].q, CUDBG_QTYPE_CTRLQ, out);
3436 
3437 	/* FW_EVTQ */
3438 	QDESC_GET_RXQ(&s->fw_evtq, CUDBG_QTYPE_FWEVTQ, out);
3439 
3440 	/* INTRQ */
3441 	QDESC_GET_RXQ(&s->intrq, CUDBG_QTYPE_INTRQ, out);
3442 
3443 	/* PTP_TXQ */
3444 	QDESC_GET_TXQ(&s->ptptxq.q, CUDBG_QTYPE_PTP_TXQ, out);
3445 
3446 	/* ULD Queues */
3447 	mutex_lock(&uld_mutex);
3448 
3449 	if (s->uld_txq_info) {
3450 		struct sge_uld_txq_info *utxq;
3451 
3452 		/* ULD TXQ */
3453 		for (j = 0; j < CXGB4_TX_MAX; j++) {
3454 			if (!s->uld_txq_info[j])
3455 				continue;
3456 
3457 			utxq = s->uld_txq_info[j];
3458 			for (i = 0; i < utxq->ntxq; i++)
3459 				QDESC_GET_TXQ(&utxq->uldtxq[i].q,
3460 					      cudbg_uld_txq_to_qtype(j),
3461 					      out_unlock);
3462 		}
3463 	}
3464 
3465 	if (s->uld_rxq_info) {
3466 		struct sge_uld_rxq_info *urxq;
3467 		u32 base;
3468 
3469 		/* ULD RXQ */
3470 		for (j = 0; j < CXGB4_ULD_MAX; j++) {
3471 			if (!s->uld_rxq_info[j])
3472 				continue;
3473 
3474 			urxq = s->uld_rxq_info[j];
3475 			for (i = 0; i < urxq->nrxq; i++)
3476 				QDESC_GET_RXQ(&urxq->uldrxq[i].rspq,
3477 					      cudbg_uld_rxq_to_qtype(j),
3478 					      out_unlock);
3479 		}
3480 
3481 		/* ULD FLQ */
3482 		for (j = 0; j < CXGB4_ULD_MAX; j++) {
3483 			if (!s->uld_rxq_info[j])
3484 				continue;
3485 
3486 			urxq = s->uld_rxq_info[j];
3487 			for (i = 0; i < urxq->nrxq; i++)
3488 				QDESC_GET_FLQ(&urxq->uldrxq[i].fl,
3489 					      cudbg_uld_flq_to_qtype(j),
3490 					      out_unlock);
3491 		}
3492 
3493 		/* ULD CIQ */
3494 		for (j = 0; j < CXGB4_ULD_MAX; j++) {
3495 			if (!s->uld_rxq_info[j])
3496 				continue;
3497 
3498 			urxq = s->uld_rxq_info[j];
3499 			base = urxq->nrxq;
3500 			for (i = 0; i < urxq->nciq; i++)
3501 				QDESC_GET_RXQ(&urxq->uldrxq[base + i].rspq,
3502 					      cudbg_uld_ciq_to_qtype(j),
3503 					      out_unlock);
3504 		}
3505 	}
3506 
3507 	/* ETHOFLD TXQ */
3508 	if (s->eohw_txq)
3509 		for (i = 0; i < s->eoqsets; i++)
3510 			QDESC_GET_TXQ(&s->eohw_txq[i].q,
3511 				      CUDBG_QTYPE_ETHOFLD_TXQ, out);
3512 
3513 	/* ETHOFLD RXQ and FLQ */
3514 	if (s->eohw_rxq) {
3515 		for (i = 0; i < s->eoqsets; i++)
3516 			QDESC_GET_RXQ(&s->eohw_rxq[i].rspq,
3517 				      CUDBG_QTYPE_ETHOFLD_RXQ, out);
3518 
3519 		for (i = 0; i < s->eoqsets; i++)
3520 			QDESC_GET_FLQ(&s->eohw_rxq[i].fl,
3521 				      CUDBG_QTYPE_ETHOFLD_FLQ, out);
3522 	}
3523 
3524 out_unlock:
3525 	mutex_unlock(&uld_mutex);
3526 
3527 out:
3528 	qdesc_info->qdesc_entry_size = sizeof(*qdesc_entry);
3529 	qdesc_info->num_queues = num_queues;
3530 	cur_off = 0;
3531 	while (tot_len) {
3532 		u32 chunk_size = min_t(u32, tot_len, CUDBG_CHUNK_SIZE);
3533 
3534 		rc = cudbg_get_buff(pdbg_init, dbg_buff, chunk_size,
3535 				    &temp_buff);
3536 		if (rc) {
3537 			cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
3538 			goto out_free;
3539 		}
3540 
3541 		memcpy(temp_buff.data, data + cur_off, chunk_size);
3542 		tot_len -= chunk_size;
3543 		cur_off += chunk_size;
3544 		rc = cudbg_write_and_release_buff(pdbg_init, &temp_buff,
3545 						  dbg_buff);
3546 		if (rc) {
3547 			cudbg_put_buff(pdbg_init, &temp_buff);
3548 			cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
3549 			goto out_free;
3550 		}
3551 	}
3552 
3553 out_free:
3554 	kvfree(data);
3555 
3556 #undef QDESC_GET_FLQ
3557 #undef QDESC_GET_RXQ
3558 #undef QDESC_GET_TXQ
3559 #undef QDESC_GET
3560 
3561 	return rc;
3562 }
3563 
3564 int cudbg_collect_flash(struct cudbg_init *pdbg_init,
3565 			struct cudbg_buffer *dbg_buff,
3566 			struct cudbg_error *cudbg_err)
3567 {
3568 	struct adapter *padap = pdbg_init->adap;
3569 	u32 count = padap->params.sf_size, n;
3570 	struct cudbg_buffer temp_buff = {0};
3571 	u32 addr, i;
3572 	int rc;
3573 
3574 	addr = FLASH_EXP_ROM_START;
3575 
3576 	for (i = 0; i < count; i += SF_PAGE_SIZE) {
3577 		n = min_t(u32, count - i, SF_PAGE_SIZE);
3578 
3579 		rc = cudbg_get_buff(pdbg_init, dbg_buff, n, &temp_buff);
3580 		if (rc) {
3581 			cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
3582 			goto out;
3583 		}
3584 		rc = t4_read_flash(padap, addr, n, (u32 *)temp_buff.data, 0);
3585 		if (rc)
3586 			goto out;
3587 
3588 		addr += (n * 4);
3589 		rc = cudbg_write_and_release_buff(pdbg_init, &temp_buff,
3590 						  dbg_buff);
3591 		if (rc) {
3592 			cudbg_err->sys_warn = CUDBG_STATUS_PARTIAL_DATA;
3593 			goto out;
3594 		}
3595 	}
3596 
3597 out:
3598 	return rc;
3599 }
3600