xref: /linux/drivers/crypto/hisilicon/hpre/hpre_main.c (revision 001821b0e79716c4e17c71d8e053a23599a7a508)
1 // SPDX-License-Identifier: GPL-2.0
2 /* Copyright (c) 2018-2019 HiSilicon Limited. */
3 #include <linux/acpi.h>
4 #include <linux/bitops.h>
5 #include <linux/debugfs.h>
6 #include <linux/init.h>
7 #include <linux/io.h>
8 #include <linux/kernel.h>
9 #include <linux/module.h>
10 #include <linux/pci.h>
11 #include <linux/pm_runtime.h>
12 #include <linux/topology.h>
13 #include <linux/uacce.h>
14 #include "hpre.h"
15 
16 #define HPRE_QM_ABNML_INT_MASK		0x100004
17 #define HPRE_CTRL_CNT_CLR_CE_BIT	BIT(0)
18 #define HPRE_COMM_CNT_CLR_CE		0x0
19 #define HPRE_CTRL_CNT_CLR_CE		0x301000
20 #define HPRE_FSM_MAX_CNT		0x301008
21 #define HPRE_VFG_AXQOS			0x30100c
22 #define HPRE_VFG_AXCACHE		0x301010
23 #define HPRE_RDCHN_INI_CFG		0x301014
24 #define HPRE_AWUSR_FP_CFG		0x301018
25 #define HPRE_BD_ENDIAN			0x301020
26 #define HPRE_ECC_BYPASS			0x301024
27 #define HPRE_RAS_WIDTH_CFG		0x301028
28 #define HPRE_POISON_BYPASS		0x30102c
29 #define HPRE_BD_ARUSR_CFG		0x301030
30 #define HPRE_BD_AWUSR_CFG		0x301034
31 #define HPRE_TYPES_ENB			0x301038
32 #define HPRE_RSA_ENB			BIT(0)
33 #define HPRE_ECC_ENB			BIT(1)
34 #define HPRE_DATA_RUSER_CFG		0x30103c
35 #define HPRE_DATA_WUSER_CFG		0x301040
36 #define HPRE_INT_MASK			0x301400
37 #define HPRE_INT_STATUS			0x301800
38 #define HPRE_HAC_INT_MSK		0x301400
39 #define HPRE_HAC_RAS_CE_ENB		0x301410
40 #define HPRE_HAC_RAS_NFE_ENB		0x301414
41 #define HPRE_HAC_RAS_FE_ENB		0x301418
42 #define HPRE_HAC_INT_SET		0x301500
43 #define HPRE_RNG_TIMEOUT_NUM		0x301A34
44 #define HPRE_CORE_INT_ENABLE		0
45 #define HPRE_CORE_INT_DISABLE		GENMASK(21, 0)
46 #define HPRE_RDCHN_INI_ST		0x301a00
47 #define HPRE_CLSTR_BASE			0x302000
48 #define HPRE_CORE_EN_OFFSET		0x04
49 #define HPRE_CORE_INI_CFG_OFFSET	0x20
50 #define HPRE_CORE_INI_STATUS_OFFSET	0x80
51 #define HPRE_CORE_HTBT_WARN_OFFSET	0x8c
52 #define HPRE_CORE_IS_SCHD_OFFSET	0x90
53 
54 #define HPRE_RAS_CE_ENB			0x301410
55 #define HPRE_RAS_NFE_ENB		0x301414
56 #define HPRE_RAS_FE_ENB			0x301418
57 #define HPRE_OOO_SHUTDOWN_SEL		0x301a3c
58 #define HPRE_HAC_RAS_FE_ENABLE		0
59 
60 #define HPRE_CORE_ENB		(HPRE_CLSTR_BASE + HPRE_CORE_EN_OFFSET)
61 #define HPRE_CORE_INI_CFG	(HPRE_CLSTR_BASE + HPRE_CORE_INI_CFG_OFFSET)
62 #define HPRE_CORE_INI_STATUS (HPRE_CLSTR_BASE + HPRE_CORE_INI_STATUS_OFFSET)
63 #define HPRE_HAC_ECC1_CNT		0x301a04
64 #define HPRE_HAC_ECC2_CNT		0x301a08
65 #define HPRE_HAC_SOURCE_INT		0x301600
66 #define HPRE_CLSTR_ADDR_INTRVL		0x1000
67 #define HPRE_CLUSTER_INQURY		0x100
68 #define HPRE_CLSTR_ADDR_INQRY_RSLT	0x104
69 #define HPRE_TIMEOUT_ABNML_BIT		6
70 #define HPRE_PASID_EN_BIT		9
71 #define HPRE_REG_RD_INTVRL_US		10
72 #define HPRE_REG_RD_TMOUT_US		1000
73 #define HPRE_DBGFS_VAL_MAX_LEN		20
74 #define PCI_DEVICE_ID_HUAWEI_HPRE_PF	0xa258
75 #define HPRE_QM_USR_CFG_MASK		GENMASK(31, 1)
76 #define HPRE_QM_AXI_CFG_MASK		GENMASK(15, 0)
77 #define HPRE_QM_VFG_AX_MASK		GENMASK(7, 0)
78 #define HPRE_BD_USR_MASK		GENMASK(1, 0)
79 #define HPRE_PREFETCH_CFG		0x301130
80 #define HPRE_SVA_PREFTCH_DFX		0x30115C
81 #define HPRE_PREFETCH_ENABLE		(~(BIT(0) | BIT(30)))
82 #define HPRE_PREFETCH_DISABLE		BIT(30)
83 #define HPRE_SVA_DISABLE_READY		(BIT(4) | BIT(8))
84 
85 /* clock gate */
86 #define HPRE_CLKGATE_CTL		0x301a10
87 #define HPRE_PEH_CFG_AUTO_GATE		0x301a2c
88 #define HPRE_CLUSTER_DYN_CTL		0x302010
89 #define HPRE_CORE_SHB_CFG		0x302088
90 #define HPRE_CLKGATE_CTL_EN		BIT(0)
91 #define HPRE_PEH_CFG_AUTO_GATE_EN	BIT(0)
92 #define HPRE_CLUSTER_DYN_CTL_EN		BIT(0)
93 #define HPRE_CORE_GATE_EN		(BIT(30) | BIT(31))
94 
95 #define HPRE_AM_OOO_SHUTDOWN_ENB	0x301044
96 #define HPRE_AM_OOO_SHUTDOWN_ENABLE	BIT(0)
97 #define HPRE_WR_MSI_PORT		BIT(2)
98 
99 #define HPRE_CORE_ECC_2BIT_ERR		BIT(1)
100 #define HPRE_OOO_ECC_2BIT_ERR		BIT(5)
101 
102 #define HPRE_QM_BME_FLR			BIT(7)
103 #define HPRE_QM_PM_FLR			BIT(11)
104 #define HPRE_QM_SRIOV_FLR		BIT(12)
105 
106 #define HPRE_SHAPER_TYPE_RATE		640
107 #define HPRE_VIA_MSI_DSM		1
108 #define HPRE_SQE_MASK_OFFSET		8
109 #define HPRE_SQE_MASK_LEN		44
110 #define HPRE_CTX_Q_NUM_DEF		1
111 
112 #define HPRE_DFX_BASE		0x301000
113 #define HPRE_DFX_COMMON1		0x301400
114 #define HPRE_DFX_COMMON2		0x301A00
115 #define HPRE_DFX_CORE		0x302000
116 #define HPRE_DFX_BASE_LEN		0x55
117 #define HPRE_DFX_COMMON1_LEN		0x41
118 #define HPRE_DFX_COMMON2_LEN		0xE
119 #define HPRE_DFX_CORE_LEN		0x43
120 
121 static const char hpre_name[] = "hisi_hpre";
122 static struct dentry *hpre_debugfs_root;
123 static const struct pci_device_id hpre_dev_ids[] = {
124 	{ PCI_DEVICE(PCI_VENDOR_ID_HUAWEI, PCI_DEVICE_ID_HUAWEI_HPRE_PF) },
125 	{ PCI_DEVICE(PCI_VENDOR_ID_HUAWEI, PCI_DEVICE_ID_HUAWEI_HPRE_VF) },
126 	{ 0, }
127 };
128 
129 MODULE_DEVICE_TABLE(pci, hpre_dev_ids);
130 
131 struct hpre_hw_error {
132 	u32 int_msk;
133 	const char *msg;
134 };
135 
136 static const struct qm_dev_alg hpre_dev_algs[] = {
137 	{
138 		.alg_msk = BIT(0),
139 		.alg = "rsa\n"
140 	}, {
141 		.alg_msk = BIT(1),
142 		.alg = "dh\n"
143 	}, {
144 		.alg_msk = BIT(2),
145 		.alg = "ecdh\n"
146 	}, {
147 		.alg_msk = BIT(3),
148 		.alg = "ecdsa\n"
149 	}, {
150 		.alg_msk = BIT(4),
151 		.alg = "sm2\n"
152 	}, {
153 		.alg_msk = BIT(5),
154 		.alg = "x25519\n"
155 	}, {
156 		.alg_msk = BIT(6),
157 		.alg = "x448\n"
158 	}, {
159 		/* sentinel */
160 	}
161 };
162 
163 static struct hisi_qm_list hpre_devices = {
164 	.register_to_crypto	= hpre_algs_register,
165 	.unregister_from_crypto	= hpre_algs_unregister,
166 };
167 
168 static const char * const hpre_debug_file_name[] = {
169 	[HPRE_CLEAR_ENABLE] = "rdclr_en",
170 	[HPRE_CLUSTER_CTRL] = "cluster_ctrl",
171 };
172 
173 enum hpre_cap_type {
174 	HPRE_QM_NFE_MASK_CAP,
175 	HPRE_QM_RESET_MASK_CAP,
176 	HPRE_QM_OOO_SHUTDOWN_MASK_CAP,
177 	HPRE_QM_CE_MASK_CAP,
178 	HPRE_NFE_MASK_CAP,
179 	HPRE_RESET_MASK_CAP,
180 	HPRE_OOO_SHUTDOWN_MASK_CAP,
181 	HPRE_CE_MASK_CAP,
182 	HPRE_CLUSTER_NUM_CAP,
183 	HPRE_CORE_TYPE_NUM_CAP,
184 	HPRE_CORE_NUM_CAP,
185 	HPRE_CLUSTER_CORE_NUM_CAP,
186 	HPRE_CORE_ENABLE_BITMAP_CAP,
187 	HPRE_DRV_ALG_BITMAP_CAP,
188 	HPRE_DEV_ALG_BITMAP_CAP,
189 	HPRE_CORE1_ALG_BITMAP_CAP,
190 	HPRE_CORE2_ALG_BITMAP_CAP,
191 	HPRE_CORE3_ALG_BITMAP_CAP,
192 	HPRE_CORE4_ALG_BITMAP_CAP,
193 	HPRE_CORE5_ALG_BITMAP_CAP,
194 	HPRE_CORE6_ALG_BITMAP_CAP,
195 	HPRE_CORE7_ALG_BITMAP_CAP,
196 	HPRE_CORE8_ALG_BITMAP_CAP,
197 	HPRE_CORE9_ALG_BITMAP_CAP,
198 	HPRE_CORE10_ALG_BITMAP_CAP
199 };
200 
201 static const struct hisi_qm_cap_info hpre_basic_info[] = {
202 	{HPRE_QM_NFE_MASK_CAP, 0x3124, 0, GENMASK(31, 0), 0x0, 0x1C37, 0x7C37},
203 	{HPRE_QM_RESET_MASK_CAP, 0x3128, 0, GENMASK(31, 0), 0x0, 0xC37, 0x6C37},
204 	{HPRE_QM_OOO_SHUTDOWN_MASK_CAP, 0x3128, 0, GENMASK(31, 0), 0x0, 0x4, 0x6C37},
205 	{HPRE_QM_CE_MASK_CAP, 0x312C, 0, GENMASK(31, 0), 0x0, 0x8, 0x8},
206 	{HPRE_NFE_MASK_CAP, 0x3130, 0, GENMASK(31, 0), 0x0, 0x3FFFFE, 0x1FFFFFE},
207 	{HPRE_RESET_MASK_CAP, 0x3134, 0, GENMASK(31, 0), 0x0, 0x3FFFFE, 0xBFFFFE},
208 	{HPRE_OOO_SHUTDOWN_MASK_CAP, 0x3134, 0, GENMASK(31, 0), 0x0, 0x22, 0xBFFFFE},
209 	{HPRE_CE_MASK_CAP, 0x3138, 0, GENMASK(31, 0), 0x0, 0x1, 0x1},
210 	{HPRE_CLUSTER_NUM_CAP, 0x313c, 20, GENMASK(3, 0), 0x0,  0x4, 0x1},
211 	{HPRE_CORE_TYPE_NUM_CAP, 0x313c, 16, GENMASK(3, 0), 0x0, 0x2, 0x2},
212 	{HPRE_CORE_NUM_CAP, 0x313c, 8, GENMASK(7, 0), 0x0, 0x8, 0xA},
213 	{HPRE_CLUSTER_CORE_NUM_CAP, 0x313c, 0, GENMASK(7, 0), 0x0, 0x2, 0xA},
214 	{HPRE_CORE_ENABLE_BITMAP_CAP, 0x3140, 0, GENMASK(31, 0), 0x0, 0xF, 0x3FF},
215 	{HPRE_DRV_ALG_BITMAP_CAP, 0x3144, 0, GENMASK(31, 0), 0x0, 0x03, 0x27},
216 	{HPRE_DEV_ALG_BITMAP_CAP, 0x3148, 0, GENMASK(31, 0), 0x0, 0x03, 0x7F},
217 	{HPRE_CORE1_ALG_BITMAP_CAP, 0x314c, 0, GENMASK(31, 0), 0x0, 0x7F, 0x7F},
218 	{HPRE_CORE2_ALG_BITMAP_CAP, 0x3150, 0, GENMASK(31, 0), 0x0, 0x7F, 0x7F},
219 	{HPRE_CORE3_ALG_BITMAP_CAP, 0x3154, 0, GENMASK(31, 0), 0x0, 0x7F, 0x7F},
220 	{HPRE_CORE4_ALG_BITMAP_CAP, 0x3158, 0, GENMASK(31, 0), 0x0, 0x7F, 0x7F},
221 	{HPRE_CORE5_ALG_BITMAP_CAP, 0x315c, 0, GENMASK(31, 0), 0x0, 0x7F, 0x7F},
222 	{HPRE_CORE6_ALG_BITMAP_CAP, 0x3160, 0, GENMASK(31, 0), 0x0, 0x7F, 0x7F},
223 	{HPRE_CORE7_ALG_BITMAP_CAP, 0x3164, 0, GENMASK(31, 0), 0x0, 0x7F, 0x7F},
224 	{HPRE_CORE8_ALG_BITMAP_CAP, 0x3168, 0, GENMASK(31, 0), 0x0, 0x7F, 0x7F},
225 	{HPRE_CORE9_ALG_BITMAP_CAP, 0x316c, 0, GENMASK(31, 0), 0x0, 0x10, 0x10},
226 	{HPRE_CORE10_ALG_BITMAP_CAP, 0x3170, 0, GENMASK(31, 0), 0x0, 0x10, 0x10}
227 };
228 
229 enum hpre_pre_store_cap_idx {
230 	HPRE_CLUSTER_NUM_CAP_IDX = 0x0,
231 	HPRE_CORE_ENABLE_BITMAP_CAP_IDX,
232 	HPRE_DRV_ALG_BITMAP_CAP_IDX,
233 	HPRE_DEV_ALG_BITMAP_CAP_IDX,
234 };
235 
236 static const u32 hpre_pre_store_caps[] = {
237 	HPRE_CLUSTER_NUM_CAP,
238 	HPRE_CORE_ENABLE_BITMAP_CAP,
239 	HPRE_DRV_ALG_BITMAP_CAP,
240 	HPRE_DEV_ALG_BITMAP_CAP,
241 };
242 
243 static const struct hpre_hw_error hpre_hw_errors[] = {
244 	{
245 		.int_msk = BIT(0),
246 		.msg = "core_ecc_1bit_err_int_set"
247 	}, {
248 		.int_msk = BIT(1),
249 		.msg = "core_ecc_2bit_err_int_set"
250 	}, {
251 		.int_msk = BIT(2),
252 		.msg = "dat_wb_poison_int_set"
253 	}, {
254 		.int_msk = BIT(3),
255 		.msg = "dat_rd_poison_int_set"
256 	}, {
257 		.int_msk = BIT(4),
258 		.msg = "bd_rd_poison_int_set"
259 	}, {
260 		.int_msk = BIT(5),
261 		.msg = "ooo_ecc_2bit_err_int_set"
262 	}, {
263 		.int_msk = BIT(6),
264 		.msg = "cluster1_shb_timeout_int_set"
265 	}, {
266 		.int_msk = BIT(7),
267 		.msg = "cluster2_shb_timeout_int_set"
268 	}, {
269 		.int_msk = BIT(8),
270 		.msg = "cluster3_shb_timeout_int_set"
271 	}, {
272 		.int_msk = BIT(9),
273 		.msg = "cluster4_shb_timeout_int_set"
274 	}, {
275 		.int_msk = GENMASK(15, 10),
276 		.msg = "ooo_rdrsp_err_int_set"
277 	}, {
278 		.int_msk = GENMASK(21, 16),
279 		.msg = "ooo_wrrsp_err_int_set"
280 	}, {
281 		.int_msk = BIT(22),
282 		.msg = "pt_rng_timeout_int_set"
283 	}, {
284 		.int_msk = BIT(23),
285 		.msg = "sva_fsm_timeout_int_set"
286 	}, {
287 		.int_msk = BIT(24),
288 		.msg = "sva_int_set"
289 	}, {
290 		/* sentinel */
291 	}
292 };
293 
294 static const u64 hpre_cluster_offsets[] = {
295 	[HPRE_CLUSTER0] =
296 		HPRE_CLSTR_BASE + HPRE_CLUSTER0 * HPRE_CLSTR_ADDR_INTRVL,
297 	[HPRE_CLUSTER1] =
298 		HPRE_CLSTR_BASE + HPRE_CLUSTER1 * HPRE_CLSTR_ADDR_INTRVL,
299 	[HPRE_CLUSTER2] =
300 		HPRE_CLSTR_BASE + HPRE_CLUSTER2 * HPRE_CLSTR_ADDR_INTRVL,
301 	[HPRE_CLUSTER3] =
302 		HPRE_CLSTR_BASE + HPRE_CLUSTER3 * HPRE_CLSTR_ADDR_INTRVL,
303 };
304 
305 static const struct debugfs_reg32 hpre_cluster_dfx_regs[] = {
306 	{"CORES_EN_STATUS     ",  HPRE_CORE_EN_OFFSET},
307 	{"CORES_INI_CFG       ",  HPRE_CORE_INI_CFG_OFFSET},
308 	{"CORES_INI_STATUS    ",  HPRE_CORE_INI_STATUS_OFFSET},
309 	{"CORES_HTBT_WARN     ",  HPRE_CORE_HTBT_WARN_OFFSET},
310 	{"CORES_IS_SCHD       ",  HPRE_CORE_IS_SCHD_OFFSET},
311 };
312 
313 static const struct debugfs_reg32 hpre_com_dfx_regs[] = {
314 	{"READ_CLR_EN     ",  HPRE_CTRL_CNT_CLR_CE},
315 	{"AXQOS           ",  HPRE_VFG_AXQOS},
316 	{"AWUSR_CFG       ",  HPRE_AWUSR_FP_CFG},
317 	{"BD_ENDIAN       ",  HPRE_BD_ENDIAN},
318 	{"ECC_CHECK_CTRL  ",  HPRE_ECC_BYPASS},
319 	{"RAS_INT_WIDTH   ",  HPRE_RAS_WIDTH_CFG},
320 	{"POISON_BYPASS   ",  HPRE_POISON_BYPASS},
321 	{"BD_ARUSER       ",  HPRE_BD_ARUSR_CFG},
322 	{"BD_AWUSER       ",  HPRE_BD_AWUSR_CFG},
323 	{"DATA_ARUSER     ",  HPRE_DATA_RUSER_CFG},
324 	{"DATA_AWUSER     ",  HPRE_DATA_WUSER_CFG},
325 	{"INT_STATUS      ",  HPRE_INT_STATUS},
326 	{"INT_MASK        ",  HPRE_HAC_INT_MSK},
327 	{"RAS_CE_ENB      ",  HPRE_HAC_RAS_CE_ENB},
328 	{"RAS_NFE_ENB     ",  HPRE_HAC_RAS_NFE_ENB},
329 	{"RAS_FE_ENB      ",  HPRE_HAC_RAS_FE_ENB},
330 	{"INT_SET         ",  HPRE_HAC_INT_SET},
331 	{"RNG_TIMEOUT_NUM ",  HPRE_RNG_TIMEOUT_NUM},
332 };
333 
334 static const char *hpre_dfx_files[HPRE_DFX_FILE_NUM] = {
335 	"send_cnt",
336 	"recv_cnt",
337 	"send_fail_cnt",
338 	"send_busy_cnt",
339 	"over_thrhld_cnt",
340 	"overtime_thrhld",
341 	"invalid_req_cnt"
342 };
343 
344 /* define the HPRE's dfx regs region and region length */
345 static struct dfx_diff_registers hpre_diff_regs[] = {
346 	{
347 		.reg_offset = HPRE_DFX_BASE,
348 		.reg_len = HPRE_DFX_BASE_LEN,
349 	}, {
350 		.reg_offset = HPRE_DFX_COMMON1,
351 		.reg_len = HPRE_DFX_COMMON1_LEN,
352 	}, {
353 		.reg_offset = HPRE_DFX_COMMON2,
354 		.reg_len = HPRE_DFX_COMMON2_LEN,
355 	}, {
356 		.reg_offset = HPRE_DFX_CORE,
357 		.reg_len = HPRE_DFX_CORE_LEN,
358 	},
359 };
360 
361 bool hpre_check_alg_support(struct hisi_qm *qm, u32 alg)
362 {
363 	u32 cap_val;
364 
365 	cap_val = qm->cap_tables.dev_cap_table[HPRE_DRV_ALG_BITMAP_CAP_IDX].cap_val;
366 	if (alg & cap_val)
367 		return true;
368 
369 	return false;
370 }
371 
372 static int hpre_diff_regs_show(struct seq_file *s, void *unused)
373 {
374 	struct hisi_qm *qm = s->private;
375 
376 	hisi_qm_acc_diff_regs_dump(qm, s, qm->debug.acc_diff_regs,
377 					ARRAY_SIZE(hpre_diff_regs));
378 
379 	return 0;
380 }
381 
382 DEFINE_SHOW_ATTRIBUTE(hpre_diff_regs);
383 
384 static int hpre_com_regs_show(struct seq_file *s, void *unused)
385 {
386 	hisi_qm_regs_dump(s, s->private);
387 
388 	return 0;
389 }
390 
391 DEFINE_SHOW_ATTRIBUTE(hpre_com_regs);
392 
393 static int hpre_cluster_regs_show(struct seq_file *s, void *unused)
394 {
395 	hisi_qm_regs_dump(s, s->private);
396 
397 	return 0;
398 }
399 
400 DEFINE_SHOW_ATTRIBUTE(hpre_cluster_regs);
401 
402 static const struct kernel_param_ops hpre_uacce_mode_ops = {
403 	.set = uacce_mode_set,
404 	.get = param_get_int,
405 };
406 
407 /*
408  * uacce_mode = 0 means hpre only register to crypto,
409  * uacce_mode = 1 means hpre both register to crypto and uacce.
410  */
411 static u32 uacce_mode = UACCE_MODE_NOUACCE;
412 module_param_cb(uacce_mode, &hpre_uacce_mode_ops, &uacce_mode, 0444);
413 MODULE_PARM_DESC(uacce_mode, UACCE_MODE_DESC);
414 
415 static bool pf_q_num_flag;
416 static int pf_q_num_set(const char *val, const struct kernel_param *kp)
417 {
418 	pf_q_num_flag = true;
419 
420 	return q_num_set(val, kp, PCI_DEVICE_ID_HUAWEI_HPRE_PF);
421 }
422 
423 static const struct kernel_param_ops hpre_pf_q_num_ops = {
424 	.set = pf_q_num_set,
425 	.get = param_get_int,
426 };
427 
428 static u32 pf_q_num = HPRE_PF_DEF_Q_NUM;
429 module_param_cb(pf_q_num, &hpre_pf_q_num_ops, &pf_q_num, 0444);
430 MODULE_PARM_DESC(pf_q_num, "Number of queues in PF of CS(2-1024)");
431 
432 static const struct kernel_param_ops vfs_num_ops = {
433 	.set = vfs_num_set,
434 	.get = param_get_int,
435 };
436 
437 static u32 vfs_num;
438 module_param_cb(vfs_num, &vfs_num_ops, &vfs_num, 0444);
439 MODULE_PARM_DESC(vfs_num, "Number of VFs to enable(1-63), 0(default)");
440 
441 struct hisi_qp *hpre_create_qp(u8 type)
442 {
443 	int node = cpu_to_node(raw_smp_processor_id());
444 	struct hisi_qp *qp = NULL;
445 	int ret;
446 
447 	if (type != HPRE_V2_ALG_TYPE && type != HPRE_V3_ECC_ALG_TYPE)
448 		return NULL;
449 
450 	/*
451 	 * type: 0 - RSA/DH. algorithm supported in V2,
452 	 *       1 - ECC algorithm in V3.
453 	 */
454 	ret = hisi_qm_alloc_qps_node(&hpre_devices, 1, type, node, &qp);
455 	if (!ret)
456 		return qp;
457 
458 	return NULL;
459 }
460 
461 static void hpre_config_pasid(struct hisi_qm *qm)
462 {
463 	u32 val1, val2;
464 
465 	if (qm->ver >= QM_HW_V3)
466 		return;
467 
468 	val1 = readl_relaxed(qm->io_base + HPRE_DATA_RUSER_CFG);
469 	val2 = readl_relaxed(qm->io_base + HPRE_DATA_WUSER_CFG);
470 	if (qm->use_sva) {
471 		val1 |= BIT(HPRE_PASID_EN_BIT);
472 		val2 |= BIT(HPRE_PASID_EN_BIT);
473 	} else {
474 		val1 &= ~BIT(HPRE_PASID_EN_BIT);
475 		val2 &= ~BIT(HPRE_PASID_EN_BIT);
476 	}
477 	writel_relaxed(val1, qm->io_base + HPRE_DATA_RUSER_CFG);
478 	writel_relaxed(val2, qm->io_base + HPRE_DATA_WUSER_CFG);
479 }
480 
481 static int hpre_cfg_by_dsm(struct hisi_qm *qm)
482 {
483 	struct device *dev = &qm->pdev->dev;
484 	union acpi_object *obj;
485 	guid_t guid;
486 
487 	if (guid_parse("b06b81ab-0134-4a45-9b0c-483447b95fa7", &guid)) {
488 		dev_err(dev, "Hpre GUID failed\n");
489 		return -EINVAL;
490 	}
491 
492 	/* Switch over to MSI handling due to non-standard PCI implementation */
493 	obj = acpi_evaluate_dsm(ACPI_HANDLE(dev), &guid,
494 				0, HPRE_VIA_MSI_DSM, NULL);
495 	if (!obj) {
496 		dev_err(dev, "ACPI handle failed!\n");
497 		return -EIO;
498 	}
499 
500 	ACPI_FREE(obj);
501 
502 	return 0;
503 }
504 
505 static int hpre_set_cluster(struct hisi_qm *qm)
506 {
507 	struct device *dev = &qm->pdev->dev;
508 	unsigned long offset;
509 	u32 cluster_core_mask;
510 	u8 clusters_num;
511 	u32 val = 0;
512 	int ret, i;
513 
514 	cluster_core_mask = qm->cap_tables.dev_cap_table[HPRE_CORE_ENABLE_BITMAP_CAP_IDX].cap_val;
515 	clusters_num = qm->cap_tables.dev_cap_table[HPRE_CLUSTER_NUM_CAP_IDX].cap_val;
516 	for (i = 0; i < clusters_num; i++) {
517 		offset = i * HPRE_CLSTR_ADDR_INTRVL;
518 
519 		/* clusters initiating */
520 		writel(cluster_core_mask,
521 		       qm->io_base + offset + HPRE_CORE_ENB);
522 		writel(0x1, qm->io_base + offset + HPRE_CORE_INI_CFG);
523 		ret = readl_relaxed_poll_timeout(qm->io_base + offset +
524 					HPRE_CORE_INI_STATUS, val,
525 					((val & cluster_core_mask) ==
526 					cluster_core_mask),
527 					HPRE_REG_RD_INTVRL_US,
528 					HPRE_REG_RD_TMOUT_US);
529 		if (ret) {
530 			dev_err(dev,
531 				"cluster %d int st status timeout!\n", i);
532 			return -ETIMEDOUT;
533 		}
534 	}
535 
536 	return 0;
537 }
538 
539 /*
540  * For Kunpeng 920, we should disable FLR triggered by hardware (BME/PM/SRIOV).
541  * Or it may stay in D3 state when we bind and unbind hpre quickly,
542  * as it does FLR triggered by hardware.
543  */
544 static void disable_flr_of_bme(struct hisi_qm *qm)
545 {
546 	u32 val;
547 
548 	val = readl(qm->io_base + QM_PEH_AXUSER_CFG);
549 	val &= ~(HPRE_QM_BME_FLR | HPRE_QM_SRIOV_FLR);
550 	val |= HPRE_QM_PM_FLR;
551 	writel(val, qm->io_base + QM_PEH_AXUSER_CFG);
552 	writel(PEH_AXUSER_CFG_ENABLE, qm->io_base + QM_PEH_AXUSER_CFG_ENABLE);
553 }
554 
555 static void hpre_open_sva_prefetch(struct hisi_qm *qm)
556 {
557 	u32 val;
558 	int ret;
559 
560 	if (!test_bit(QM_SUPPORT_SVA_PREFETCH, &qm->caps))
561 		return;
562 
563 	/* Enable prefetch */
564 	val = readl_relaxed(qm->io_base + HPRE_PREFETCH_CFG);
565 	val &= HPRE_PREFETCH_ENABLE;
566 	writel(val, qm->io_base + HPRE_PREFETCH_CFG);
567 
568 	ret = readl_relaxed_poll_timeout(qm->io_base + HPRE_PREFETCH_CFG,
569 					 val, !(val & HPRE_PREFETCH_DISABLE),
570 					 HPRE_REG_RD_INTVRL_US,
571 					 HPRE_REG_RD_TMOUT_US);
572 	if (ret)
573 		pci_err(qm->pdev, "failed to open sva prefetch\n");
574 }
575 
576 static void hpre_close_sva_prefetch(struct hisi_qm *qm)
577 {
578 	u32 val;
579 	int ret;
580 
581 	if (!test_bit(QM_SUPPORT_SVA_PREFETCH, &qm->caps))
582 		return;
583 
584 	val = readl_relaxed(qm->io_base + HPRE_PREFETCH_CFG);
585 	val |= HPRE_PREFETCH_DISABLE;
586 	writel(val, qm->io_base + HPRE_PREFETCH_CFG);
587 
588 	ret = readl_relaxed_poll_timeout(qm->io_base + HPRE_SVA_PREFTCH_DFX,
589 					 val, !(val & HPRE_SVA_DISABLE_READY),
590 					 HPRE_REG_RD_INTVRL_US,
591 					 HPRE_REG_RD_TMOUT_US);
592 	if (ret)
593 		pci_err(qm->pdev, "failed to close sva prefetch\n");
594 }
595 
596 static void hpre_enable_clock_gate(struct hisi_qm *qm)
597 {
598 	u32 val;
599 
600 	if (qm->ver < QM_HW_V3)
601 		return;
602 
603 	val = readl(qm->io_base + HPRE_CLKGATE_CTL);
604 	val |= HPRE_CLKGATE_CTL_EN;
605 	writel(val, qm->io_base + HPRE_CLKGATE_CTL);
606 
607 	val = readl(qm->io_base + HPRE_PEH_CFG_AUTO_GATE);
608 	val |= HPRE_PEH_CFG_AUTO_GATE_EN;
609 	writel(val, qm->io_base + HPRE_PEH_CFG_AUTO_GATE);
610 
611 	val = readl(qm->io_base + HPRE_CLUSTER_DYN_CTL);
612 	val |= HPRE_CLUSTER_DYN_CTL_EN;
613 	writel(val, qm->io_base + HPRE_CLUSTER_DYN_CTL);
614 
615 	val = readl_relaxed(qm->io_base + HPRE_CORE_SHB_CFG);
616 	val |= HPRE_CORE_GATE_EN;
617 	writel(val, qm->io_base + HPRE_CORE_SHB_CFG);
618 }
619 
620 static void hpre_disable_clock_gate(struct hisi_qm *qm)
621 {
622 	u32 val;
623 
624 	if (qm->ver < QM_HW_V3)
625 		return;
626 
627 	val = readl(qm->io_base + HPRE_CLKGATE_CTL);
628 	val &= ~HPRE_CLKGATE_CTL_EN;
629 	writel(val, qm->io_base + HPRE_CLKGATE_CTL);
630 
631 	val = readl(qm->io_base + HPRE_PEH_CFG_AUTO_GATE);
632 	val &= ~HPRE_PEH_CFG_AUTO_GATE_EN;
633 	writel(val, qm->io_base + HPRE_PEH_CFG_AUTO_GATE);
634 
635 	val = readl(qm->io_base + HPRE_CLUSTER_DYN_CTL);
636 	val &= ~HPRE_CLUSTER_DYN_CTL_EN;
637 	writel(val, qm->io_base + HPRE_CLUSTER_DYN_CTL);
638 
639 	val = readl_relaxed(qm->io_base + HPRE_CORE_SHB_CFG);
640 	val &= ~HPRE_CORE_GATE_EN;
641 	writel(val, qm->io_base + HPRE_CORE_SHB_CFG);
642 }
643 
644 static int hpre_set_user_domain_and_cache(struct hisi_qm *qm)
645 {
646 	struct device *dev = &qm->pdev->dev;
647 	u32 val;
648 	int ret;
649 
650 	/* disabel dynamic clock gate before sram init */
651 	hpre_disable_clock_gate(qm);
652 
653 	writel(HPRE_QM_USR_CFG_MASK, qm->io_base + QM_ARUSER_M_CFG_ENABLE);
654 	writel(HPRE_QM_USR_CFG_MASK, qm->io_base + QM_AWUSER_M_CFG_ENABLE);
655 	writel_relaxed(HPRE_QM_AXI_CFG_MASK, qm->io_base + QM_AXI_M_CFG);
656 
657 	/* HPRE need more time, we close this interrupt */
658 	val = readl_relaxed(qm->io_base + HPRE_QM_ABNML_INT_MASK);
659 	val |= BIT(HPRE_TIMEOUT_ABNML_BIT);
660 	writel_relaxed(val, qm->io_base + HPRE_QM_ABNML_INT_MASK);
661 
662 	if (qm->ver >= QM_HW_V3)
663 		writel(HPRE_RSA_ENB | HPRE_ECC_ENB,
664 			qm->io_base + HPRE_TYPES_ENB);
665 	else
666 		writel(HPRE_RSA_ENB, qm->io_base + HPRE_TYPES_ENB);
667 
668 	writel(HPRE_QM_VFG_AX_MASK, qm->io_base + HPRE_VFG_AXCACHE);
669 	writel(0x0, qm->io_base + HPRE_BD_ENDIAN);
670 	writel(0x0, qm->io_base + HPRE_INT_MASK);
671 	writel(0x0, qm->io_base + HPRE_POISON_BYPASS);
672 	writel(0x0, qm->io_base + HPRE_COMM_CNT_CLR_CE);
673 	writel(0x0, qm->io_base + HPRE_ECC_BYPASS);
674 
675 	writel(HPRE_BD_USR_MASK, qm->io_base + HPRE_BD_ARUSR_CFG);
676 	writel(HPRE_BD_USR_MASK, qm->io_base + HPRE_BD_AWUSR_CFG);
677 	writel(0x1, qm->io_base + HPRE_RDCHN_INI_CFG);
678 	ret = readl_relaxed_poll_timeout(qm->io_base + HPRE_RDCHN_INI_ST, val,
679 			val & BIT(0),
680 			HPRE_REG_RD_INTVRL_US,
681 			HPRE_REG_RD_TMOUT_US);
682 	if (ret) {
683 		dev_err(dev, "read rd channel timeout fail!\n");
684 		return -ETIMEDOUT;
685 	}
686 
687 	ret = hpre_set_cluster(qm);
688 	if (ret)
689 		return -ETIMEDOUT;
690 
691 	/* This setting is only needed by Kunpeng 920. */
692 	if (qm->ver == QM_HW_V2) {
693 		ret = hpre_cfg_by_dsm(qm);
694 		if (ret)
695 			return ret;
696 
697 		disable_flr_of_bme(qm);
698 	}
699 
700 	/* Config data buffer pasid needed by Kunpeng 920 */
701 	hpre_config_pasid(qm);
702 
703 	hpre_enable_clock_gate(qm);
704 
705 	return ret;
706 }
707 
708 static void hpre_cnt_regs_clear(struct hisi_qm *qm)
709 {
710 	unsigned long offset;
711 	u8 clusters_num;
712 	int i;
713 
714 	/* clear clusterX/cluster_ctrl */
715 	clusters_num = qm->cap_tables.dev_cap_table[HPRE_CLUSTER_NUM_CAP_IDX].cap_val;
716 	for (i = 0; i < clusters_num; i++) {
717 		offset = HPRE_CLSTR_BASE + i * HPRE_CLSTR_ADDR_INTRVL;
718 		writel(0x0, qm->io_base + offset + HPRE_CLUSTER_INQURY);
719 	}
720 
721 	/* clear rdclr_en */
722 	writel(0x0, qm->io_base + HPRE_CTRL_CNT_CLR_CE);
723 
724 	hisi_qm_debug_regs_clear(qm);
725 }
726 
727 static void hpre_master_ooo_ctrl(struct hisi_qm *qm, bool enable)
728 {
729 	u32 val1, val2;
730 
731 	val1 = readl(qm->io_base + HPRE_AM_OOO_SHUTDOWN_ENB);
732 	if (enable) {
733 		val1 |= HPRE_AM_OOO_SHUTDOWN_ENABLE;
734 		val2 = hisi_qm_get_hw_info(qm, hpre_basic_info,
735 					   HPRE_OOO_SHUTDOWN_MASK_CAP, qm->cap_ver);
736 	} else {
737 		val1 &= ~HPRE_AM_OOO_SHUTDOWN_ENABLE;
738 		val2 = 0x0;
739 	}
740 
741 	if (qm->ver > QM_HW_V2)
742 		writel(val2, qm->io_base + HPRE_OOO_SHUTDOWN_SEL);
743 
744 	writel(val1, qm->io_base + HPRE_AM_OOO_SHUTDOWN_ENB);
745 }
746 
747 static void hpre_hw_error_disable(struct hisi_qm *qm)
748 {
749 	u32 ce, nfe;
750 
751 	ce = hisi_qm_get_hw_info(qm, hpre_basic_info, HPRE_CE_MASK_CAP, qm->cap_ver);
752 	nfe = hisi_qm_get_hw_info(qm, hpre_basic_info, HPRE_NFE_MASK_CAP, qm->cap_ver);
753 
754 	/* disable hpre hw error interrupts */
755 	writel(ce | nfe | HPRE_HAC_RAS_FE_ENABLE, qm->io_base + HPRE_INT_MASK);
756 	/* disable HPRE block master OOO when nfe occurs on Kunpeng930 */
757 	hpre_master_ooo_ctrl(qm, false);
758 }
759 
760 static void hpre_hw_error_enable(struct hisi_qm *qm)
761 {
762 	u32 ce, nfe;
763 
764 	ce = hisi_qm_get_hw_info(qm, hpre_basic_info, HPRE_CE_MASK_CAP, qm->cap_ver);
765 	nfe = hisi_qm_get_hw_info(qm, hpre_basic_info, HPRE_NFE_MASK_CAP, qm->cap_ver);
766 
767 	/* clear HPRE hw error source if having */
768 	writel(ce | nfe | HPRE_HAC_RAS_FE_ENABLE, qm->io_base + HPRE_HAC_SOURCE_INT);
769 
770 	/* configure error type */
771 	writel(ce, qm->io_base + HPRE_RAS_CE_ENB);
772 	writel(nfe, qm->io_base + HPRE_RAS_NFE_ENB);
773 	writel(HPRE_HAC_RAS_FE_ENABLE, qm->io_base + HPRE_RAS_FE_ENB);
774 
775 	/* enable HPRE block master OOO when nfe occurs on Kunpeng930 */
776 	hpre_master_ooo_ctrl(qm, true);
777 
778 	/* enable hpre hw error interrupts */
779 	writel(HPRE_CORE_INT_ENABLE, qm->io_base + HPRE_INT_MASK);
780 }
781 
782 static inline struct hisi_qm *hpre_file_to_qm(struct hpre_debugfs_file *file)
783 {
784 	struct hpre *hpre = container_of(file->debug, struct hpre, debug);
785 
786 	return &hpre->qm;
787 }
788 
789 static u32 hpre_clear_enable_read(struct hpre_debugfs_file *file)
790 {
791 	struct hisi_qm *qm = hpre_file_to_qm(file);
792 
793 	return readl(qm->io_base + HPRE_CTRL_CNT_CLR_CE) &
794 	       HPRE_CTRL_CNT_CLR_CE_BIT;
795 }
796 
797 static int hpre_clear_enable_write(struct hpre_debugfs_file *file, u32 val)
798 {
799 	struct hisi_qm *qm = hpre_file_to_qm(file);
800 	u32 tmp;
801 
802 	if (val != 1 && val != 0)
803 		return -EINVAL;
804 
805 	tmp = (readl(qm->io_base + HPRE_CTRL_CNT_CLR_CE) &
806 	       ~HPRE_CTRL_CNT_CLR_CE_BIT) | val;
807 	writel(tmp, qm->io_base + HPRE_CTRL_CNT_CLR_CE);
808 
809 	return 0;
810 }
811 
812 static u32 hpre_cluster_inqry_read(struct hpre_debugfs_file *file)
813 {
814 	struct hisi_qm *qm = hpre_file_to_qm(file);
815 	int cluster_index = file->index - HPRE_CLUSTER_CTRL;
816 	unsigned long offset = HPRE_CLSTR_BASE +
817 			       cluster_index * HPRE_CLSTR_ADDR_INTRVL;
818 
819 	return readl(qm->io_base + offset + HPRE_CLSTR_ADDR_INQRY_RSLT);
820 }
821 
822 static void hpre_cluster_inqry_write(struct hpre_debugfs_file *file, u32 val)
823 {
824 	struct hisi_qm *qm = hpre_file_to_qm(file);
825 	int cluster_index = file->index - HPRE_CLUSTER_CTRL;
826 	unsigned long offset = HPRE_CLSTR_BASE + cluster_index *
827 			       HPRE_CLSTR_ADDR_INTRVL;
828 
829 	writel(val, qm->io_base + offset + HPRE_CLUSTER_INQURY);
830 }
831 
832 static ssize_t hpre_ctrl_debug_read(struct file *filp, char __user *buf,
833 				    size_t count, loff_t *pos)
834 {
835 	struct hpre_debugfs_file *file = filp->private_data;
836 	struct hisi_qm *qm = hpre_file_to_qm(file);
837 	char tbuf[HPRE_DBGFS_VAL_MAX_LEN];
838 	u32 val;
839 	int ret;
840 
841 	ret = hisi_qm_get_dfx_access(qm);
842 	if (ret)
843 		return ret;
844 
845 	spin_lock_irq(&file->lock);
846 	switch (file->type) {
847 	case HPRE_CLEAR_ENABLE:
848 		val = hpre_clear_enable_read(file);
849 		break;
850 	case HPRE_CLUSTER_CTRL:
851 		val = hpre_cluster_inqry_read(file);
852 		break;
853 	default:
854 		goto err_input;
855 	}
856 	spin_unlock_irq(&file->lock);
857 
858 	hisi_qm_put_dfx_access(qm);
859 	ret = snprintf(tbuf, HPRE_DBGFS_VAL_MAX_LEN, "%u\n", val);
860 	return simple_read_from_buffer(buf, count, pos, tbuf, ret);
861 
862 err_input:
863 	spin_unlock_irq(&file->lock);
864 	hisi_qm_put_dfx_access(qm);
865 	return -EINVAL;
866 }
867 
868 static ssize_t hpre_ctrl_debug_write(struct file *filp, const char __user *buf,
869 				     size_t count, loff_t *pos)
870 {
871 	struct hpre_debugfs_file *file = filp->private_data;
872 	struct hisi_qm *qm = hpre_file_to_qm(file);
873 	char tbuf[HPRE_DBGFS_VAL_MAX_LEN];
874 	unsigned long val;
875 	int len, ret;
876 
877 	if (*pos != 0)
878 		return 0;
879 
880 	if (count >= HPRE_DBGFS_VAL_MAX_LEN)
881 		return -ENOSPC;
882 
883 	len = simple_write_to_buffer(tbuf, HPRE_DBGFS_VAL_MAX_LEN - 1,
884 				     pos, buf, count);
885 	if (len < 0)
886 		return len;
887 
888 	tbuf[len] = '\0';
889 	if (kstrtoul(tbuf, 0, &val))
890 		return -EFAULT;
891 
892 	ret = hisi_qm_get_dfx_access(qm);
893 	if (ret)
894 		return ret;
895 
896 	spin_lock_irq(&file->lock);
897 	switch (file->type) {
898 	case HPRE_CLEAR_ENABLE:
899 		ret = hpre_clear_enable_write(file, val);
900 		if (ret)
901 			goto err_input;
902 		break;
903 	case HPRE_CLUSTER_CTRL:
904 		hpre_cluster_inqry_write(file, val);
905 		break;
906 	default:
907 		ret = -EINVAL;
908 		goto err_input;
909 	}
910 
911 	ret = count;
912 
913 err_input:
914 	spin_unlock_irq(&file->lock);
915 	hisi_qm_put_dfx_access(qm);
916 	return ret;
917 }
918 
919 static const struct file_operations hpre_ctrl_debug_fops = {
920 	.owner = THIS_MODULE,
921 	.open = simple_open,
922 	.read = hpre_ctrl_debug_read,
923 	.write = hpre_ctrl_debug_write,
924 };
925 
926 static int hpre_debugfs_atomic64_get(void *data, u64 *val)
927 {
928 	struct hpre_dfx *dfx_item = data;
929 
930 	*val = atomic64_read(&dfx_item->value);
931 
932 	return 0;
933 }
934 
935 static int hpre_debugfs_atomic64_set(void *data, u64 val)
936 {
937 	struct hpre_dfx *dfx_item = data;
938 	struct hpre_dfx *hpre_dfx = NULL;
939 
940 	if (dfx_item->type == HPRE_OVERTIME_THRHLD) {
941 		hpre_dfx = dfx_item - HPRE_OVERTIME_THRHLD;
942 		atomic64_set(&hpre_dfx[HPRE_OVER_THRHLD_CNT].value, 0);
943 	} else if (val) {
944 		return -EINVAL;
945 	}
946 
947 	atomic64_set(&dfx_item->value, val);
948 
949 	return 0;
950 }
951 
952 DEFINE_DEBUGFS_ATTRIBUTE(hpre_atomic64_ops, hpre_debugfs_atomic64_get,
953 			 hpre_debugfs_atomic64_set, "%llu\n");
954 
955 static int hpre_create_debugfs_file(struct hisi_qm *qm, struct dentry *dir,
956 				    enum hpre_ctrl_dbgfs_file type, int indx)
957 {
958 	struct hpre *hpre = container_of(qm, struct hpre, qm);
959 	struct hpre_debug *dbg = &hpre->debug;
960 	struct dentry *file_dir;
961 
962 	if (dir)
963 		file_dir = dir;
964 	else
965 		file_dir = qm->debug.debug_root;
966 
967 	if (type >= HPRE_DEBUG_FILE_NUM)
968 		return -EINVAL;
969 
970 	spin_lock_init(&dbg->files[indx].lock);
971 	dbg->files[indx].debug = dbg;
972 	dbg->files[indx].type = type;
973 	dbg->files[indx].index = indx;
974 	debugfs_create_file(hpre_debug_file_name[type], 0600, file_dir,
975 			    dbg->files + indx, &hpre_ctrl_debug_fops);
976 
977 	return 0;
978 }
979 
980 static int hpre_pf_comm_regs_debugfs_init(struct hisi_qm *qm)
981 {
982 	struct device *dev = &qm->pdev->dev;
983 	struct debugfs_regset32 *regset;
984 
985 	regset = devm_kzalloc(dev, sizeof(*regset), GFP_KERNEL);
986 	if (!regset)
987 		return -ENOMEM;
988 
989 	regset->regs = hpre_com_dfx_regs;
990 	regset->nregs = ARRAY_SIZE(hpre_com_dfx_regs);
991 	regset->base = qm->io_base;
992 	regset->dev = dev;
993 
994 	debugfs_create_file("regs", 0444, qm->debug.debug_root,
995 			    regset, &hpre_com_regs_fops);
996 
997 	return 0;
998 }
999 
1000 static int hpre_cluster_debugfs_init(struct hisi_qm *qm)
1001 {
1002 	struct device *dev = &qm->pdev->dev;
1003 	char buf[HPRE_DBGFS_VAL_MAX_LEN];
1004 	struct debugfs_regset32 *regset;
1005 	struct dentry *tmp_d;
1006 	u8 clusters_num;
1007 	int i, ret;
1008 
1009 	clusters_num = qm->cap_tables.dev_cap_table[HPRE_CLUSTER_NUM_CAP_IDX].cap_val;
1010 	for (i = 0; i < clusters_num; i++) {
1011 		ret = snprintf(buf, HPRE_DBGFS_VAL_MAX_LEN, "cluster%d", i);
1012 		if (ret >= HPRE_DBGFS_VAL_MAX_LEN)
1013 			return -EINVAL;
1014 		tmp_d = debugfs_create_dir(buf, qm->debug.debug_root);
1015 
1016 		regset = devm_kzalloc(dev, sizeof(*regset), GFP_KERNEL);
1017 		if (!regset)
1018 			return -ENOMEM;
1019 
1020 		regset->regs = hpre_cluster_dfx_regs;
1021 		regset->nregs = ARRAY_SIZE(hpre_cluster_dfx_regs);
1022 		regset->base = qm->io_base + hpre_cluster_offsets[i];
1023 		regset->dev = dev;
1024 
1025 		debugfs_create_file("regs", 0444, tmp_d, regset,
1026 				    &hpre_cluster_regs_fops);
1027 		ret = hpre_create_debugfs_file(qm, tmp_d, HPRE_CLUSTER_CTRL,
1028 					       i + HPRE_CLUSTER_CTRL);
1029 		if (ret)
1030 			return ret;
1031 	}
1032 
1033 	return 0;
1034 }
1035 
1036 static int hpre_ctrl_debug_init(struct hisi_qm *qm)
1037 {
1038 	int ret;
1039 
1040 	ret = hpre_create_debugfs_file(qm, NULL, HPRE_CLEAR_ENABLE,
1041 				       HPRE_CLEAR_ENABLE);
1042 	if (ret)
1043 		return ret;
1044 
1045 	ret = hpre_pf_comm_regs_debugfs_init(qm);
1046 	if (ret)
1047 		return ret;
1048 
1049 	return hpre_cluster_debugfs_init(qm);
1050 }
1051 
1052 static void hpre_dfx_debug_init(struct hisi_qm *qm)
1053 {
1054 	struct dfx_diff_registers *hpre_regs = qm->debug.acc_diff_regs;
1055 	struct hpre *hpre = container_of(qm, struct hpre, qm);
1056 	struct hpre_dfx *dfx = hpre->debug.dfx;
1057 	struct dentry *parent;
1058 	int i;
1059 
1060 	parent = debugfs_create_dir("hpre_dfx", qm->debug.debug_root);
1061 	for (i = 0; i < HPRE_DFX_FILE_NUM; i++) {
1062 		dfx[i].type = i;
1063 		debugfs_create_file(hpre_dfx_files[i], 0644, parent, &dfx[i],
1064 				    &hpre_atomic64_ops);
1065 	}
1066 
1067 	if (qm->fun_type == QM_HW_PF && hpre_regs)
1068 		debugfs_create_file("diff_regs", 0444, parent,
1069 				      qm, &hpre_diff_regs_fops);
1070 }
1071 
1072 static int hpre_debugfs_init(struct hisi_qm *qm)
1073 {
1074 	struct device *dev = &qm->pdev->dev;
1075 	int ret;
1076 
1077 	ret = hisi_qm_regs_debugfs_init(qm, hpre_diff_regs, ARRAY_SIZE(hpre_diff_regs));
1078 	if (ret) {
1079 		dev_warn(dev, "Failed to init HPRE diff regs!\n");
1080 		return ret;
1081 	}
1082 
1083 	qm->debug.debug_root = debugfs_create_dir(dev_name(dev),
1084 							hpre_debugfs_root);
1085 	qm->debug.sqe_mask_offset = HPRE_SQE_MASK_OFFSET;
1086 	qm->debug.sqe_mask_len = HPRE_SQE_MASK_LEN;
1087 
1088 	hisi_qm_debug_init(qm);
1089 
1090 	if (qm->pdev->device == PCI_DEVICE_ID_HUAWEI_HPRE_PF) {
1091 		ret = hpre_ctrl_debug_init(qm);
1092 		if (ret)
1093 			goto debugfs_remove;
1094 	}
1095 
1096 	hpre_dfx_debug_init(qm);
1097 
1098 	return 0;
1099 
1100 debugfs_remove:
1101 	debugfs_remove_recursive(qm->debug.debug_root);
1102 	hisi_qm_regs_debugfs_uninit(qm, ARRAY_SIZE(hpre_diff_regs));
1103 	return ret;
1104 }
1105 
1106 static void hpre_debugfs_exit(struct hisi_qm *qm)
1107 {
1108 	debugfs_remove_recursive(qm->debug.debug_root);
1109 
1110 	hisi_qm_regs_debugfs_uninit(qm, ARRAY_SIZE(hpre_diff_regs));
1111 }
1112 
1113 static int hpre_pre_store_cap_reg(struct hisi_qm *qm)
1114 {
1115 	struct hisi_qm_cap_record *hpre_cap;
1116 	struct device *dev = &qm->pdev->dev;
1117 	size_t i, size;
1118 
1119 	size = ARRAY_SIZE(hpre_pre_store_caps);
1120 	hpre_cap = devm_kzalloc(dev, sizeof(*hpre_cap) * size, GFP_KERNEL);
1121 	if (!hpre_cap)
1122 		return -ENOMEM;
1123 
1124 	for (i = 0; i < size; i++) {
1125 		hpre_cap[i].type = hpre_pre_store_caps[i];
1126 		hpre_cap[i].cap_val = hisi_qm_get_hw_info(qm, hpre_basic_info,
1127 				      hpre_pre_store_caps[i], qm->cap_ver);
1128 	}
1129 
1130 	if (hpre_cap[HPRE_CLUSTER_NUM_CAP_IDX].cap_val > HPRE_CLUSTERS_NUM_MAX) {
1131 		dev_err(dev, "Device cluster num %u is out of range for driver supports %d!\n",
1132 			hpre_cap[HPRE_CLUSTER_NUM_CAP_IDX].cap_val, HPRE_CLUSTERS_NUM_MAX);
1133 		return -EINVAL;
1134 	}
1135 
1136 	qm->cap_tables.dev_cap_table = hpre_cap;
1137 
1138 	return 0;
1139 }
1140 
1141 static int hpre_qm_init(struct hisi_qm *qm, struct pci_dev *pdev)
1142 {
1143 	u64 alg_msk;
1144 	int ret;
1145 
1146 	if (pdev->revision == QM_HW_V1) {
1147 		pci_warn(pdev, "HPRE version 1 is not supported!\n");
1148 		return -EINVAL;
1149 	}
1150 
1151 	qm->mode = uacce_mode;
1152 	qm->pdev = pdev;
1153 	qm->ver = pdev->revision;
1154 	qm->sqe_size = HPRE_SQE_SIZE;
1155 	qm->dev_name = hpre_name;
1156 
1157 	qm->fun_type = (pdev->device == PCI_DEVICE_ID_HUAWEI_HPRE_PF) ?
1158 			QM_HW_PF : QM_HW_VF;
1159 	if (qm->fun_type == QM_HW_PF) {
1160 		qm->qp_base = HPRE_PF_DEF_Q_BASE;
1161 		qm->qp_num = pf_q_num;
1162 		qm->debug.curr_qm_qp_num = pf_q_num;
1163 		qm->qm_list = &hpre_devices;
1164 		if (pf_q_num_flag)
1165 			set_bit(QM_MODULE_PARAM, &qm->misc_ctl);
1166 	}
1167 
1168 	ret = hisi_qm_init(qm);
1169 	if (ret) {
1170 		pci_err(pdev, "Failed to init hpre qm configures!\n");
1171 		return ret;
1172 	}
1173 
1174 	/* Fetch and save the value of capability registers */
1175 	ret = hpre_pre_store_cap_reg(qm);
1176 	if (ret) {
1177 		pci_err(pdev, "Failed to pre-store capability registers!\n");
1178 		hisi_qm_uninit(qm);
1179 		return ret;
1180 	}
1181 
1182 	alg_msk = qm->cap_tables.dev_cap_table[HPRE_DEV_ALG_BITMAP_CAP_IDX].cap_val;
1183 	ret = hisi_qm_set_algs(qm, alg_msk, hpre_dev_algs, ARRAY_SIZE(hpre_dev_algs));
1184 	if (ret) {
1185 		pci_err(pdev, "Failed to set hpre algs!\n");
1186 		hisi_qm_uninit(qm);
1187 	}
1188 
1189 	return ret;
1190 }
1191 
1192 static int hpre_show_last_regs_init(struct hisi_qm *qm)
1193 {
1194 	int cluster_dfx_regs_num =  ARRAY_SIZE(hpre_cluster_dfx_regs);
1195 	int com_dfx_regs_num = ARRAY_SIZE(hpre_com_dfx_regs);
1196 	struct qm_debug *debug = &qm->debug;
1197 	void __iomem *io_base;
1198 	u8 clusters_num;
1199 	int i, j, idx;
1200 
1201 	clusters_num = qm->cap_tables.dev_cap_table[HPRE_CLUSTER_NUM_CAP_IDX].cap_val;
1202 	debug->last_words = kcalloc(cluster_dfx_regs_num * clusters_num +
1203 			com_dfx_regs_num, sizeof(unsigned int), GFP_KERNEL);
1204 	if (!debug->last_words)
1205 		return -ENOMEM;
1206 
1207 	for (i = 0; i < com_dfx_regs_num; i++)
1208 		debug->last_words[i] = readl_relaxed(qm->io_base +
1209 						hpre_com_dfx_regs[i].offset);
1210 
1211 	for (i = 0; i < clusters_num; i++) {
1212 		io_base = qm->io_base + hpre_cluster_offsets[i];
1213 		for (j = 0; j < cluster_dfx_regs_num; j++) {
1214 			idx = com_dfx_regs_num + i * cluster_dfx_regs_num + j;
1215 			debug->last_words[idx] = readl_relaxed(
1216 				io_base + hpre_cluster_dfx_regs[j].offset);
1217 		}
1218 	}
1219 
1220 	return 0;
1221 }
1222 
1223 static void hpre_show_last_regs_uninit(struct hisi_qm *qm)
1224 {
1225 	struct qm_debug *debug = &qm->debug;
1226 
1227 	if (qm->fun_type == QM_HW_VF || !debug->last_words)
1228 		return;
1229 
1230 	kfree(debug->last_words);
1231 	debug->last_words = NULL;
1232 }
1233 
1234 static void hpre_show_last_dfx_regs(struct hisi_qm *qm)
1235 {
1236 	int cluster_dfx_regs_num =  ARRAY_SIZE(hpre_cluster_dfx_regs);
1237 	int com_dfx_regs_num = ARRAY_SIZE(hpre_com_dfx_regs);
1238 	struct qm_debug *debug = &qm->debug;
1239 	struct pci_dev *pdev = qm->pdev;
1240 	void __iomem *io_base;
1241 	u8 clusters_num;
1242 	int i, j, idx;
1243 	u32 val;
1244 
1245 	if (qm->fun_type == QM_HW_VF || !debug->last_words)
1246 		return;
1247 
1248 	/* dumps last word of the debugging registers during controller reset */
1249 	for (i = 0; i < com_dfx_regs_num; i++) {
1250 		val = readl_relaxed(qm->io_base + hpre_com_dfx_regs[i].offset);
1251 		if (debug->last_words[i] != val)
1252 			pci_info(pdev, "Common_core:%s \t= 0x%08x => 0x%08x\n",
1253 			  hpre_com_dfx_regs[i].name, debug->last_words[i], val);
1254 	}
1255 
1256 	clusters_num = qm->cap_tables.dev_cap_table[HPRE_CLUSTER_NUM_CAP_IDX].cap_val;
1257 	for (i = 0; i < clusters_num; i++) {
1258 		io_base = qm->io_base + hpre_cluster_offsets[i];
1259 		for (j = 0; j <  cluster_dfx_regs_num; j++) {
1260 			val = readl_relaxed(io_base +
1261 					     hpre_cluster_dfx_regs[j].offset);
1262 			idx = com_dfx_regs_num + i * cluster_dfx_regs_num + j;
1263 			if (debug->last_words[idx] != val)
1264 				pci_info(pdev, "cluster-%d:%s \t= 0x%08x => 0x%08x\n",
1265 				i, hpre_cluster_dfx_regs[j].name, debug->last_words[idx], val);
1266 		}
1267 	}
1268 }
1269 
1270 static void hpre_log_hw_error(struct hisi_qm *qm, u32 err_sts)
1271 {
1272 	const struct hpre_hw_error *err = hpre_hw_errors;
1273 	struct device *dev = &qm->pdev->dev;
1274 
1275 	while (err->msg) {
1276 		if (err->int_msk & err_sts)
1277 			dev_warn(dev, "%s [error status=0x%x] found\n",
1278 				 err->msg, err->int_msk);
1279 		err++;
1280 	}
1281 }
1282 
1283 static u32 hpre_get_hw_err_status(struct hisi_qm *qm)
1284 {
1285 	return readl(qm->io_base + HPRE_INT_STATUS);
1286 }
1287 
1288 static void hpre_clear_hw_err_status(struct hisi_qm *qm, u32 err_sts)
1289 {
1290 	u32 nfe;
1291 
1292 	writel(err_sts, qm->io_base + HPRE_HAC_SOURCE_INT);
1293 	nfe = hisi_qm_get_hw_info(qm, hpre_basic_info, HPRE_NFE_MASK_CAP, qm->cap_ver);
1294 	writel(nfe, qm->io_base + HPRE_RAS_NFE_ENB);
1295 }
1296 
1297 static void hpre_open_axi_master_ooo(struct hisi_qm *qm)
1298 {
1299 	u32 value;
1300 
1301 	value = readl(qm->io_base + HPRE_AM_OOO_SHUTDOWN_ENB);
1302 	writel(value & ~HPRE_AM_OOO_SHUTDOWN_ENABLE,
1303 	       qm->io_base + HPRE_AM_OOO_SHUTDOWN_ENB);
1304 	writel(value | HPRE_AM_OOO_SHUTDOWN_ENABLE,
1305 	       qm->io_base + HPRE_AM_OOO_SHUTDOWN_ENB);
1306 }
1307 
1308 static void hpre_err_info_init(struct hisi_qm *qm)
1309 {
1310 	struct hisi_qm_err_info *err_info = &qm->err_info;
1311 
1312 	err_info->fe = HPRE_HAC_RAS_FE_ENABLE;
1313 	err_info->ce = hisi_qm_get_hw_info(qm, hpre_basic_info, HPRE_QM_CE_MASK_CAP, qm->cap_ver);
1314 	err_info->nfe = hisi_qm_get_hw_info(qm, hpre_basic_info, HPRE_QM_NFE_MASK_CAP, qm->cap_ver);
1315 	err_info->ecc_2bits_mask = HPRE_CORE_ECC_2BIT_ERR | HPRE_OOO_ECC_2BIT_ERR;
1316 	err_info->dev_shutdown_mask = hisi_qm_get_hw_info(qm, hpre_basic_info,
1317 			HPRE_OOO_SHUTDOWN_MASK_CAP, qm->cap_ver);
1318 	err_info->qm_shutdown_mask = hisi_qm_get_hw_info(qm, hpre_basic_info,
1319 			HPRE_QM_OOO_SHUTDOWN_MASK_CAP, qm->cap_ver);
1320 	err_info->qm_reset_mask = hisi_qm_get_hw_info(qm, hpre_basic_info,
1321 			HPRE_QM_RESET_MASK_CAP, qm->cap_ver);
1322 	err_info->dev_reset_mask = hisi_qm_get_hw_info(qm, hpre_basic_info,
1323 			HPRE_RESET_MASK_CAP, qm->cap_ver);
1324 	err_info->msi_wr_port = HPRE_WR_MSI_PORT;
1325 	err_info->acpi_rst = "HRST";
1326 }
1327 
1328 static const struct hisi_qm_err_ini hpre_err_ini = {
1329 	.hw_init		= hpre_set_user_domain_and_cache,
1330 	.hw_err_enable		= hpre_hw_error_enable,
1331 	.hw_err_disable		= hpre_hw_error_disable,
1332 	.get_dev_hw_err_status	= hpre_get_hw_err_status,
1333 	.clear_dev_hw_err_status = hpre_clear_hw_err_status,
1334 	.log_dev_hw_err		= hpre_log_hw_error,
1335 	.open_axi_master_ooo	= hpre_open_axi_master_ooo,
1336 	.open_sva_prefetch	= hpre_open_sva_prefetch,
1337 	.close_sva_prefetch	= hpre_close_sva_prefetch,
1338 	.show_last_dfx_regs	= hpre_show_last_dfx_regs,
1339 	.err_info_init		= hpre_err_info_init,
1340 };
1341 
1342 static int hpre_pf_probe_init(struct hpre *hpre)
1343 {
1344 	struct hisi_qm *qm = &hpre->qm;
1345 	int ret;
1346 
1347 	ret = hpre_set_user_domain_and_cache(qm);
1348 	if (ret)
1349 		return ret;
1350 
1351 	hpre_open_sva_prefetch(qm);
1352 
1353 	qm->err_ini = &hpre_err_ini;
1354 	qm->err_ini->err_info_init(qm);
1355 	hisi_qm_dev_err_init(qm);
1356 	ret = hpre_show_last_regs_init(qm);
1357 	if (ret)
1358 		pci_err(qm->pdev, "Failed to init last word regs!\n");
1359 
1360 	return ret;
1361 }
1362 
1363 static int hpre_probe_init(struct hpre *hpre)
1364 {
1365 	u32 type_rate = HPRE_SHAPER_TYPE_RATE;
1366 	struct hisi_qm *qm = &hpre->qm;
1367 	int ret;
1368 
1369 	if (qm->fun_type == QM_HW_PF) {
1370 		ret = hpre_pf_probe_init(hpre);
1371 		if (ret)
1372 			return ret;
1373 		/* Enable shaper type 0 */
1374 		if (qm->ver >= QM_HW_V3) {
1375 			type_rate |= QM_SHAPER_ENABLE;
1376 			qm->type_rate = type_rate;
1377 		}
1378 	}
1379 
1380 	return 0;
1381 }
1382 
1383 static int hpre_probe(struct pci_dev *pdev, const struct pci_device_id *id)
1384 {
1385 	struct hisi_qm *qm;
1386 	struct hpre *hpre;
1387 	int ret;
1388 
1389 	hpre = devm_kzalloc(&pdev->dev, sizeof(*hpre), GFP_KERNEL);
1390 	if (!hpre)
1391 		return -ENOMEM;
1392 
1393 	qm = &hpre->qm;
1394 	ret = hpre_qm_init(qm, pdev);
1395 	if (ret) {
1396 		pci_err(pdev, "Failed to init HPRE QM (%d)!\n", ret);
1397 		return ret;
1398 	}
1399 
1400 	ret = hpre_probe_init(hpre);
1401 	if (ret) {
1402 		pci_err(pdev, "Failed to probe (%d)!\n", ret);
1403 		goto err_with_qm_init;
1404 	}
1405 
1406 	ret = hisi_qm_start(qm);
1407 	if (ret)
1408 		goto err_with_err_init;
1409 
1410 	ret = hpre_debugfs_init(qm);
1411 	if (ret)
1412 		dev_warn(&pdev->dev, "init debugfs fail!\n");
1413 
1414 	hisi_qm_add_list(qm, &hpre_devices);
1415 	ret = hisi_qm_alg_register(qm, &hpre_devices, HPRE_CTX_Q_NUM_DEF);
1416 	if (ret < 0) {
1417 		pci_err(pdev, "fail to register algs to crypto!\n");
1418 		goto err_qm_del_list;
1419 	}
1420 
1421 	if (qm->uacce) {
1422 		ret = uacce_register(qm->uacce);
1423 		if (ret) {
1424 			pci_err(pdev, "failed to register uacce (%d)!\n", ret);
1425 			goto err_with_alg_register;
1426 		}
1427 	}
1428 
1429 	if (qm->fun_type == QM_HW_PF && vfs_num) {
1430 		ret = hisi_qm_sriov_enable(pdev, vfs_num);
1431 		if (ret < 0)
1432 			goto err_with_alg_register;
1433 	}
1434 
1435 	hisi_qm_pm_init(qm);
1436 
1437 	return 0;
1438 
1439 err_with_alg_register:
1440 	hisi_qm_alg_unregister(qm, &hpre_devices, HPRE_CTX_Q_NUM_DEF);
1441 
1442 err_qm_del_list:
1443 	hisi_qm_del_list(qm, &hpre_devices);
1444 	hpre_debugfs_exit(qm);
1445 	hisi_qm_stop(qm, QM_NORMAL);
1446 
1447 err_with_err_init:
1448 	hpre_show_last_regs_uninit(qm);
1449 	hisi_qm_dev_err_uninit(qm);
1450 
1451 err_with_qm_init:
1452 	hisi_qm_uninit(qm);
1453 
1454 	return ret;
1455 }
1456 
1457 static void hpre_remove(struct pci_dev *pdev)
1458 {
1459 	struct hisi_qm *qm = pci_get_drvdata(pdev);
1460 
1461 	hisi_qm_pm_uninit(qm);
1462 	hisi_qm_wait_task_finish(qm, &hpre_devices);
1463 	hisi_qm_alg_unregister(qm, &hpre_devices, HPRE_CTX_Q_NUM_DEF);
1464 	hisi_qm_del_list(qm, &hpre_devices);
1465 	if (qm->fun_type == QM_HW_PF && qm->vfs_num)
1466 		hisi_qm_sriov_disable(pdev, true);
1467 
1468 	hpre_debugfs_exit(qm);
1469 	hisi_qm_stop(qm, QM_NORMAL);
1470 
1471 	if (qm->fun_type == QM_HW_PF) {
1472 		hpre_cnt_regs_clear(qm);
1473 		qm->debug.curr_qm_qp_num = 0;
1474 		hpre_show_last_regs_uninit(qm);
1475 		hisi_qm_dev_err_uninit(qm);
1476 	}
1477 
1478 	hisi_qm_uninit(qm);
1479 }
1480 
1481 static const struct dev_pm_ops hpre_pm_ops = {
1482 	SET_RUNTIME_PM_OPS(hisi_qm_suspend, hisi_qm_resume, NULL)
1483 };
1484 
1485 static const struct pci_error_handlers hpre_err_handler = {
1486 	.error_detected		= hisi_qm_dev_err_detected,
1487 	.slot_reset		= hisi_qm_dev_slot_reset,
1488 	.reset_prepare		= hisi_qm_reset_prepare,
1489 	.reset_done		= hisi_qm_reset_done,
1490 };
1491 
1492 static struct pci_driver hpre_pci_driver = {
1493 	.name			= hpre_name,
1494 	.id_table		= hpre_dev_ids,
1495 	.probe			= hpre_probe,
1496 	.remove			= hpre_remove,
1497 	.sriov_configure	= IS_ENABLED(CONFIG_PCI_IOV) ?
1498 				  hisi_qm_sriov_configure : NULL,
1499 	.err_handler		= &hpre_err_handler,
1500 	.shutdown		= hisi_qm_dev_shutdown,
1501 	.driver.pm		= &hpre_pm_ops,
1502 };
1503 
1504 struct pci_driver *hisi_hpre_get_pf_driver(void)
1505 {
1506 	return &hpre_pci_driver;
1507 }
1508 EXPORT_SYMBOL_GPL(hisi_hpre_get_pf_driver);
1509 
1510 static void hpre_register_debugfs(void)
1511 {
1512 	if (!debugfs_initialized())
1513 		return;
1514 
1515 	hpre_debugfs_root = debugfs_create_dir(hpre_name, NULL);
1516 }
1517 
1518 static void hpre_unregister_debugfs(void)
1519 {
1520 	debugfs_remove_recursive(hpre_debugfs_root);
1521 }
1522 
1523 static int __init hpre_init(void)
1524 {
1525 	int ret;
1526 
1527 	hisi_qm_init_list(&hpre_devices);
1528 	hpre_register_debugfs();
1529 
1530 	ret = pci_register_driver(&hpre_pci_driver);
1531 	if (ret) {
1532 		hpre_unregister_debugfs();
1533 		pr_err("hpre: can't register hisi hpre driver.\n");
1534 	}
1535 
1536 	return ret;
1537 }
1538 
1539 static void __exit hpre_exit(void)
1540 {
1541 	pci_unregister_driver(&hpre_pci_driver);
1542 	hpre_unregister_debugfs();
1543 }
1544 
1545 module_init(hpre_init);
1546 module_exit(hpre_exit);
1547 
1548 MODULE_LICENSE("GPL v2");
1549 MODULE_AUTHOR("Zaibo Xu <xuzaibo@huawei.com>");
1550 MODULE_AUTHOR("Meng Yu <yumeng18@huawei.com>");
1551 MODULE_DESCRIPTION("Driver for HiSilicon HPRE accelerator");
1552