xref: /linux/drivers/crypto/cavium/nitrox/nitrox_reqmgr.c (revision 0ddd7eaffa644baa78e247bbd220ab7195b1eed6)
1 // SPDX-License-Identifier: GPL-2.0
2 #include <linux/gfp.h>
3 #include <linux/workqueue.h>
4 #include <crypto/internal/skcipher.h>
5 
6 #include "nitrox_common.h"
7 #include "nitrox_dev.h"
8 #include "nitrox_req.h"
9 #include "nitrox_csr.h"
10 
11 /* SLC_STORE_INFO */
12 #define MIN_UDD_LEN 16
13 /* PKT_IN_HDR + SLC_STORE_INFO */
14 #define FDATA_SIZE 32
15 /* Base destination port for the solicited requests */
16 #define SOLICIT_BASE_DPORT 256
17 
18 #define REQ_NOT_POSTED 1
19 #define REQ_BACKLOG    2
20 #define REQ_POSTED     3
21 
22 /**
23  * Response codes from SE microcode
24  * 0x00 - Success
25  *   Completion with no error
26  * 0x43 - ERR_GC_DATA_LEN_INVALID
27  *   Invalid Data length if Encryption Data length is
28  *   less than 16 bytes for AES-XTS and AES-CTS.
29  * 0x45 - ERR_GC_CTX_LEN_INVALID
30  *   Invalid context length: CTXL != 23 words.
31  * 0x4F - ERR_GC_DOCSIS_CIPHER_INVALID
32  *   DOCSIS support is enabled with other than
33  *   AES/DES-CBC mode encryption.
34  * 0x50 - ERR_GC_DOCSIS_OFFSET_INVALID
35  *   Authentication offset is other than 0 with
36  *   Encryption IV source = 0.
37  *   Authentication offset is other than 8 (DES)/16 (AES)
38  *   with Encryption IV source = 1
39  * 0x51 - ERR_GC_CRC32_INVALID_SELECTION
40  *   CRC32 is enabled for other than DOCSIS encryption.
41  * 0x52 - ERR_GC_AES_CCM_FLAG_INVALID
42  *   Invalid flag options in AES-CCM IV.
43  */
44 
/*
 * Advance a ring index by @count slots with a single wrap at @max.
 *
 * Only one subtraction of @max is applied, so the result lies in
 * [0, max) only when index + count < 2 * max.
 */
static inline int incr_index(int index, int count, int max)
{
	int next = index + count;

	return (next < max) ? next : next - max;
}
54 
55 static void softreq_unmap_sgbufs(struct nitrox_softreq *sr)
56 {
57 	struct nitrox_device *ndev = sr->ndev;
58 	struct device *dev = DEV(ndev);
59 
60 
61 	dma_unmap_sg(dev, sr->in.sg, sg_nents(sr->in.sg),
62 		     DMA_BIDIRECTIONAL);
63 	dma_unmap_single(dev, sr->in.sgcomp_dma, sr->in.sgcomp_len,
64 			 DMA_TO_DEVICE);
65 	kfree(sr->in.sgcomp);
66 	sr->in.sg = NULL;
67 	sr->in.sgmap_cnt = 0;
68 
69 	dma_unmap_sg(dev, sr->out.sg, sg_nents(sr->out.sg),
70 		     DMA_BIDIRECTIONAL);
71 	dma_unmap_single(dev, sr->out.sgcomp_dma, sr->out.sgcomp_len,
72 			 DMA_TO_DEVICE);
73 	kfree(sr->out.sgcomp);
74 	sr->out.sg = NULL;
75 	sr->out.sgmap_cnt = 0;
76 }
77 
/*
 * Tear down a soft request: release its DMA mappings through
 * softreq_unmap_sgbufs(), then free the request structure itself.
 * @sr must not be used after this returns.
 */
static void softreq_destroy(struct nitrox_softreq *sr)
{
	softreq_unmap_sgbufs(sr);
	kfree(sr);
}
83 
84 /**
85  * create_sg_component - create SG componets for N5 device.
86  * @sr: Request structure
87  * @sgtbl: SG table
88  * @map_nents: number of dma mapped entries
89  *
90  * Component structure
91  *
92  *   63     48 47     32 31    16 15      0
93  *   --------------------------------------
94  *   |   LEN0  |  LEN1  |  LEN2  |  LEN3  |
95  *   |-------------------------------------
96  *   |               PTR0                 |
97  *   --------------------------------------
98  *   |               PTR1                 |
99  *   --------------------------------------
100  *   |               PTR2                 |
101  *   --------------------------------------
102  *   |               PTR3                 |
103  *   --------------------------------------
104  *
105  *   Returns 0 if success or a negative errno code on error.
106  */
107 static int create_sg_component(struct nitrox_softreq *sr,
108 			       struct nitrox_sgtable *sgtbl, int map_nents)
109 {
110 	struct nitrox_device *ndev = sr->ndev;
111 	struct nitrox_sgcomp *sgcomp;
112 	struct scatterlist *sg;
113 	dma_addr_t dma;
114 	size_t sz_comp;
115 	int i, j, nr_sgcomp;
116 
117 	nr_sgcomp = roundup(map_nents, 4) / 4;
118 
119 	/* each component holds 4 dma pointers */
120 	sz_comp = nr_sgcomp * sizeof(*sgcomp);
121 	sgcomp = kzalloc(sz_comp, sr->gfp);
122 	if (!sgcomp)
123 		return -ENOMEM;
124 
125 	sgtbl->sgcomp = sgcomp;
126 
127 	sg = sgtbl->sg;
128 	/* populate device sg component */
129 	for (i = 0; i < nr_sgcomp; i++) {
130 		for (j = 0; j < 4 && sg; j++) {
131 			sgcomp[i].len[j] = cpu_to_be16(sg_dma_len(sg));
132 			sgcomp[i].dma[j] = cpu_to_be64(sg_dma_address(sg));
133 			sg = sg_next(sg);
134 		}
135 	}
136 	/* map the device sg component */
137 	dma = dma_map_single(DEV(ndev), sgtbl->sgcomp, sz_comp, DMA_TO_DEVICE);
138 	if (dma_mapping_error(DEV(ndev), dma)) {
139 		kfree(sgtbl->sgcomp);
140 		sgtbl->sgcomp = NULL;
141 		return -ENOMEM;
142 	}
143 
144 	sgtbl->sgcomp_dma = dma;
145 	sgtbl->sgcomp_len = sz_comp;
146 
147 	return 0;
148 }
149 
150 /**
151  * dma_map_inbufs - DMA map input sglist and creates sglist component
152  *                  for N5 device.
153  * @sr: Request structure
154  * @req: Crypto request structre
155  *
156  * Returns 0 if successful or a negative errno code on error.
157  */
158 static int dma_map_inbufs(struct nitrox_softreq *sr,
159 			  struct se_crypto_request *req)
160 {
161 	struct device *dev = DEV(sr->ndev);
162 	struct scatterlist *sg = req->src;
163 	int i, nents, ret = 0;
164 
165 	nents = dma_map_sg(dev, req->src, sg_nents(req->src),
166 			   DMA_BIDIRECTIONAL);
167 	if (!nents)
168 		return -EINVAL;
169 
170 	for_each_sg(req->src, sg, nents, i)
171 		sr->in.total_bytes += sg_dma_len(sg);
172 
173 	sr->in.sg = req->src;
174 	sr->in.sgmap_cnt = nents;
175 	ret = create_sg_component(sr, &sr->in, sr->in.sgmap_cnt);
176 	if (ret)
177 		goto incomp_err;
178 
179 	return 0;
180 
181 incomp_err:
182 	dma_unmap_sg(dev, req->src, sg_nents(req->src), DMA_BIDIRECTIONAL);
183 	sr->in.sgmap_cnt = 0;
184 	return ret;
185 }
186 
187 static int dma_map_outbufs(struct nitrox_softreq *sr,
188 			   struct se_crypto_request *req)
189 {
190 	struct device *dev = DEV(sr->ndev);
191 	int nents, ret = 0;
192 
193 	nents = dma_map_sg(dev, req->dst, sg_nents(req->dst),
194 			   DMA_BIDIRECTIONAL);
195 	if (!nents)
196 		return -EINVAL;
197 
198 	sr->out.sg = req->dst;
199 	sr->out.sgmap_cnt = nents;
200 	ret = create_sg_component(sr, &sr->out, sr->out.sgmap_cnt);
201 	if (ret)
202 		goto outcomp_map_err;
203 
204 	return 0;
205 
206 outcomp_map_err:
207 	dma_unmap_sg(dev, req->dst, sg_nents(req->dst), DMA_BIDIRECTIONAL);
208 	sr->out.sgmap_cnt = 0;
209 	sr->out.sg = NULL;
210 	return ret;
211 }
212 
/*
 * Map both directions of a crypto request: input first, then output.
 * If the output mapping fails, softreq_unmap_sgbufs() is called to
 * release what was set up. Returns 0 or the first mapping error.
 */
static inline int softreq_map_iobuf(struct nitrox_softreq *sr,
				    struct se_crypto_request *creq)
{
	int err = dma_map_inbufs(sr, creq);

	if (!err) {
		err = dma_map_outbufs(sr, creq);
		if (err)
			softreq_unmap_sgbufs(sr);
	}

	return err;
}
228 
229 static inline void backlog_list_add(struct nitrox_softreq *sr,
230 				    struct nitrox_cmdq *cmdq)
231 {
232 	INIT_LIST_HEAD(&sr->backlog);
233 
234 	spin_lock_bh(&cmdq->backlog_qlock);
235 	list_add_tail(&sr->backlog, &cmdq->backlog_head);
236 	atomic_inc(&cmdq->backlog_count);
237 	atomic_set(&sr->status, REQ_BACKLOG);
238 	spin_unlock_bh(&cmdq->backlog_qlock);
239 }
240 
241 static inline void response_list_add(struct nitrox_softreq *sr,
242 				     struct nitrox_cmdq *cmdq)
243 {
244 	INIT_LIST_HEAD(&sr->response);
245 
246 	spin_lock_bh(&cmdq->resp_qlock);
247 	list_add_tail(&sr->response, &cmdq->response_head);
248 	spin_unlock_bh(&cmdq->resp_qlock);
249 }
250 
251 static inline void response_list_del(struct nitrox_softreq *sr,
252 				     struct nitrox_cmdq *cmdq)
253 {
254 	spin_lock_bh(&cmdq->resp_qlock);
255 	list_del(&sr->response);
256 	spin_unlock_bh(&cmdq->resp_qlock);
257 }
258 
259 static struct nitrox_softreq *
260 get_first_response_entry(struct nitrox_cmdq *cmdq)
261 {
262 	return list_first_entry_or_null(&cmdq->response_head,
263 					struct nitrox_softreq, response);
264 }
265 
266 static inline bool cmdq_full(struct nitrox_cmdq *cmdq, int qlen)
267 {
268 	if (atomic_inc_return(&cmdq->pending_count) > qlen) {
269 		atomic_dec(&cmdq->pending_count);
270 		/* sync with other cpus */
271 		smp_mb__after_atomic();
272 		return true;
273 	}
274 	/* sync with other cpus */
275 	smp_mb__after_atomic();
276 	return false;
277 }
278 
279 /**
280  * post_se_instr - Post SE instruction to Packet Input ring
281  * @sr: Request structure
282  *
283  * Returns 0 if successful or a negative error code,
284  * if no space in ring.
285  */
286 static void post_se_instr(struct nitrox_softreq *sr,
287 			  struct nitrox_cmdq *cmdq)
288 {
289 	struct nitrox_device *ndev = sr->ndev;
290 	int idx;
291 	u8 *ent;
292 
293 	spin_lock_bh(&cmdq->cmd_qlock);
294 
295 	idx = cmdq->write_idx;
296 	/* copy the instruction */
297 	ent = cmdq->base + (idx * cmdq->instr_size);
298 	memcpy(ent, &sr->instr, cmdq->instr_size);
299 
300 	atomic_set(&sr->status, REQ_POSTED);
301 	response_list_add(sr, cmdq);
302 	sr->tstamp = jiffies;
303 	/* flush the command queue updates */
304 	dma_wmb();
305 
306 	/* Ring doorbell with count 1 */
307 	writeq(1, cmdq->dbell_csr_addr);
308 
309 	cmdq->write_idx = incr_index(idx, 1, ndev->qlen);
310 
311 	spin_unlock_bh(&cmdq->cmd_qlock);
312 
313 	/* increment the posted command count */
314 	atomic64_inc(&ndev->stats.posted);
315 }
316 
317 static int post_backlog_cmds(struct nitrox_cmdq *cmdq)
318 {
319 	struct nitrox_device *ndev = cmdq->ndev;
320 	struct nitrox_softreq *sr, *tmp;
321 	int ret = 0;
322 
323 	if (!atomic_read(&cmdq->backlog_count))
324 		return 0;
325 
326 	spin_lock_bh(&cmdq->backlog_qlock);
327 
328 	list_for_each_entry_safe(sr, tmp, &cmdq->backlog_head, backlog) {
329 		/* submit until space available */
330 		if (unlikely(cmdq_full(cmdq, ndev->qlen))) {
331 			ret = -ENOSPC;
332 			break;
333 		}
334 		/* delete from backlog list */
335 		list_del(&sr->backlog);
336 		atomic_dec(&cmdq->backlog_count);
337 		/* sync with other cpus */
338 		smp_mb__after_atomic();
339 
340 		/* post the command */
341 		post_se_instr(sr, cmdq);
342 	}
343 	spin_unlock_bh(&cmdq->backlog_qlock);
344 
345 	return ret;
346 }
347 
348 static int nitrox_enqueue_request(struct nitrox_softreq *sr)
349 {
350 	struct nitrox_cmdq *cmdq = sr->cmdq;
351 	struct nitrox_device *ndev = sr->ndev;
352 
353 	/* try to post backlog requests */
354 	post_backlog_cmds(cmdq);
355 
356 	if (unlikely(cmdq_full(cmdq, ndev->qlen))) {
357 		if (!(sr->flags & CRYPTO_TFM_REQ_MAY_BACKLOG)) {
358 			/* increment drop count */
359 			atomic64_inc(&ndev->stats.dropped);
360 			return -ENOSPC;
361 		}
362 		/* add to backlog list */
363 		backlog_list_add(sr, cmdq);
364 		return -EINPROGRESS;
365 	}
366 	post_se_instr(sr, cmdq);
367 
368 	return -EINPROGRESS;
369 }
370 
371 /**
372  * nitrox_se_request - Send request to SE core
373  * @ndev: NITROX device
374  * @req: Crypto request
375  *
376  * Returns 0 on success, or a negative error code.
377  */
378 int nitrox_process_se_request(struct nitrox_device *ndev,
379 			      struct se_crypto_request *req,
380 			      completion_t callback,
381 			      void *cb_arg)
382 {
383 	struct nitrox_softreq *sr;
384 	dma_addr_t ctx_handle = 0;
385 	int qno, ret = 0;
386 
387 	if (!nitrox_ready(ndev))
388 		return -ENODEV;
389 
390 	sr = kzalloc(sizeof(*sr), req->gfp);
391 	if (!sr)
392 		return -ENOMEM;
393 
394 	sr->ndev = ndev;
395 	sr->flags = req->flags;
396 	sr->gfp = req->gfp;
397 	sr->callback = callback;
398 	sr->cb_arg = cb_arg;
399 
400 	atomic_set(&sr->status, REQ_NOT_POSTED);
401 
402 	sr->resp.orh = req->orh;
403 	sr->resp.completion = req->comp;
404 
405 	ret = softreq_map_iobuf(sr, req);
406 	if (ret) {
407 		kfree(sr);
408 		return ret;
409 	}
410 
411 	/* get the context handle */
412 	if (req->ctx_handle) {
413 		struct ctx_hdr *hdr;
414 		u8 *ctx_ptr;
415 
416 		ctx_ptr = (u8 *)(uintptr_t)req->ctx_handle;
417 		hdr = (struct ctx_hdr *)(ctx_ptr - sizeof(struct ctx_hdr));
418 		ctx_handle = hdr->ctx_dma;
419 	}
420 
421 	/* select the queue */
422 	qno = smp_processor_id() % ndev->nr_queues;
423 
424 	sr->cmdq = &ndev->pkt_inq[qno];
425 
426 	/*
427 	 * 64-Byte Instruction Format
428 	 *
429 	 *  ----------------------
430 	 *  |      DPTR0         | 8 bytes
431 	 *  ----------------------
432 	 *  |  PKT_IN_INSTR_HDR  | 8 bytes
433 	 *  ----------------------
434 	 *  |    PKT_IN_HDR      | 16 bytes
435 	 *  ----------------------
436 	 *  |    SLC_INFO        | 16 bytes
437 	 *  ----------------------
438 	 *  |   Front data       | 16 bytes
439 	 *  ----------------------
440 	 */
441 
442 	/* fill the packet instruction */
443 	/* word 0 */
444 	sr->instr.dptr0 = cpu_to_be64(sr->in.sgcomp_dma);
445 
446 	/* word 1 */
447 	sr->instr.ih.value = 0;
448 	sr->instr.ih.s.g = 1;
449 	sr->instr.ih.s.gsz = sr->in.sgmap_cnt;
450 	sr->instr.ih.s.ssz = sr->out.sgmap_cnt;
451 	sr->instr.ih.s.fsz = FDATA_SIZE + sizeof(struct gphdr);
452 	sr->instr.ih.s.tlen = sr->instr.ih.s.fsz + sr->in.total_bytes;
453 	sr->instr.ih.bev = cpu_to_be64(sr->instr.ih.value);
454 
455 	/* word 2 */
456 	sr->instr.irh.value[0] = 0;
457 	sr->instr.irh.s.uddl = MIN_UDD_LEN;
458 	/* context length in 64-bit words */
459 	sr->instr.irh.s.ctxl = (req->ctrl.s.ctxl / 8);
460 	/* offset from solicit base port 256 */
461 	sr->instr.irh.s.destport = SOLICIT_BASE_DPORT + qno;
462 	sr->instr.irh.s.ctxc = req->ctrl.s.ctxc;
463 	sr->instr.irh.s.arg = req->ctrl.s.arg;
464 	sr->instr.irh.s.opcode = req->opcode;
465 	sr->instr.irh.bev[0] = cpu_to_be64(sr->instr.irh.value[0]);
466 
467 	/* word 3 */
468 	sr->instr.irh.s.ctxp = cpu_to_be64(ctx_handle);
469 
470 	/* word 4 */
471 	sr->instr.slc.value[0] = 0;
472 	sr->instr.slc.s.ssz = sr->out.sgmap_cnt;
473 	sr->instr.slc.bev[0] = cpu_to_be64(sr->instr.slc.value[0]);
474 
475 	/* word 5 */
476 	sr->instr.slc.s.rptr = cpu_to_be64(sr->out.sgcomp_dma);
477 
478 	/*
479 	 * No conversion for front data,
480 	 * It goes into payload
481 	 * put GP Header in front data
482 	 */
483 	sr->instr.fdata[0] = *((u64 *)&req->gph);
484 	sr->instr.fdata[1] = 0;
485 
486 	ret = nitrox_enqueue_request(sr);
487 	if (ret == -ENOSPC)
488 		goto send_fail;
489 
490 	return ret;
491 
492 send_fail:
493 	softreq_destroy(sr);
494 	return ret;
495 }
496 
497 static inline int cmd_timeout(unsigned long tstamp, unsigned long timeout)
498 {
499 	return time_after_eq(jiffies, (tstamp + timeout));
500 }
501 
502 void backlog_qflush_work(struct work_struct *work)
503 {
504 	struct nitrox_cmdq *cmdq;
505 
506 	cmdq = container_of(work, struct nitrox_cmdq, backlog_qflush);
507 	post_backlog_cmds(cmdq);
508 }
509 
510 static bool sr_completed(struct nitrox_softreq *sr)
511 {
512 	u64 orh = READ_ONCE(*sr->resp.orh);
513 	unsigned long timeout = jiffies + msecs_to_jiffies(1);
514 
515 	if ((orh != PENDING_SIG) && (orh & 0xff))
516 		return true;
517 
518 	while (READ_ONCE(*sr->resp.completion) == PENDING_SIG) {
519 		if (time_after(jiffies, timeout)) {
520 			pr_err("comp not done\n");
521 			return false;
522 		}
523 	}
524 
525 	return true;
526 }
527 
528 /**
529  * process_request_list - process completed requests
530  * @ndev: N5 device
531  * @qno: queue to operate
532  *
533  * Returns the number of responses processed.
534  */
535 static void process_response_list(struct nitrox_cmdq *cmdq)
536 {
537 	struct nitrox_device *ndev = cmdq->ndev;
538 	struct nitrox_softreq *sr;
539 	int req_completed = 0, err = 0, budget;
540 	completion_t callback;
541 	void *cb_arg;
542 
543 	/* check all pending requests */
544 	budget = atomic_read(&cmdq->pending_count);
545 
546 	while (req_completed < budget) {
547 		sr = get_first_response_entry(cmdq);
548 		if (!sr)
549 			break;
550 
551 		if (atomic_read(&sr->status) != REQ_POSTED)
552 			break;
553 
554 		/* check orh and completion bytes updates */
555 		if (!sr_completed(sr)) {
556 			/* request not completed, check for timeout */
557 			if (!cmd_timeout(sr->tstamp, ndev->timeout))
558 				break;
559 			dev_err_ratelimited(DEV(ndev),
560 					    "Request timeout, orh 0x%016llx\n",
561 					    READ_ONCE(*sr->resp.orh));
562 		}
563 		atomic_dec(&cmdq->pending_count);
564 		atomic64_inc(&ndev->stats.completed);
565 		/* sync with other cpus */
566 		smp_mb__after_atomic();
567 		/* remove from response list */
568 		response_list_del(sr, cmdq);
569 		/* ORH error code */
570 		err = READ_ONCE(*sr->resp.orh) & 0xff;
571 		callback = sr->callback;
572 		cb_arg = sr->cb_arg;
573 		softreq_destroy(sr);
574 		if (callback)
575 			callback(cb_arg, err);
576 
577 		req_completed++;
578 	}
579 }
580 
581 /**
582  * pkt_slc_resp_tasklet - post processing of SE responses
583  */
584 void pkt_slc_resp_tasklet(unsigned long data)
585 {
586 	struct nitrox_q_vector *qvec = (void *)(uintptr_t)(data);
587 	struct nitrox_cmdq *cmdq = qvec->cmdq;
588 	union nps_pkt_slc_cnts slc_cnts;
589 
590 	/* read completion count */
591 	slc_cnts.value = readq(cmdq->compl_cnt_csr_addr);
592 	/* resend the interrupt if more work to do */
593 	slc_cnts.s.resend = 1;
594 
595 	process_response_list(cmdq);
596 
597 	/*
598 	 * clear the interrupt with resend bit enabled,
599 	 * MSI-X interrupt generates if Completion count > Threshold
600 	 */
601 	writeq(slc_cnts.value, cmdq->compl_cnt_csr_addr);
602 
603 	if (atomic_read(&cmdq->backlog_count))
604 		schedule_work(&cmdq->backlog_qflush);
605 }
606