xref: /freebsd/sys/contrib/openzfs/module/os/linux/zfs/qat_compress.c (revision 61145dc2b94f12f6a47344fb9aac702321880e43)
1*61145dc2SMartin Matuska // SPDX-License-Identifier: CDDL-1.0
2eda14cbcSMatt Macy /*
3eda14cbcSMatt Macy  * CDDL HEADER START
4eda14cbcSMatt Macy  *
5eda14cbcSMatt Macy  * The contents of this file are subject to the terms of the
6eda14cbcSMatt Macy  * Common Development and Distribution License (the "License").
7eda14cbcSMatt Macy  * You may not use this file except in compliance with the License.
8eda14cbcSMatt Macy  *
9eda14cbcSMatt Macy  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
10271171e0SMartin Matuska  * or https://opensource.org/licenses/CDDL-1.0.
11eda14cbcSMatt Macy  * See the License for the specific language governing permissions
12eda14cbcSMatt Macy  * and limitations under the License.
13eda14cbcSMatt Macy  *
14eda14cbcSMatt Macy  * When distributing Covered Code, include this CDDL HEADER in each
15eda14cbcSMatt Macy  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
16eda14cbcSMatt Macy  * If applicable, add the following below this CDDL HEADER, with the
17eda14cbcSMatt Macy  * fields enclosed by brackets "[]" replaced with your own identifying
18eda14cbcSMatt Macy  * information: Portions Copyright [yyyy] [name of copyright owner]
19eda14cbcSMatt Macy  *
20eda14cbcSMatt Macy  * CDDL HEADER END
21eda14cbcSMatt Macy  */
22eda14cbcSMatt Macy 
23eda14cbcSMatt Macy #if defined(_KERNEL) && defined(HAVE_QAT)
24eda14cbcSMatt Macy #include <linux/slab.h>
25eda14cbcSMatt Macy #include <linux/vmalloc.h>
26eda14cbcSMatt Macy #include <linux/pagemap.h>
27eda14cbcSMatt Macy #include <linux/completion.h>
28eda14cbcSMatt Macy #include <sys/zfs_context.h>
29eda14cbcSMatt Macy #include <sys/byteorder.h>
30eda14cbcSMatt Macy #include <sys/zio.h>
31eda14cbcSMatt Macy #include <sys/qat.h>
32eda14cbcSMatt Macy 
33eda14cbcSMatt Macy /*
34eda14cbcSMatt Macy  * Max instances in a QAT device, each instance is a channel to submit
35eda14cbcSMatt Macy  * jobs to QAT hardware, this is only for pre-allocating instance and
36eda14cbcSMatt Macy  * session arrays; the actual number of instances are defined in the
37eda14cbcSMatt Macy  * QAT driver's configuration file.
38eda14cbcSMatt Macy  */
39eda14cbcSMatt Macy #define	QAT_DC_MAX_INSTANCES	48
40eda14cbcSMatt Macy 
41eda14cbcSMatt Macy /*
42eda14cbcSMatt Macy  * ZLIB head and foot size
43eda14cbcSMatt Macy  */
44eda14cbcSMatt Macy #define	ZLIB_HEAD_SZ		2
45eda14cbcSMatt Macy #define	ZLIB_FOOT_SZ		4
46eda14cbcSMatt Macy 
47eda14cbcSMatt Macy static CpaInstanceHandle dc_inst_handles[QAT_DC_MAX_INSTANCES];
48eda14cbcSMatt Macy static CpaDcSessionHandle session_handles[QAT_DC_MAX_INSTANCES];
49eda14cbcSMatt Macy static CpaBufferList **buffer_array[QAT_DC_MAX_INSTANCES];
50eda14cbcSMatt Macy static Cpa16U num_inst = 0;
51eda14cbcSMatt Macy static Cpa32U inst_num = 0;
52eda14cbcSMatt Macy static boolean_t qat_dc_init_done = B_FALSE;
53eda14cbcSMatt Macy int zfs_qat_compress_disable = 0;
54eda14cbcSMatt Macy 
55eda14cbcSMatt Macy boolean_t
qat_dc_use_accel(size_t s_len)56eda14cbcSMatt Macy qat_dc_use_accel(size_t s_len)
57eda14cbcSMatt Macy {
58eda14cbcSMatt Macy 	return (!zfs_qat_compress_disable &&
59eda14cbcSMatt Macy 	    qat_dc_init_done &&
60eda14cbcSMatt Macy 	    s_len >= QAT_MIN_BUF_SIZE &&
61eda14cbcSMatt Macy 	    s_len <= QAT_MAX_BUF_SIZE);
62eda14cbcSMatt Macy }
63eda14cbcSMatt Macy 
64eda14cbcSMatt Macy static void
qat_dc_callback(void * p_callback,CpaStatus status)65eda14cbcSMatt Macy qat_dc_callback(void *p_callback, CpaStatus status)
66eda14cbcSMatt Macy {
67eda14cbcSMatt Macy 	if (p_callback != NULL)
68eda14cbcSMatt Macy 		complete((struct completion *)p_callback);
69eda14cbcSMatt Macy }
70eda14cbcSMatt Macy 
71eda14cbcSMatt Macy static void
qat_dc_clean(void)72eda14cbcSMatt Macy qat_dc_clean(void)
73eda14cbcSMatt Macy {
74eda14cbcSMatt Macy 	Cpa16U buff_num = 0;
75eda14cbcSMatt Macy 	Cpa16U num_inter_buff_lists = 0;
76eda14cbcSMatt Macy 
77eda14cbcSMatt Macy 	for (Cpa16U i = 0; i < num_inst; i++) {
78eda14cbcSMatt Macy 		cpaDcStopInstance(dc_inst_handles[i]);
79eda14cbcSMatt Macy 		QAT_PHYS_CONTIG_FREE(session_handles[i]);
80eda14cbcSMatt Macy 		/* free intermediate buffers  */
81eda14cbcSMatt Macy 		if (buffer_array[i] != NULL) {
82eda14cbcSMatt Macy 			cpaDcGetNumIntermediateBuffers(
83eda14cbcSMatt Macy 			    dc_inst_handles[i], &num_inter_buff_lists);
84eda14cbcSMatt Macy 			for (buff_num = 0; buff_num < num_inter_buff_lists;
85eda14cbcSMatt Macy 			    buff_num++) {
86eda14cbcSMatt Macy 				CpaBufferList *buffer_inter =
87eda14cbcSMatt Macy 				    buffer_array[i][buff_num];
88eda14cbcSMatt Macy 				if (buffer_inter->pBuffers) {
89eda14cbcSMatt Macy 					QAT_PHYS_CONTIG_FREE(
90eda14cbcSMatt Macy 					    buffer_inter->pBuffers->pData);
91eda14cbcSMatt Macy 					QAT_PHYS_CONTIG_FREE(
92eda14cbcSMatt Macy 					    buffer_inter->pBuffers);
93eda14cbcSMatt Macy 				}
94eda14cbcSMatt Macy 				QAT_PHYS_CONTIG_FREE(
95eda14cbcSMatt Macy 				    buffer_inter->pPrivateMetaData);
96eda14cbcSMatt Macy 				QAT_PHYS_CONTIG_FREE(buffer_inter);
97eda14cbcSMatt Macy 			}
98eda14cbcSMatt Macy 		}
99eda14cbcSMatt Macy 	}
100eda14cbcSMatt Macy 
101eda14cbcSMatt Macy 	num_inst = 0;
102eda14cbcSMatt Macy 	qat_dc_init_done = B_FALSE;
103eda14cbcSMatt Macy }
104eda14cbcSMatt Macy 
105eda14cbcSMatt Macy int
qat_dc_init(void)106eda14cbcSMatt Macy qat_dc_init(void)
107eda14cbcSMatt Macy {
108eda14cbcSMatt Macy 	CpaStatus status = CPA_STATUS_SUCCESS;
109eda14cbcSMatt Macy 	Cpa32U sess_size = 0;
110eda14cbcSMatt Macy 	Cpa32U ctx_size = 0;
111eda14cbcSMatt Macy 	Cpa16U num_inter_buff_lists = 0;
112eda14cbcSMatt Macy 	Cpa16U buff_num = 0;
113eda14cbcSMatt Macy 	Cpa32U buff_meta_size = 0;
114eda14cbcSMatt Macy 	CpaDcSessionSetupData sd = {0};
115eda14cbcSMatt Macy 
116eda14cbcSMatt Macy 	if (qat_dc_init_done)
117eda14cbcSMatt Macy 		return (0);
118eda14cbcSMatt Macy 
119eda14cbcSMatt Macy 	status = cpaDcGetNumInstances(&num_inst);
120eda14cbcSMatt Macy 	if (status != CPA_STATUS_SUCCESS)
121eda14cbcSMatt Macy 		return (-1);
122eda14cbcSMatt Macy 
123eda14cbcSMatt Macy 	/* if the user has configured no QAT compression units just return */
124eda14cbcSMatt Macy 	if (num_inst == 0)
125eda14cbcSMatt Macy 		return (0);
126eda14cbcSMatt Macy 
127eda14cbcSMatt Macy 	if (num_inst > QAT_DC_MAX_INSTANCES)
128eda14cbcSMatt Macy 		num_inst = QAT_DC_MAX_INSTANCES;
129eda14cbcSMatt Macy 
130eda14cbcSMatt Macy 	status = cpaDcGetInstances(num_inst, &dc_inst_handles[0]);
131eda14cbcSMatt Macy 	if (status != CPA_STATUS_SUCCESS)
132eda14cbcSMatt Macy 		return (-1);
133eda14cbcSMatt Macy 
134eda14cbcSMatt Macy 	for (Cpa16U i = 0; i < num_inst; i++) {
135eda14cbcSMatt Macy 		cpaDcSetAddressTranslation(dc_inst_handles[i],
136eda14cbcSMatt Macy 		    (void*)virt_to_phys);
137eda14cbcSMatt Macy 
138eda14cbcSMatt Macy 		status = cpaDcBufferListGetMetaSize(dc_inst_handles[i],
139eda14cbcSMatt Macy 		    1, &buff_meta_size);
140eda14cbcSMatt Macy 
141eda14cbcSMatt Macy 		if (status == CPA_STATUS_SUCCESS)
142eda14cbcSMatt Macy 			status = cpaDcGetNumIntermediateBuffers(
143eda14cbcSMatt Macy 			    dc_inst_handles[i], &num_inter_buff_lists);
144eda14cbcSMatt Macy 
145eda14cbcSMatt Macy 		if (status == CPA_STATUS_SUCCESS && num_inter_buff_lists != 0)
146eda14cbcSMatt Macy 			status = QAT_PHYS_CONTIG_ALLOC(&buffer_array[i],
147eda14cbcSMatt Macy 			    num_inter_buff_lists *
148eda14cbcSMatt Macy 			    sizeof (CpaBufferList *));
149eda14cbcSMatt Macy 
150eda14cbcSMatt Macy 		for (buff_num = 0; buff_num < num_inter_buff_lists;
151eda14cbcSMatt Macy 		    buff_num++) {
152eda14cbcSMatt Macy 			if (status == CPA_STATUS_SUCCESS)
153eda14cbcSMatt Macy 				status = QAT_PHYS_CONTIG_ALLOC(
154eda14cbcSMatt Macy 				    &buffer_array[i][buff_num],
155eda14cbcSMatt Macy 				    sizeof (CpaBufferList));
156eda14cbcSMatt Macy 
157eda14cbcSMatt Macy 			if (status == CPA_STATUS_SUCCESS)
158eda14cbcSMatt Macy 				status = QAT_PHYS_CONTIG_ALLOC(
159eda14cbcSMatt Macy 				    &buffer_array[i][buff_num]->
160eda14cbcSMatt Macy 				    pPrivateMetaData,
161eda14cbcSMatt Macy 				    buff_meta_size);
162eda14cbcSMatt Macy 
163eda14cbcSMatt Macy 			if (status == CPA_STATUS_SUCCESS)
164eda14cbcSMatt Macy 				status = QAT_PHYS_CONTIG_ALLOC(
165eda14cbcSMatt Macy 				    &buffer_array[i][buff_num]->pBuffers,
166eda14cbcSMatt Macy 				    sizeof (CpaFlatBuffer));
167eda14cbcSMatt Macy 
168eda14cbcSMatt Macy 			if (status == CPA_STATUS_SUCCESS) {
169eda14cbcSMatt Macy 				/*
170eda14cbcSMatt Macy 				 *  implementation requires an intermediate
171eda14cbcSMatt Macy 				 *  buffer approximately twice the size of
172eda14cbcSMatt Macy 				 *  output buffer, which is 2x max buffer
173eda14cbcSMatt Macy 				 *  size here.
174eda14cbcSMatt Macy 				 */
175eda14cbcSMatt Macy 				status = QAT_PHYS_CONTIG_ALLOC(
176eda14cbcSMatt Macy 				    &buffer_array[i][buff_num]->pBuffers->
177eda14cbcSMatt Macy 				    pData, 2 * QAT_MAX_BUF_SIZE);
178eda14cbcSMatt Macy 				if (status != CPA_STATUS_SUCCESS)
179eda14cbcSMatt Macy 					goto fail;
180eda14cbcSMatt Macy 
181eda14cbcSMatt Macy 				buffer_array[i][buff_num]->numBuffers = 1;
182eda14cbcSMatt Macy 				buffer_array[i][buff_num]->pBuffers->
183eda14cbcSMatt Macy 				    dataLenInBytes = 2 * QAT_MAX_BUF_SIZE;
184eda14cbcSMatt Macy 			}
185eda14cbcSMatt Macy 		}
186eda14cbcSMatt Macy 
187eda14cbcSMatt Macy 		status = cpaDcStartInstance(dc_inst_handles[i],
188eda14cbcSMatt Macy 		    num_inter_buff_lists, buffer_array[i]);
189eda14cbcSMatt Macy 		if (status != CPA_STATUS_SUCCESS)
190eda14cbcSMatt Macy 			goto fail;
191eda14cbcSMatt Macy 
192eda14cbcSMatt Macy 		sd.compLevel = CPA_DC_L1;
193eda14cbcSMatt Macy 		sd.compType = CPA_DC_DEFLATE;
194eda14cbcSMatt Macy 		sd.huffType = CPA_DC_HT_FULL_DYNAMIC;
195eda14cbcSMatt Macy 		sd.sessDirection = CPA_DC_DIR_COMBINED;
196eda14cbcSMatt Macy 		sd.sessState = CPA_DC_STATELESS;
1973159b89bSMartin Matuska #if (CPA_DC_API_VERSION_NUM_MAJOR == 1 && CPA_DC_API_VERSION_NUM_MINOR < 6)
198eda14cbcSMatt Macy 		sd.deflateWindowSize = 7;
1993159b89bSMartin Matuska #endif
200eda14cbcSMatt Macy 		sd.checksum = CPA_DC_ADLER32;
201eda14cbcSMatt Macy 		status = cpaDcGetSessionSize(dc_inst_handles[i],
202eda14cbcSMatt Macy 		    &sd, &sess_size, &ctx_size);
203eda14cbcSMatt Macy 		if (status != CPA_STATUS_SUCCESS)
204eda14cbcSMatt Macy 			goto fail;
205eda14cbcSMatt Macy 
206eda14cbcSMatt Macy 		QAT_PHYS_CONTIG_ALLOC(&session_handles[i], sess_size);
207eda14cbcSMatt Macy 		if (session_handles[i] == NULL)
208eda14cbcSMatt Macy 			goto fail;
209eda14cbcSMatt Macy 
210eda14cbcSMatt Macy 		status = cpaDcInitSession(dc_inst_handles[i],
211eda14cbcSMatt Macy 		    session_handles[i],
212eda14cbcSMatt Macy 		    &sd, NULL, qat_dc_callback);
213eda14cbcSMatt Macy 		if (status != CPA_STATUS_SUCCESS)
214eda14cbcSMatt Macy 			goto fail;
215eda14cbcSMatt Macy 	}
216eda14cbcSMatt Macy 
217eda14cbcSMatt Macy 	qat_dc_init_done = B_TRUE;
218eda14cbcSMatt Macy 	return (0);
219eda14cbcSMatt Macy fail:
220eda14cbcSMatt Macy 	qat_dc_clean();
221eda14cbcSMatt Macy 	return (-1);
222eda14cbcSMatt Macy }
223eda14cbcSMatt Macy 
224eda14cbcSMatt Macy void
qat_dc_fini(void)225eda14cbcSMatt Macy qat_dc_fini(void)
226eda14cbcSMatt Macy {
227eda14cbcSMatt Macy 	if (!qat_dc_init_done)
228eda14cbcSMatt Macy 		return;
229eda14cbcSMatt Macy 
230eda14cbcSMatt Macy 	qat_dc_clean();
231eda14cbcSMatt Macy }
232eda14cbcSMatt Macy 
233eda14cbcSMatt Macy /*
234eda14cbcSMatt Macy  * The "add" parameter is an additional buffer which is passed
235eda14cbcSMatt Macy  * to QAT as a scratch buffer alongside the destination buffer
236eda14cbcSMatt Macy  * in case the "compressed" data ends up being larger than the
237eda14cbcSMatt Macy  * original source data. This is necessary to prevent QAT from
238eda14cbcSMatt Macy  * generating buffer overflow warnings for incompressible data.
239eda14cbcSMatt Macy  */
240eda14cbcSMatt Macy static int
qat_compress_impl(qat_compress_dir_t dir,char * src,int src_len,char * dst,int dst_len,char * add,int add_len,size_t * c_len)241eda14cbcSMatt Macy qat_compress_impl(qat_compress_dir_t dir, char *src, int src_len,
242eda14cbcSMatt Macy     char *dst, int dst_len, char *add, int add_len, size_t *c_len)
243eda14cbcSMatt Macy {
244eda14cbcSMatt Macy 	CpaInstanceHandle dc_inst_handle;
245eda14cbcSMatt Macy 	CpaDcSessionHandle session_handle;
246eda14cbcSMatt Macy 	CpaBufferList *buf_list_src = NULL;
247eda14cbcSMatt Macy 	CpaBufferList *buf_list_dst = NULL;
248eda14cbcSMatt Macy 	CpaFlatBuffer *flat_buf_src = NULL;
249eda14cbcSMatt Macy 	CpaFlatBuffer *flat_buf_dst = NULL;
250eda14cbcSMatt Macy 	Cpa8U *buffer_meta_src = NULL;
251eda14cbcSMatt Macy 	Cpa8U *buffer_meta_dst = NULL;
252eda14cbcSMatt Macy 	Cpa32U buffer_meta_size = 0;
2532a58b312SMartin Matuska 	CpaDcRqResults dc_results = {.checksum = 1};
254eda14cbcSMatt Macy 	CpaStatus status = CPA_STATUS_FAIL;
255eda14cbcSMatt Macy 	Cpa32U hdr_sz = 0;
256eda14cbcSMatt Macy 	Cpa32U compressed_sz;
257eda14cbcSMatt Macy 	Cpa32U num_src_buf = (src_len >> PAGE_SHIFT) + 2;
258eda14cbcSMatt Macy 	Cpa32U num_dst_buf = (dst_len >> PAGE_SHIFT) + 2;
259eda14cbcSMatt Macy 	Cpa32U num_add_buf = (add_len >> PAGE_SHIFT) + 2;
260eda14cbcSMatt Macy 	Cpa32U bytes_left;
261eda14cbcSMatt Macy 	Cpa32U dst_pages = 0;
262eda14cbcSMatt Macy 	Cpa32U adler32 = 0;
263eda14cbcSMatt Macy 	char *data;
264eda14cbcSMatt Macy 	struct page *page;
265eda14cbcSMatt Macy 	struct page **in_pages = NULL;
266eda14cbcSMatt Macy 	struct page **out_pages = NULL;
267eda14cbcSMatt Macy 	struct page **add_pages = NULL;
268eda14cbcSMatt Macy 	Cpa32U page_off = 0;
269eda14cbcSMatt Macy 	struct completion complete;
270eda14cbcSMatt Macy 	Cpa32U page_num = 0;
271eda14cbcSMatt Macy 	Cpa16U i;
272eda14cbcSMatt Macy 
273eda14cbcSMatt Macy 	/*
274eda14cbcSMatt Macy 	 * We increment num_src_buf and num_dst_buf by 2 to allow
275eda14cbcSMatt Macy 	 * us to handle non page-aligned buffer addresses and buffers
276eda14cbcSMatt Macy 	 * whose sizes are not divisible by PAGE_SIZE.
277eda14cbcSMatt Macy 	 */
278eda14cbcSMatt Macy 	Cpa32U src_buffer_list_mem_size = sizeof (CpaBufferList) +
279eda14cbcSMatt Macy 	    (num_src_buf * sizeof (CpaFlatBuffer));
280eda14cbcSMatt Macy 	Cpa32U dst_buffer_list_mem_size = sizeof (CpaBufferList) +
281eda14cbcSMatt Macy 	    ((num_dst_buf + num_add_buf) * sizeof (CpaFlatBuffer));
282eda14cbcSMatt Macy 
283eda14cbcSMatt Macy 	status = QAT_PHYS_CONTIG_ALLOC(&in_pages,
284eda14cbcSMatt Macy 	    num_src_buf * sizeof (struct page *));
285eda14cbcSMatt Macy 	if (status != CPA_STATUS_SUCCESS)
286eda14cbcSMatt Macy 		goto fail;
287eda14cbcSMatt Macy 
288eda14cbcSMatt Macy 	status = QAT_PHYS_CONTIG_ALLOC(&out_pages,
289eda14cbcSMatt Macy 	    num_dst_buf * sizeof (struct page *));
290eda14cbcSMatt Macy 	if (status != CPA_STATUS_SUCCESS)
291eda14cbcSMatt Macy 		goto fail;
292eda14cbcSMatt Macy 
293eda14cbcSMatt Macy 	status = QAT_PHYS_CONTIG_ALLOC(&add_pages,
294eda14cbcSMatt Macy 	    num_add_buf * sizeof (struct page *));
295eda14cbcSMatt Macy 	if (status != CPA_STATUS_SUCCESS)
296eda14cbcSMatt Macy 		goto fail;
297eda14cbcSMatt Macy 
298eda14cbcSMatt Macy 	i = (Cpa32U)atomic_inc_32_nv(&inst_num) % num_inst;
299eda14cbcSMatt Macy 	dc_inst_handle = dc_inst_handles[i];
300eda14cbcSMatt Macy 	session_handle = session_handles[i];
301eda14cbcSMatt Macy 
302eda14cbcSMatt Macy 	cpaDcBufferListGetMetaSize(dc_inst_handle, num_src_buf,
303eda14cbcSMatt Macy 	    &buffer_meta_size);
304eda14cbcSMatt Macy 	status = QAT_PHYS_CONTIG_ALLOC(&buffer_meta_src, buffer_meta_size);
305eda14cbcSMatt Macy 	if (status != CPA_STATUS_SUCCESS)
306eda14cbcSMatt Macy 		goto fail;
307eda14cbcSMatt Macy 
308eda14cbcSMatt Macy 	cpaDcBufferListGetMetaSize(dc_inst_handle, num_dst_buf + num_add_buf,
309eda14cbcSMatt Macy 	    &buffer_meta_size);
310eda14cbcSMatt Macy 	status = QAT_PHYS_CONTIG_ALLOC(&buffer_meta_dst, buffer_meta_size);
311eda14cbcSMatt Macy 	if (status != CPA_STATUS_SUCCESS)
312eda14cbcSMatt Macy 		goto fail;
313eda14cbcSMatt Macy 
314eda14cbcSMatt Macy 	/* build source buffer list */
315eda14cbcSMatt Macy 	status = QAT_PHYS_CONTIG_ALLOC(&buf_list_src, src_buffer_list_mem_size);
316eda14cbcSMatt Macy 	if (status != CPA_STATUS_SUCCESS)
317eda14cbcSMatt Macy 		goto fail;
318eda14cbcSMatt Macy 
319eda14cbcSMatt Macy 	flat_buf_src = (CpaFlatBuffer *)(buf_list_src + 1);
320eda14cbcSMatt Macy 
321eda14cbcSMatt Macy 	buf_list_src->pBuffers = flat_buf_src; /* always point to first one */
322eda14cbcSMatt Macy 
323eda14cbcSMatt Macy 	/* build destination buffer list */
324eda14cbcSMatt Macy 	status = QAT_PHYS_CONTIG_ALLOC(&buf_list_dst, dst_buffer_list_mem_size);
325eda14cbcSMatt Macy 	if (status != CPA_STATUS_SUCCESS)
326eda14cbcSMatt Macy 		goto fail;
327eda14cbcSMatt Macy 
328eda14cbcSMatt Macy 	flat_buf_dst = (CpaFlatBuffer *)(buf_list_dst + 1);
329eda14cbcSMatt Macy 
330eda14cbcSMatt Macy 	buf_list_dst->pBuffers = flat_buf_dst; /* always point to first one */
331eda14cbcSMatt Macy 
332eda14cbcSMatt Macy 	buf_list_src->numBuffers = 0;
333eda14cbcSMatt Macy 	buf_list_src->pPrivateMetaData = buffer_meta_src;
334eda14cbcSMatt Macy 	bytes_left = src_len;
335eda14cbcSMatt Macy 	data = src;
336eda14cbcSMatt Macy 	page_num = 0;
337eda14cbcSMatt Macy 	while (bytes_left > 0) {
338eda14cbcSMatt Macy 		page_off = ((long)data & ~PAGE_MASK);
339eda14cbcSMatt Macy 		page = qat_mem_to_page(data);
340eda14cbcSMatt Macy 		in_pages[page_num] = page;
341eda14cbcSMatt Macy 		flat_buf_src->pData = kmap(page) + page_off;
342eda14cbcSMatt Macy 		flat_buf_src->dataLenInBytes =
343eda14cbcSMatt Macy 		    min((long)PAGE_SIZE - page_off, (long)bytes_left);
344eda14cbcSMatt Macy 
345eda14cbcSMatt Macy 		bytes_left -= flat_buf_src->dataLenInBytes;
346eda14cbcSMatt Macy 		data += flat_buf_src->dataLenInBytes;
347eda14cbcSMatt Macy 		flat_buf_src++;
348eda14cbcSMatt Macy 		buf_list_src->numBuffers++;
349eda14cbcSMatt Macy 		page_num++;
350eda14cbcSMatt Macy 	}
351eda14cbcSMatt Macy 
352eda14cbcSMatt Macy 	buf_list_dst->numBuffers = 0;
353eda14cbcSMatt Macy 	buf_list_dst->pPrivateMetaData = buffer_meta_dst;
354eda14cbcSMatt Macy 	bytes_left = dst_len;
355eda14cbcSMatt Macy 	data = dst;
356eda14cbcSMatt Macy 	page_num = 0;
357eda14cbcSMatt Macy 	while (bytes_left > 0) {
358eda14cbcSMatt Macy 		page_off = ((long)data & ~PAGE_MASK);
359eda14cbcSMatt Macy 		page = qat_mem_to_page(data);
360eda14cbcSMatt Macy 		flat_buf_dst->pData = kmap(page) + page_off;
361eda14cbcSMatt Macy 		out_pages[page_num] = page;
362eda14cbcSMatt Macy 		flat_buf_dst->dataLenInBytes =
363eda14cbcSMatt Macy 		    min((long)PAGE_SIZE - page_off, (long)bytes_left);
364eda14cbcSMatt Macy 
365eda14cbcSMatt Macy 		bytes_left -= flat_buf_dst->dataLenInBytes;
366eda14cbcSMatt Macy 		data += flat_buf_dst->dataLenInBytes;
367eda14cbcSMatt Macy 		flat_buf_dst++;
368eda14cbcSMatt Macy 		buf_list_dst->numBuffers++;
369eda14cbcSMatt Macy 		page_num++;
370eda14cbcSMatt Macy 		dst_pages++;
371eda14cbcSMatt Macy 	}
372eda14cbcSMatt Macy 
373eda14cbcSMatt Macy 	/* map additional scratch pages into the destination buffer list */
374eda14cbcSMatt Macy 	bytes_left = add_len;
375eda14cbcSMatt Macy 	data = add;
376eda14cbcSMatt Macy 	page_num = 0;
377eda14cbcSMatt Macy 	while (bytes_left > 0) {
378eda14cbcSMatt Macy 		page_off = ((long)data & ~PAGE_MASK);
379eda14cbcSMatt Macy 		page = qat_mem_to_page(data);
380eda14cbcSMatt Macy 		flat_buf_dst->pData = kmap(page) + page_off;
381eda14cbcSMatt Macy 		add_pages[page_num] = page;
382eda14cbcSMatt Macy 		flat_buf_dst->dataLenInBytes =
383eda14cbcSMatt Macy 		    min((long)PAGE_SIZE - page_off, (long)bytes_left);
384eda14cbcSMatt Macy 
385eda14cbcSMatt Macy 		bytes_left -= flat_buf_dst->dataLenInBytes;
386eda14cbcSMatt Macy 		data += flat_buf_dst->dataLenInBytes;
387eda14cbcSMatt Macy 		flat_buf_dst++;
388eda14cbcSMatt Macy 		buf_list_dst->numBuffers++;
389eda14cbcSMatt Macy 		page_num++;
390eda14cbcSMatt Macy 	}
391eda14cbcSMatt Macy 
392eda14cbcSMatt Macy 	init_completion(&complete);
393eda14cbcSMatt Macy 
394eda14cbcSMatt Macy 	if (dir == QAT_COMPRESS) {
395eda14cbcSMatt Macy 		QAT_STAT_BUMP(comp_requests);
396eda14cbcSMatt Macy 		QAT_STAT_INCR(comp_total_in_bytes, src_len);
397eda14cbcSMatt Macy 
398eda14cbcSMatt Macy 		cpaDcGenerateHeader(session_handle,
399eda14cbcSMatt Macy 		    buf_list_dst->pBuffers, &hdr_sz);
400eda14cbcSMatt Macy 		buf_list_dst->pBuffers->pData += hdr_sz;
401eda14cbcSMatt Macy 		buf_list_dst->pBuffers->dataLenInBytes -= hdr_sz;
402eda14cbcSMatt Macy 		status = cpaDcCompressData(
403eda14cbcSMatt Macy 		    dc_inst_handle, session_handle,
404eda14cbcSMatt Macy 		    buf_list_src, buf_list_dst,
405eda14cbcSMatt Macy 		    &dc_results, CPA_DC_FLUSH_FINAL,
406eda14cbcSMatt Macy 		    &complete);
407eda14cbcSMatt Macy 		if (status != CPA_STATUS_SUCCESS) {
408eda14cbcSMatt Macy 			goto fail;
409eda14cbcSMatt Macy 		}
410eda14cbcSMatt Macy 
411eda14cbcSMatt Macy 		/* we now wait until the completion of the operation. */
412eda14cbcSMatt Macy 		wait_for_completion(&complete);
413eda14cbcSMatt Macy 
414eda14cbcSMatt Macy 		if (dc_results.status != CPA_STATUS_SUCCESS) {
415eda14cbcSMatt Macy 			status = CPA_STATUS_FAIL;
416eda14cbcSMatt Macy 			goto fail;
417eda14cbcSMatt Macy 		}
418eda14cbcSMatt Macy 
419eda14cbcSMatt Macy 		compressed_sz = dc_results.produced;
420eda14cbcSMatt Macy 		if (compressed_sz + hdr_sz + ZLIB_FOOT_SZ > dst_len) {
421eda14cbcSMatt Macy 			status = CPA_STATUS_INCOMPRESSIBLE;
422eda14cbcSMatt Macy 			goto fail;
423eda14cbcSMatt Macy 		}
424eda14cbcSMatt Macy 
4251f88aa09SMartin Matuska 		/* get adler32 checksum and append footer */
4261f88aa09SMartin Matuska 		*(Cpa32U*)(dst + hdr_sz + compressed_sz) =
4271f88aa09SMartin Matuska 		    BSWAP_32(dc_results.checksum);
428eda14cbcSMatt Macy 
4291f88aa09SMartin Matuska 		*c_len = hdr_sz + compressed_sz + ZLIB_FOOT_SZ;
430eda14cbcSMatt Macy 		QAT_STAT_INCR(comp_total_out_bytes, *c_len);
431eda14cbcSMatt Macy 	} else {
432eda14cbcSMatt Macy 		ASSERT3U(dir, ==, QAT_DECOMPRESS);
433eda14cbcSMatt Macy 		QAT_STAT_BUMP(decomp_requests);
434eda14cbcSMatt Macy 		QAT_STAT_INCR(decomp_total_in_bytes, src_len);
435eda14cbcSMatt Macy 
436eda14cbcSMatt Macy 		buf_list_src->pBuffers->pData += ZLIB_HEAD_SZ;
437eda14cbcSMatt Macy 		buf_list_src->pBuffers->dataLenInBytes -= ZLIB_HEAD_SZ;
438eda14cbcSMatt Macy 		status = cpaDcDecompressData(dc_inst_handle, session_handle,
439eda14cbcSMatt Macy 		    buf_list_src, buf_list_dst, &dc_results, CPA_DC_FLUSH_FINAL,
440eda14cbcSMatt Macy 		    &complete);
441eda14cbcSMatt Macy 
442eda14cbcSMatt Macy 		if (CPA_STATUS_SUCCESS != status) {
443eda14cbcSMatt Macy 			status = CPA_STATUS_FAIL;
444eda14cbcSMatt Macy 			goto fail;
445eda14cbcSMatt Macy 		}
446eda14cbcSMatt Macy 
447eda14cbcSMatt Macy 		/* we now wait until the completion of the operation. */
448eda14cbcSMatt Macy 		wait_for_completion(&complete);
449eda14cbcSMatt Macy 
450eda14cbcSMatt Macy 		if (dc_results.status != CPA_STATUS_SUCCESS) {
451eda14cbcSMatt Macy 			status = CPA_STATUS_FAIL;
452eda14cbcSMatt Macy 			goto fail;
453eda14cbcSMatt Macy 		}
454eda14cbcSMatt Macy 
455eda14cbcSMatt Macy 		/* verify adler checksum */
456eda14cbcSMatt Macy 		adler32 = *(Cpa32U *)(src + dc_results.consumed + ZLIB_HEAD_SZ);
457eda14cbcSMatt Macy 		if (adler32 != BSWAP_32(dc_results.checksum)) {
458eda14cbcSMatt Macy 			status = CPA_STATUS_FAIL;
459eda14cbcSMatt Macy 			goto fail;
460eda14cbcSMatt Macy 		}
461eda14cbcSMatt Macy 		*c_len = dc_results.produced;
462eda14cbcSMatt Macy 		QAT_STAT_INCR(decomp_total_out_bytes, *c_len);
463eda14cbcSMatt Macy 	}
464eda14cbcSMatt Macy 
465eda14cbcSMatt Macy fail:
466eda14cbcSMatt Macy 	if (status != CPA_STATUS_SUCCESS && status != CPA_STATUS_INCOMPRESSIBLE)
467eda14cbcSMatt Macy 		QAT_STAT_BUMP(dc_fails);
468eda14cbcSMatt Macy 
469eda14cbcSMatt Macy 	if (in_pages) {
470eda14cbcSMatt Macy 		for (page_num = 0;
471eda14cbcSMatt Macy 		    page_num < buf_list_src->numBuffers;
472eda14cbcSMatt Macy 		    page_num++) {
473eda14cbcSMatt Macy 			kunmap(in_pages[page_num]);
474eda14cbcSMatt Macy 		}
475eda14cbcSMatt Macy 		QAT_PHYS_CONTIG_FREE(in_pages);
476eda14cbcSMatt Macy 	}
477eda14cbcSMatt Macy 
478eda14cbcSMatt Macy 	if (out_pages) {
479eda14cbcSMatt Macy 		for (page_num = 0; page_num < dst_pages; page_num++) {
480eda14cbcSMatt Macy 			kunmap(out_pages[page_num]);
481eda14cbcSMatt Macy 		}
482eda14cbcSMatt Macy 		QAT_PHYS_CONTIG_FREE(out_pages);
483eda14cbcSMatt Macy 	}
484eda14cbcSMatt Macy 
485eda14cbcSMatt Macy 	if (add_pages) {
486eda14cbcSMatt Macy 		for (page_num = 0;
487eda14cbcSMatt Macy 		    page_num < buf_list_dst->numBuffers - dst_pages;
488eda14cbcSMatt Macy 		    page_num++) {
489eda14cbcSMatt Macy 			kunmap(add_pages[page_num]);
490eda14cbcSMatt Macy 		}
491eda14cbcSMatt Macy 		QAT_PHYS_CONTIG_FREE(add_pages);
492eda14cbcSMatt Macy 	}
493eda14cbcSMatt Macy 
494eda14cbcSMatt Macy 	QAT_PHYS_CONTIG_FREE(buffer_meta_src);
495eda14cbcSMatt Macy 	QAT_PHYS_CONTIG_FREE(buffer_meta_dst);
496eda14cbcSMatt Macy 	QAT_PHYS_CONTIG_FREE(buf_list_src);
497eda14cbcSMatt Macy 	QAT_PHYS_CONTIG_FREE(buf_list_dst);
498eda14cbcSMatt Macy 
499eda14cbcSMatt Macy 	return (status);
500eda14cbcSMatt Macy }
501eda14cbcSMatt Macy 
502eda14cbcSMatt Macy /*
503eda14cbcSMatt Macy  * Entry point for QAT accelerated compression / decompression.
504eda14cbcSMatt Macy  */
505eda14cbcSMatt Macy int
qat_compress(qat_compress_dir_t dir,char * src,int src_len,char * dst,int dst_len,size_t * c_len)506eda14cbcSMatt Macy qat_compress(qat_compress_dir_t dir, char *src, int src_len,
507eda14cbcSMatt Macy     char *dst, int dst_len, size_t *c_len)
508eda14cbcSMatt Macy {
509eda14cbcSMatt Macy 	int ret;
510eda14cbcSMatt Macy 	size_t add_len = 0;
511eda14cbcSMatt Macy 	void *add = NULL;
512eda14cbcSMatt Macy 
513eda14cbcSMatt Macy 	if (dir == QAT_COMPRESS) {
514eda14cbcSMatt Macy 		add_len = dst_len;
515eda14cbcSMatt Macy 		add = zio_data_buf_alloc(add_len);
516eda14cbcSMatt Macy 	}
517eda14cbcSMatt Macy 
518eda14cbcSMatt Macy 	ret = qat_compress_impl(dir, src, src_len, dst,
519eda14cbcSMatt Macy 	    dst_len, add, add_len, c_len);
520eda14cbcSMatt Macy 
521eda14cbcSMatt Macy 	if (dir == QAT_COMPRESS)
522eda14cbcSMatt Macy 		zio_data_buf_free(add, add_len);
523eda14cbcSMatt Macy 
524eda14cbcSMatt Macy 	return (ret);
525eda14cbcSMatt Macy }
526eda14cbcSMatt Macy 
527eda14cbcSMatt Macy static int
param_set_qat_compress(const char * val,zfs_kernel_param_t * kp)528eda14cbcSMatt Macy param_set_qat_compress(const char *val, zfs_kernel_param_t *kp)
529eda14cbcSMatt Macy {
530eda14cbcSMatt Macy 	int ret;
531eda14cbcSMatt Macy 	int *pvalue = kp->arg;
532eda14cbcSMatt Macy 	ret = param_set_int(val, kp);
533eda14cbcSMatt Macy 	if (ret)
534eda14cbcSMatt Macy 		return (ret);
535eda14cbcSMatt Macy 	/*
536eda14cbcSMatt Macy 	 * zfs_qat_compress_disable = 0: enable qat compress
537eda14cbcSMatt Macy 	 * try to initialize qat instance if it has not been done
538eda14cbcSMatt Macy 	 */
539eda14cbcSMatt Macy 	if (*pvalue == 0 && !qat_dc_init_done) {
540eda14cbcSMatt Macy 		ret = qat_dc_init();
541eda14cbcSMatt Macy 		if (ret != 0) {
542eda14cbcSMatt Macy 			zfs_qat_compress_disable = 1;
543eda14cbcSMatt Macy 			return (ret);
544eda14cbcSMatt Macy 		}
545eda14cbcSMatt Macy 	}
546eda14cbcSMatt Macy 	return (ret);
547eda14cbcSMatt Macy }
548eda14cbcSMatt Macy 
549eda14cbcSMatt Macy module_param_call(zfs_qat_compress_disable, param_set_qat_compress,
550eda14cbcSMatt Macy     param_get_int, &zfs_qat_compress_disable, 0644);
551eda14cbcSMatt Macy MODULE_PARM_DESC(zfs_qat_compress_disable, "Enable/Disable QAT compression");
552eda14cbcSMatt Macy 
553eda14cbcSMatt Macy #endif
554