4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
22 #if defined(_KERNEL) && defined(HAVE_QAT)
23 #include <linux/slab.h>
24 #include <linux/vmalloc.h>
25 #include <linux/pagemap.h>
26 #include <linux/completion.h>
27 #include <sys/zfs_context.h>
/*
 * Maximum number of instances in a QAT device. Each instance is a channel
 * for submitting jobs to the QAT hardware. This value is only used to
 * pre-allocate the instance and session arrays; the actual number of
 * instances is defined in the QAT driver's configuration file.
 */
37 #define QAT_DC_MAX_INSTANCES 48
40 * ZLIB head and foot size
42 #define ZLIB_HEAD_SZ 2
43 #define ZLIB_FOOT_SZ 4
45 static CpaInstanceHandle dc_inst_handles
[QAT_DC_MAX_INSTANCES
];
46 static CpaDcSessionHandle session_handles
[QAT_DC_MAX_INSTANCES
];
47 static CpaBufferList
**buffer_array
[QAT_DC_MAX_INSTANCES
];
48 static Cpa16U num_inst
= 0;
49 static Cpa32U inst_num
= 0;
50 static boolean_t qat_dc_init_done
= B_FALSE
;
51 int zfs_qat_compress_disable
= 0;
54 qat_dc_use_accel(size_t s_len
)
56 return (!zfs_qat_compress_disable
&&
58 s_len
>= QAT_MIN_BUF_SIZE
&&
59 s_len
<= QAT_MAX_BUF_SIZE
);
63 qat_dc_callback(void *p_callback
, CpaStatus status
)
65 if (p_callback
!= NULL
)
66 complete((struct completion
*)p_callback
);
73 Cpa16U num_inter_buff_lists
= 0;
75 for (Cpa16U i
= 0; i
< num_inst
; i
++) {
76 cpaDcStopInstance(dc_inst_handles
[i
]);
77 QAT_PHYS_CONTIG_FREE(session_handles
[i
]);
78 /* free intermediate buffers */
79 if (buffer_array
[i
] != NULL
) {
80 cpaDcGetNumIntermediateBuffers(
81 dc_inst_handles
[i
], &num_inter_buff_lists
);
82 for (buff_num
= 0; buff_num
< num_inter_buff_lists
;
84 CpaBufferList
*buffer_inter
=
85 buffer_array
[i
][buff_num
];
86 if (buffer_inter
->pBuffers
) {
88 buffer_inter
->pBuffers
->pData
);
90 buffer_inter
->pBuffers
);
93 buffer_inter
->pPrivateMetaData
);
94 QAT_PHYS_CONTIG_FREE(buffer_inter
);
100 qat_dc_init_done
= B_FALSE
;
106 CpaStatus status
= CPA_STATUS_SUCCESS
;
107 Cpa32U sess_size
= 0;
109 Cpa16U num_inter_buff_lists
= 0;
111 Cpa32U buff_meta_size
= 0;
112 CpaDcSessionSetupData sd
= {0};
114 status
= cpaDcGetNumInstances(&num_inst
);
115 if (status
!= CPA_STATUS_SUCCESS
)
118 /* if the user has configured no QAT compression units just return */
122 if (num_inst
> QAT_DC_MAX_INSTANCES
)
123 num_inst
= QAT_DC_MAX_INSTANCES
;
125 status
= cpaDcGetInstances(num_inst
, &dc_inst_handles
[0]);
126 if (status
!= CPA_STATUS_SUCCESS
)
129 for (Cpa16U i
= 0; i
< num_inst
; i
++) {
130 cpaDcSetAddressTranslation(dc_inst_handles
[i
],
131 (void*)virt_to_phys
);
133 status
= cpaDcBufferListGetMetaSize(dc_inst_handles
[i
],
136 if (status
== CPA_STATUS_SUCCESS
)
137 status
= cpaDcGetNumIntermediateBuffers(
138 dc_inst_handles
[i
], &num_inter_buff_lists
);
140 if (status
== CPA_STATUS_SUCCESS
&& num_inter_buff_lists
!= 0)
141 status
= QAT_PHYS_CONTIG_ALLOC(&buffer_array
[i
],
142 num_inter_buff_lists
*
143 sizeof (CpaBufferList
*));
145 for (buff_num
= 0; buff_num
< num_inter_buff_lists
;
147 if (status
== CPA_STATUS_SUCCESS
)
148 status
= QAT_PHYS_CONTIG_ALLOC(
149 &buffer_array
[i
][buff_num
],
150 sizeof (CpaBufferList
));
152 if (status
== CPA_STATUS_SUCCESS
)
153 status
= QAT_PHYS_CONTIG_ALLOC(
154 &buffer_array
[i
][buff_num
]->
158 if (status
== CPA_STATUS_SUCCESS
)
159 status
= QAT_PHYS_CONTIG_ALLOC(
160 &buffer_array
[i
][buff_num
]->pBuffers
,
161 sizeof (CpaFlatBuffer
));
163 if (status
== CPA_STATUS_SUCCESS
) {
165 * implementation requires an intermediate
166 * buffer approximately twice the size of
167 * output buffer, which is 2x max buffer
170 status
= QAT_PHYS_CONTIG_ALLOC(
171 &buffer_array
[i
][buff_num
]->pBuffers
->
172 pData
, 2 * QAT_MAX_BUF_SIZE
);
173 if (status
!= CPA_STATUS_SUCCESS
)
176 buffer_array
[i
][buff_num
]->numBuffers
= 1;
177 buffer_array
[i
][buff_num
]->pBuffers
->
178 dataLenInBytes
= 2 * QAT_MAX_BUF_SIZE
;
182 status
= cpaDcStartInstance(dc_inst_handles
[i
],
183 num_inter_buff_lists
, buffer_array
[i
]);
184 if (status
!= CPA_STATUS_SUCCESS
)
187 sd
.compLevel
= CPA_DC_L1
;
188 sd
.compType
= CPA_DC_DEFLATE
;
189 sd
.huffType
= CPA_DC_HT_FULL_DYNAMIC
;
190 sd
.sessDirection
= CPA_DC_DIR_COMBINED
;
191 sd
.sessState
= CPA_DC_STATELESS
;
192 sd
.deflateWindowSize
= 7;
193 sd
.checksum
= CPA_DC_ADLER32
;
194 status
= cpaDcGetSessionSize(dc_inst_handles
[i
],
195 &sd
, &sess_size
, &ctx_size
);
196 if (status
!= CPA_STATUS_SUCCESS
)
199 QAT_PHYS_CONTIG_ALLOC(&session_handles
[i
], sess_size
);
200 if (session_handles
[i
] == NULL
)
203 status
= cpaDcInitSession(dc_inst_handles
[i
],
205 &sd
, NULL
, qat_dc_callback
);
206 if (status
!= CPA_STATUS_SUCCESS
)
210 qat_dc_init_done
= B_TRUE
;
220 if (!qat_dc_init_done
)
227 * The "add" parameter is an additional buffer which is passed
228 * to QAT as a scratch buffer alongside the destination buffer
229 * in case the "compressed" data ends up being larger than the
230 * original source data. This is necessary to prevent QAT from
231 * generating buffer overflow warnings for incompressible data.
234 qat_compress_impl(qat_compress_dir_t dir
, char *src
, int src_len
,
235 char *dst
, int dst_len
, char *add
, int add_len
, size_t *c_len
)
237 CpaInstanceHandle dc_inst_handle
;
238 CpaDcSessionHandle session_handle
;
239 CpaBufferList
*buf_list_src
= NULL
;
240 CpaBufferList
*buf_list_dst
= NULL
;
241 CpaFlatBuffer
*flat_buf_src
= NULL
;
242 CpaFlatBuffer
*flat_buf_dst
= NULL
;
243 Cpa8U
*buffer_meta_src
= NULL
;
244 Cpa8U
*buffer_meta_dst
= NULL
;
245 Cpa32U buffer_meta_size
= 0;
246 CpaDcRqResults dc_results
;
247 CpaStatus status
= CPA_STATUS_SUCCESS
;
249 Cpa32U compressed_sz
;
250 Cpa32U num_src_buf
= (src_len
>> PAGE_SHIFT
) + 2;
251 Cpa32U num_dst_buf
= (dst_len
>> PAGE_SHIFT
) + 2;
252 Cpa32U num_add_buf
= (add_len
>> PAGE_SHIFT
) + 2;
254 Cpa32U dst_pages
= 0;
257 struct page
**in_pages
= NULL
;
258 struct page
**out_pages
= NULL
;
259 struct page
**add_pages
= NULL
;
261 struct completion complete
;
266 * We increment num_src_buf and num_dst_buf by 2 to allow
267 * us to handle non page-aligned buffer addresses and buffers
268 * whose sizes are not divisible by PAGE_SIZE.
270 Cpa32U src_buffer_list_mem_size
= sizeof (CpaBufferList
) +
271 (num_src_buf
* sizeof (CpaFlatBuffer
));
272 Cpa32U dst_buffer_list_mem_size
= sizeof (CpaBufferList
) +
273 ((num_dst_buf
+ num_add_buf
) * sizeof (CpaFlatBuffer
));
275 if (QAT_PHYS_CONTIG_ALLOC(&in_pages
,
276 num_src_buf
* sizeof (struct page
*)) != CPA_STATUS_SUCCESS
)
279 if (QAT_PHYS_CONTIG_ALLOC(&out_pages
,
280 num_dst_buf
* sizeof (struct page
*)) != CPA_STATUS_SUCCESS
)
283 if (QAT_PHYS_CONTIG_ALLOC(&add_pages
,
284 num_add_buf
* sizeof (struct page
*)) != CPA_STATUS_SUCCESS
)
287 i
= (Cpa32U
)atomic_inc_32_nv(&inst_num
) % num_inst
;
288 dc_inst_handle
= dc_inst_handles
[i
];
289 session_handle
= session_handles
[i
];
291 cpaDcBufferListGetMetaSize(dc_inst_handle
, num_src_buf
,
293 if (QAT_PHYS_CONTIG_ALLOC(&buffer_meta_src
, buffer_meta_size
) !=
297 cpaDcBufferListGetMetaSize(dc_inst_handle
, num_dst_buf
+ num_add_buf
,
299 if (QAT_PHYS_CONTIG_ALLOC(&buffer_meta_dst
, buffer_meta_size
) !=
303 /* build source buffer list */
304 if (QAT_PHYS_CONTIG_ALLOC(&buf_list_src
, src_buffer_list_mem_size
) !=
308 flat_buf_src
= (CpaFlatBuffer
*)(buf_list_src
+ 1);
310 buf_list_src
->pBuffers
= flat_buf_src
; /* always point to first one */
312 /* build destination buffer list */
313 if (QAT_PHYS_CONTIG_ALLOC(&buf_list_dst
, dst_buffer_list_mem_size
) !=
317 flat_buf_dst
= (CpaFlatBuffer
*)(buf_list_dst
+ 1);
319 buf_list_dst
->pBuffers
= flat_buf_dst
; /* always point to first one */
321 buf_list_src
->numBuffers
= 0;
322 buf_list_src
->pPrivateMetaData
= buffer_meta_src
;
323 bytes_left
= src_len
;
326 while (bytes_left
> 0) {
327 page_off
= ((long)data
& ~PAGE_MASK
);
328 page
= qat_mem_to_page(data
);
329 in_pages
[page_num
] = page
;
330 flat_buf_src
->pData
= kmap(page
) + page_off
;
331 flat_buf_src
->dataLenInBytes
=
332 min((long)PAGE_SIZE
- page_off
, (long)bytes_left
);
334 bytes_left
-= flat_buf_src
->dataLenInBytes
;
335 data
+= flat_buf_src
->dataLenInBytes
;
337 buf_list_src
->numBuffers
++;
341 buf_list_dst
->numBuffers
= 0;
342 buf_list_dst
->pPrivateMetaData
= buffer_meta_dst
;
343 bytes_left
= dst_len
;
346 while (bytes_left
> 0) {
347 page_off
= ((long)data
& ~PAGE_MASK
);
348 page
= qat_mem_to_page(data
);
349 flat_buf_dst
->pData
= kmap(page
) + page_off
;
350 out_pages
[page_num
] = page
;
351 flat_buf_dst
->dataLenInBytes
=
352 min((long)PAGE_SIZE
- page_off
, (long)bytes_left
);
354 bytes_left
-= flat_buf_dst
->dataLenInBytes
;
355 data
+= flat_buf_dst
->dataLenInBytes
;
357 buf_list_dst
->numBuffers
++;
362 /* map additional scratch pages into the destination buffer list */
363 bytes_left
= add_len
;
366 while (bytes_left
> 0) {
367 page_off
= ((long)data
& ~PAGE_MASK
);
368 page
= qat_mem_to_page(data
);
369 flat_buf_dst
->pData
= kmap(page
) + page_off
;
370 add_pages
[page_num
] = page
;
371 flat_buf_dst
->dataLenInBytes
=
372 min((long)PAGE_SIZE
- page_off
, (long)bytes_left
);
374 bytes_left
-= flat_buf_dst
->dataLenInBytes
;
375 data
+= flat_buf_dst
->dataLenInBytes
;
377 buf_list_dst
->numBuffers
++;
381 init_completion(&complete
);
383 if (dir
== QAT_COMPRESS
) {
384 QAT_STAT_BUMP(comp_requests
);
385 QAT_STAT_INCR(comp_total_in_bytes
, src_len
);
387 cpaDcGenerateHeader(session_handle
,
388 buf_list_dst
->pBuffers
, &hdr_sz
);
389 buf_list_dst
->pBuffers
->pData
+= hdr_sz
;
390 buf_list_dst
->pBuffers
->dataLenInBytes
-= hdr_sz
;
391 status
= cpaDcCompressData(
392 dc_inst_handle
, session_handle
,
393 buf_list_src
, buf_list_dst
,
394 &dc_results
, CPA_DC_FLUSH_FINAL
,
396 if (status
!= CPA_STATUS_SUCCESS
) {
400 /* we now wait until the completion of the operation. */
401 if (!wait_for_completion_interruptible_timeout(&complete
,
403 status
= CPA_STATUS_FAIL
;
407 if (dc_results
.status
!= CPA_STATUS_SUCCESS
) {
408 status
= CPA_STATUS_FAIL
;
412 compressed_sz
= dc_results
.produced
;
413 if (compressed_sz
+ hdr_sz
+ ZLIB_FOOT_SZ
> dst_len
) {
414 status
= CPA_STATUS_INCOMPRESSIBLE
;
418 flat_buf_dst
= (CpaFlatBuffer
*)(buf_list_dst
+ 1);
419 /* move to the last page */
420 flat_buf_dst
+= (compressed_sz
+ hdr_sz
) >> PAGE_SHIFT
;
422 /* no space for gzip footer in the last page */
423 if (((compressed_sz
+ hdr_sz
) % PAGE_SIZE
)
424 + ZLIB_FOOT_SZ
> PAGE_SIZE
) {
425 status
= CPA_STATUS_INCOMPRESSIBLE
;
429 /* jump to the end of the buffer and append footer */
430 flat_buf_dst
->pData
=
431 (char *)((unsigned long)flat_buf_dst
->pData
& PAGE_MASK
)
432 + ((compressed_sz
+ hdr_sz
) % PAGE_SIZE
);
433 flat_buf_dst
->dataLenInBytes
= ZLIB_FOOT_SZ
;
435 dc_results
.produced
= 0;
436 status
= cpaDcGenerateFooter(session_handle
,
437 flat_buf_dst
, &dc_results
);
438 if (status
!= CPA_STATUS_SUCCESS
)
441 *c_len
= compressed_sz
+ dc_results
.produced
+ hdr_sz
;
442 QAT_STAT_INCR(comp_total_out_bytes
, *c_len
);
444 ASSERT3U(dir
, ==, QAT_DECOMPRESS
);
445 QAT_STAT_BUMP(decomp_requests
);
446 QAT_STAT_INCR(decomp_total_in_bytes
, src_len
);
448 buf_list_src
->pBuffers
->pData
+= ZLIB_HEAD_SZ
;
449 buf_list_src
->pBuffers
->dataLenInBytes
-= ZLIB_HEAD_SZ
;
450 status
= cpaDcDecompressData(dc_inst_handle
, session_handle
,
451 buf_list_src
, buf_list_dst
, &dc_results
, CPA_DC_FLUSH_FINAL
,
454 if (CPA_STATUS_SUCCESS
!= status
) {
455 status
= CPA_STATUS_FAIL
;
459 /* we now wait until the completion of the operation. */
460 if (!wait_for_completion_interruptible_timeout(&complete
,
462 status
= CPA_STATUS_FAIL
;
466 if (dc_results
.status
!= CPA_STATUS_SUCCESS
) {
467 status
= CPA_STATUS_FAIL
;
471 *c_len
= dc_results
.produced
;
472 QAT_STAT_INCR(decomp_total_out_bytes
, *c_len
);
476 if (status
!= CPA_STATUS_SUCCESS
&& status
!= CPA_STATUS_INCOMPRESSIBLE
)
477 QAT_STAT_BUMP(dc_fails
);
481 page_num
< buf_list_src
->numBuffers
;
483 kunmap(in_pages
[page_num
]);
485 QAT_PHYS_CONTIG_FREE(in_pages
);
489 for (page_num
= 0; page_num
< dst_pages
; page_num
++) {
490 kunmap(out_pages
[page_num
]);
492 QAT_PHYS_CONTIG_FREE(out_pages
);
497 page_num
< buf_list_dst
->numBuffers
- dst_pages
;
499 kunmap(add_pages
[page_num
]);
501 QAT_PHYS_CONTIG_FREE(add_pages
);
504 QAT_PHYS_CONTIG_FREE(buffer_meta_src
);
505 QAT_PHYS_CONTIG_FREE(buffer_meta_dst
);
506 QAT_PHYS_CONTIG_FREE(buf_list_src
);
507 QAT_PHYS_CONTIG_FREE(buf_list_dst
);
513 * Entry point for QAT accelerated compression / decompression.
516 qat_compress(qat_compress_dir_t dir
, char *src
, int src_len
,
517 char *dst
, int dst_len
, size_t *c_len
)
523 if (dir
== QAT_COMPRESS
) {
525 add
= zio_data_buf_alloc(add_len
);
528 ret
= qat_compress_impl(dir
, src
, src_len
, dst
,
529 dst_len
, add
, add_len
, c_len
);
531 if (dir
== QAT_COMPRESS
)
532 zio_data_buf_free(add
, add_len
);
537 module_param(zfs_qat_compress_disable
, int, 0644);
538 MODULE_PARM_DESC(zfs_qat_compress_disable
, "Disable QAT compression");