Path: blob/main/sys/contrib/openzfs/module/os/linux/zfs/qat_compress.c
48775 views
// SPDX-License-Identifier: CDDL-1.0
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or https://opensource.org/licenses/CDDL-1.0.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */

#if defined(_KERNEL) && defined(HAVE_QAT)
#include <linux/slab.h>
#include <linux/string.h>
#include <linux/vmalloc.h>
#include <linux/pagemap.h>
#include <linux/completion.h>
#include <sys/zfs_context.h>
#include <sys/byteorder.h>
#include <sys/zio.h>
#include <sys/qat.h>

/*
 * Max instances in a QAT device, each instance is a channel to submit
 * jobs to QAT hardware, this is only for pre-allocating instance and
 * session arrays; the actual number of instances are defined in the
 * QAT driver's configuration file.
 */
#define	QAT_DC_MAX_INSTANCES	48

/*
 * ZLIB head and foot size
 */
#define	ZLIB_HEAD_SZ		2
#define	ZLIB_FOOT_SZ		4

/* Per-instance state; only the first num_inst slots are in use. */
static CpaInstanceHandle dc_inst_handles[QAT_DC_MAX_INSTANCES];
static CpaDcSessionHandle session_handles[QAT_DC_MAX_INSTANCES];
static CpaBufferList **buffer_array[QAT_DC_MAX_INSTANCES];
static Cpa16U num_inst = 0;
/* Monotonic counter used to spread requests across instances. */
static Cpa32U inst_num = 0;
static boolean_t qat_dc_init_done = B_FALSE;
int zfs_qat_compress_disable = 0;

/*
 * Report whether a buffer of s_len bytes should be handed to QAT:
 * the tunable must not disable it, initialization must have completed,
 * and the length must lie within [QAT_MIN_BUF_SIZE, QAT_MAX_BUF_SIZE].
 */
boolean_t
qat_dc_use_accel(size_t s_len)
{
	return (!zfs_qat_compress_disable &&
	    qat_dc_init_done &&
	    s_len >= QAT_MIN_BUF_SIZE &&
	    s_len <= QAT_MAX_BUF_SIZE);
}

/*
 * Session callback registered with cpaDcInitSession().  p_callback is the
 * struct completion passed as the callback tag to cpaDcCompressData() /
 * cpaDcDecompressData(); signalling it wakes the waiting submitter.
 * The status argument is not consulted here; callers inspect
 * CpaDcRqResults.status after the wait.
 */
static void
qat_dc_callback(void *p_callback, CpaStatus status)
{
	if (p_callback != NULL)
		complete((struct completion *)p_callback);
}

/*
 * Stop every instance and release the session memory and intermediate
 * buffers attached to it, then mark the module as uninitialized.
 *
 * This is also the failure path of qat_dc_init(), so it must cope with
 * partially built state: qat_dc_init() zeroes each array/struct right
 * after allocating it, which lets the NULL checks below tell which
 * pieces actually exist.
 */
static void
qat_dc_clean(void)
{
	Cpa16U buff_num = 0;
	Cpa16U num_inter_buff_lists = 0;

	for (Cpa16U i = 0; i < num_inst; i++) {
		cpaDcStopInstance(dc_inst_handles[i]);
		QAT_PHYS_CONTIG_FREE(session_handles[i]);
		/* free intermediate buffers */
		if (buffer_array[i] != NULL) {
			/*
			 * Reset the count first so that a failing query
			 * cannot leave a stale value from a previous
			 * instance driving the loop below.
			 */
			num_inter_buff_lists = 0;
			cpaDcGetNumIntermediateBuffers(
			    dc_inst_handles[i], &num_inter_buff_lists);
			for (buff_num = 0; buff_num < num_inter_buff_lists;
			    buff_num++) {
				CpaBufferList *buffer_inter =
				    buffer_array[i][buff_num];

				/* slot never populated (init failed early) */
				if (buffer_inter == NULL)
					continue;

				if (buffer_inter->pBuffers) {
					QAT_PHYS_CONTIG_FREE(
					    buffer_inter->pBuffers->pData);
					QAT_PHYS_CONTIG_FREE(
					    buffer_inter->pBuffers);
				}
				QAT_PHYS_CONTIG_FREE(
				    buffer_inter->pPrivateMetaData);
				QAT_PHYS_CONTIG_FREE(buffer_inter);
				buffer_array[i][buff_num] = NULL;
			}

			/*
			 * Release the pointer array itself and clear the
			 * slot so a later init/clean cycle neither leaks
			 * it nor walks stale entries.
			 */
			QAT_PHYS_CONTIG_FREE(buffer_array[i]);
			buffer_array[i] = NULL;
		}
	}

	num_inst = 0;
	qat_dc_init_done = B_FALSE;
}

/*
 * Discover the QAT compression instances, give each one its intermediate
 * buffers, start it and create a stateless combined-direction DEFLATE
 * session (level 1, dynamic Huffman, Adler-32 checksum) on it.
 *
 * Returns 0 on success, or when no instances are configured (in which
 * case qat_dc_init_done stays B_FALSE); returns -1 on any failure after
 * undoing whatever had been set up.
 */
int
qat_dc_init(void)
{
	CpaStatus status = CPA_STATUS_SUCCESS;
	Cpa32U sess_size = 0;
	Cpa32U ctx_size = 0;
	Cpa16U num_inter_buff_lists = 0;
	Cpa16U buff_num = 0;
	Cpa32U buff_meta_size = 0;
	CpaDcSessionSetupData sd = {0};

	if (qat_dc_init_done)
		return (0);

	status = cpaDcGetNumInstances(&num_inst);
	if (status != CPA_STATUS_SUCCESS)
		return (-1);

	/* if the user has configured no QAT compression units just return */
	if (num_inst == 0)
		return (0);

	if (num_inst > QAT_DC_MAX_INSTANCES)
		num_inst = QAT_DC_MAX_INSTANCES;

	status = cpaDcGetInstances(num_inst, &dc_inst_handles[0]);
	if (status != CPA_STATUS_SUCCESS)
		return (-1);

	for (Cpa16U i = 0; i < num_inst; i++) {
		cpaDcSetAddressTranslation(dc_inst_handles[i],
		    (void*)virt_to_phys);

		status = cpaDcBufferListGetMetaSize(dc_inst_handles[i],
		    1, &buff_meta_size);
		if (status != CPA_STATUS_SUCCESS)
			goto fail;

		status = cpaDcGetNumIntermediateBuffers(
		    dc_inst_handles[i], &num_inter_buff_lists);
		if (status != CPA_STATUS_SUCCESS)
			goto fail;

		if (num_inter_buff_lists != 0) {
			status = QAT_PHYS_CONTIG_ALLOC(&buffer_array[i],
			    num_inter_buff_lists *
			    sizeof (CpaBufferList *));
			if (status != CPA_STATUS_SUCCESS)
				goto fail;
			/* lets qat_dc_clean() skip slots never filled in */
			memset(buffer_array[i], 0,
			    num_inter_buff_lists *
			    sizeof (CpaBufferList *));
		}

		/*
		 * Every allocation step is checked individually; a
		 * partially built list must never reach
		 * cpaDcStartInstance().
		 */
		for (buff_num = 0; buff_num < num_inter_buff_lists;
		    buff_num++) {
			CpaBufferList *inter;

			status = QAT_PHYS_CONTIG_ALLOC(
			    &buffer_array[i][buff_num],
			    sizeof (CpaBufferList));
			if (status != CPA_STATUS_SUCCESS)
				goto fail;
			inter = buffer_array[i][buff_num];
			memset(inter, 0, sizeof (CpaBufferList));

			status = QAT_PHYS_CONTIG_ALLOC(
			    &inter->pPrivateMetaData, buff_meta_size);
			if (status != CPA_STATUS_SUCCESS)
				goto fail;

			status = QAT_PHYS_CONTIG_ALLOC(
			    &inter->pBuffers, sizeof (CpaFlatBuffer));
			if (status != CPA_STATUS_SUCCESS)
				goto fail;
			memset(inter->pBuffers, 0, sizeof (CpaFlatBuffer));

			/*
			 * implementation requires an intermediate
			 * buffer approximately twice the size of
			 * output buffer, which is 2x max buffer
			 * size here.
			 */
			status = QAT_PHYS_CONTIG_ALLOC(
			    &inter->pBuffers->pData, 2 * QAT_MAX_BUF_SIZE);
			if (status != CPA_STATUS_SUCCESS)
				goto fail;

			inter->numBuffers = 1;
			inter->pBuffers->dataLenInBytes =
			    2 * QAT_MAX_BUF_SIZE;
		}

		status = cpaDcStartInstance(dc_inst_handles[i],
		    num_inter_buff_lists, buffer_array[i]);
		if (status != CPA_STATUS_SUCCESS)
			goto fail;

		sd.compLevel = CPA_DC_L1;
		sd.compType = CPA_DC_DEFLATE;
		sd.huffType = CPA_DC_HT_FULL_DYNAMIC;
		sd.sessDirection = CPA_DC_DIR_COMBINED;
		sd.sessState = CPA_DC_STATELESS;
#if (CPA_DC_API_VERSION_NUM_MAJOR == 1 && CPA_DC_API_VERSION_NUM_MINOR < 6)
		sd.deflateWindowSize = 7;
#endif
		sd.checksum = CPA_DC_ADLER32;
		status = cpaDcGetSessionSize(dc_inst_handles[i],
		    &sd, &sess_size, &ctx_size);
		if (status != CPA_STATUS_SUCCESS)
			goto fail;

		QAT_PHYS_CONTIG_ALLOC(&session_handles[i], sess_size);
		if (session_handles[i] == NULL)
			goto fail;

		status = cpaDcInitSession(dc_inst_handles[i],
		    session_handles[i],
		    &sd, NULL, qat_dc_callback);
		if (status != CPA_STATUS_SUCCESS)
			goto fail;
	}

	qat_dc_init_done = B_TRUE;
	return (0);
fail:
	qat_dc_clean();
	return (-1);
}

/*
 * Tear down QAT compression state; a no-op unless qat_dc_init()
 * previously completed successfully.
 */
void
qat_dc_fini(void)
{
	if (!qat_dc_init_done)
		return;

	qat_dc_clean();
}

/*
 * Compress or decompress src into dst through one QAT instance.
 *
 * The source and destination are described to the hardware as lists of
 * per-page flat buffers, each page being kmap()ed for the duration of
 * the request.  On success *c_len receives the number of bytes written
 * to dst: zlib header + deflate data + Adler-32 footer when compressing,
 * or the produced byte count when decompressing.
 *
 * The "add" parameter is an additional buffer which is passed
 * to QAT as a scratch buffer alongside the destination buffer
 * in case the "compressed" data ends up being larger than the
 * original source data. This is necessary to prevent QAT from
 * generating buffer overflow warnings for incompressible data.
 *
 * Returns CPA_STATUS_SUCCESS, CPA_STATUS_INCOMPRESSIBLE when the
 * compressed result does not fit in dst_len, or another CpaStatus
 * failure code.
 */
static int
qat_compress_impl(qat_compress_dir_t dir, char *src, int src_len,
    char *dst, int dst_len, char *add, int add_len, size_t *c_len)
{
	CpaInstanceHandle dc_inst_handle;
	CpaDcSessionHandle session_handle;
	CpaBufferList *buf_list_src = NULL;
	CpaBufferList *buf_list_dst = NULL;
	CpaFlatBuffer *flat_buf_src = NULL;
	CpaFlatBuffer *flat_buf_dst = NULL;
	Cpa8U *buffer_meta_src = NULL;
	Cpa8U *buffer_meta_dst = NULL;
	Cpa32U buffer_meta_size = 0;
	CpaDcRqResults dc_results = {.checksum = 1};
	CpaStatus status = CPA_STATUS_FAIL;
	Cpa32U hdr_sz = 0;
	Cpa32U compressed_sz;
	Cpa32U num_src_buf = (src_len >> PAGE_SHIFT) + 2;
	Cpa32U num_dst_buf = (dst_len >> PAGE_SHIFT) + 2;
	Cpa32U num_add_buf = (add_len >> PAGE_SHIFT) + 2;
	Cpa32U bytes_left;
	/*
	 * Number of pages actually kmap()ed for each region.  The cleanup
	 * path relies on these counters rather than on the buffer lists,
	 * which may be NULL or not yet filled in when an early step fails.
	 */
	Cpa32U src_pages = 0;
	Cpa32U dst_pages = 0;
	Cpa32U scratch_pages = 0;
	Cpa32U adler32 = 0;
	char *data;
	struct page *page;
	struct page **in_pages = NULL;
	struct page **out_pages = NULL;
	struct page **add_pages = NULL;
	Cpa32U page_off = 0;
	struct completion complete;
	Cpa32U page_num = 0;
	Cpa16U i;

	/*
	 * We increment num_src_buf and num_dst_buf by 2 to allow
	 * us to handle non page-aligned buffer addresses and buffers
	 * whose sizes are not divisible by PAGE_SIZE.
	 */
	Cpa32U src_buffer_list_mem_size = sizeof (CpaBufferList) +
	    (num_src_buf * sizeof (CpaFlatBuffer));
	Cpa32U dst_buffer_list_mem_size = sizeof (CpaBufferList) +
	    ((num_dst_buf + num_add_buf) * sizeof (CpaFlatBuffer));

	status = QAT_PHYS_CONTIG_ALLOC(&in_pages,
	    num_src_buf * sizeof (struct page *));
	if (status != CPA_STATUS_SUCCESS)
		goto fail;

	status = QAT_PHYS_CONTIG_ALLOC(&out_pages,
	    num_dst_buf * sizeof (struct page *));
	if (status != CPA_STATUS_SUCCESS)
		goto fail;

	status = QAT_PHYS_CONTIG_ALLOC(&add_pages,
	    num_add_buf * sizeof (struct page *));
	if (status != CPA_STATUS_SUCCESS)
		goto fail;

	/* pick the next instance in turn */
	i = (Cpa32U)atomic_inc_32_nv(&inst_num) % num_inst;
	dc_inst_handle = dc_inst_handles[i];
	session_handle = session_handles[i];

	status = cpaDcBufferListGetMetaSize(dc_inst_handle, num_src_buf,
	    &buffer_meta_size);
	if (status != CPA_STATUS_SUCCESS)
		goto fail;
	status = QAT_PHYS_CONTIG_ALLOC(&buffer_meta_src, buffer_meta_size);
	if (status != CPA_STATUS_SUCCESS)
		goto fail;

	status = cpaDcBufferListGetMetaSize(dc_inst_handle,
	    num_dst_buf + num_add_buf, &buffer_meta_size);
	if (status != CPA_STATUS_SUCCESS)
		goto fail;
	status = QAT_PHYS_CONTIG_ALLOC(&buffer_meta_dst, buffer_meta_size);
	if (status != CPA_STATUS_SUCCESS)
		goto fail;

	/* build source buffer list */
	status = QAT_PHYS_CONTIG_ALLOC(&buf_list_src, src_buffer_list_mem_size);
	if (status != CPA_STATUS_SUCCESS)
		goto fail;

	/* the flat buffer descriptors live right behind the list header */
	flat_buf_src = (CpaFlatBuffer *)(buf_list_src + 1);

	buf_list_src->pBuffers = flat_buf_src; /* always point to first one */

	/* build destination buffer list */
	status = QAT_PHYS_CONTIG_ALLOC(&buf_list_dst, dst_buffer_list_mem_size);
	if (status != CPA_STATUS_SUCCESS)
		goto fail;

	flat_buf_dst = (CpaFlatBuffer *)(buf_list_dst + 1);

	buf_list_dst->pBuffers = flat_buf_dst; /* always point to first one */

	/* map the source, one flat buffer per (partial) page */
	buf_list_src->numBuffers = 0;
	buf_list_src->pPrivateMetaData = buffer_meta_src;
	bytes_left = src_len;
	data = src;
	while (bytes_left > 0) {
		page_off = ((long)data & ~PAGE_MASK);
		page = qat_mem_to_page(data);
		in_pages[src_pages] = page;
		flat_buf_src->pData = kmap(page) + page_off;
		flat_buf_src->dataLenInBytes =
		    min((long)PAGE_SIZE - page_off, (long)bytes_left);

		bytes_left -= flat_buf_src->dataLenInBytes;
		data += flat_buf_src->dataLenInBytes;
		flat_buf_src++;
		buf_list_src->numBuffers++;
		src_pages++;
	}

	/* map the destination the same way */
	buf_list_dst->numBuffers = 0;
	buf_list_dst->pPrivateMetaData = buffer_meta_dst;
	bytes_left = dst_len;
	data = dst;
	while (bytes_left > 0) {
		page_off = ((long)data & ~PAGE_MASK);
		page = qat_mem_to_page(data);
		flat_buf_dst->pData = kmap(page) + page_off;
		out_pages[dst_pages] = page;
		flat_buf_dst->dataLenInBytes =
		    min((long)PAGE_SIZE - page_off, (long)bytes_left);

		bytes_left -= flat_buf_dst->dataLenInBytes;
		data += flat_buf_dst->dataLenInBytes;
		flat_buf_dst++;
		buf_list_dst->numBuffers++;
		dst_pages++;
	}

	/* map additional scratch pages into the destination buffer list */
	bytes_left = add_len;
	data = add;
	while (bytes_left > 0) {
		page_off = ((long)data & ~PAGE_MASK);
		page = qat_mem_to_page(data);
		flat_buf_dst->pData = kmap(page) + page_off;
		add_pages[scratch_pages] = page;
		flat_buf_dst->dataLenInBytes =
		    min((long)PAGE_SIZE - page_off, (long)bytes_left);

		bytes_left -= flat_buf_dst->dataLenInBytes;
		data += flat_buf_dst->dataLenInBytes;
		flat_buf_dst++;
		buf_list_dst->numBuffers++;
		scratch_pages++;
	}

	init_completion(&complete);

	if (dir == QAT_COMPRESS) {
		QAT_STAT_BUMP(comp_requests);
		QAT_STAT_INCR(comp_total_in_bytes, src_len);

		/*
		 * Have the driver emit the stream header at the start of
		 * dst, then advance the first flat buffer past it so the
		 * deflate data lands right behind the header.
		 */
		status = cpaDcGenerateHeader(session_handle,
		    buf_list_dst->pBuffers, &hdr_sz);
		if (status != CPA_STATUS_SUCCESS)
			goto fail;
		buf_list_dst->pBuffers->pData += hdr_sz;
		buf_list_dst->pBuffers->dataLenInBytes -= hdr_sz;
		status = cpaDcCompressData(
		    dc_inst_handle, session_handle,
		    buf_list_src, buf_list_dst,
		    &dc_results, CPA_DC_FLUSH_FINAL,
		    &complete);
		if (status != CPA_STATUS_SUCCESS) {
			goto fail;
		}

		/* we now wait until the completion of the operation. */
		wait_for_completion(&complete);

		if (dc_results.status != CPA_STATUS_SUCCESS) {
			status = CPA_STATUS_FAIL;
			goto fail;
		}

		/* output spilled into the scratch area: not worth keeping */
		compressed_sz = dc_results.produced;
		if (compressed_sz + hdr_sz + ZLIB_FOOT_SZ > dst_len) {
			status = CPA_STATUS_INCOMPRESSIBLE;
			goto fail;
		}

		/* get adler32 checksum and append footer */
		*(Cpa32U*)(dst + hdr_sz + compressed_sz) =
		    BSWAP_32(dc_results.checksum);

		*c_len = hdr_sz + compressed_sz + ZLIB_FOOT_SZ;
		QAT_STAT_INCR(comp_total_out_bytes, *c_len);
	} else {
		ASSERT3U(dir, ==, QAT_DECOMPRESS);
		QAT_STAT_BUMP(decomp_requests);
		QAT_STAT_INCR(decomp_total_in_bytes, src_len);

		/* skip the zlib header; the hardware consumes raw deflate */
		buf_list_src->pBuffers->pData += ZLIB_HEAD_SZ;
		buf_list_src->pBuffers->dataLenInBytes -= ZLIB_HEAD_SZ;
		status = cpaDcDecompressData(dc_inst_handle, session_handle,
		    buf_list_src, buf_list_dst, &dc_results, CPA_DC_FLUSH_FINAL,
		    &complete);

		if (CPA_STATUS_SUCCESS != status) {
			status = CPA_STATUS_FAIL;
			goto fail;
		}

		/* we now wait until the completion of the operation. */
		wait_for_completion(&complete);

		if (dc_results.status != CPA_STATUS_SUCCESS) {
			status = CPA_STATUS_FAIL;
			goto fail;
		}

		/*
		 * The footer is read straight out of src; make sure the
		 * consumed byte count leaves room for it so a truncated
		 * stream cannot cause a read past the end of the buffer.
		 */
		if ((uint64_t)ZLIB_HEAD_SZ + dc_results.consumed +
		    ZLIB_FOOT_SZ > (uint64_t)src_len) {
			status = CPA_STATUS_FAIL;
			goto fail;
		}

		/* verify adler checksum */
		adler32 = *(Cpa32U *)(src + dc_results.consumed + ZLIB_HEAD_SZ);
		if (adler32 != BSWAP_32(dc_results.checksum)) {
			status = CPA_STATUS_FAIL;
			goto fail;
		}
		*c_len = dc_results.produced;
		QAT_STAT_INCR(decomp_total_out_bytes, *c_len);
	}

fail:
	if (status != CPA_STATUS_SUCCESS && status != CPA_STATUS_INCOMPRESSIBLE)
		QAT_STAT_BUMP(dc_fails);

	/* unmap exactly the pages that were mapped above */
	if (in_pages) {
		for (page_num = 0; page_num < src_pages; page_num++) {
			kunmap(in_pages[page_num]);
		}
		QAT_PHYS_CONTIG_FREE(in_pages);
	}

	if (out_pages) {
		for (page_num = 0; page_num < dst_pages; page_num++) {
			kunmap(out_pages[page_num]);
		}
		QAT_PHYS_CONTIG_FREE(out_pages);
	}

	if (add_pages) {
		for (page_num = 0; page_num < scratch_pages; page_num++) {
			kunmap(add_pages[page_num]);
		}
		QAT_PHYS_CONTIG_FREE(add_pages);
	}

	QAT_PHYS_CONTIG_FREE(buffer_meta_src);
	QAT_PHYS_CONTIG_FREE(buffer_meta_dst);
	QAT_PHYS_CONTIG_FREE(buf_list_src);
	QAT_PHYS_CONTIG_FREE(buf_list_dst);

	return (status);
}

/*
 * Entry point for QAT accelerated compression / decompression.
 *
 * When compressing, a scratch buffer of dst_len bytes is allocated for
 * the duration of the call and handed to qat_compress_impl() as the
 * overflow area; decompression uses no scratch buffer.  Returns the
 * status produced by qat_compress_impl().
 */
int
qat_compress(qat_compress_dir_t dir, char *src, int src_len,
    char *dst, int dst_len, size_t *c_len)
{
	int ret;
	size_t add_len = 0;
	void *add = NULL;

	if (dir == QAT_COMPRESS) {
		add_len = dst_len;
		add = zio_data_buf_alloc(add_len);
	}

	ret = qat_compress_impl(dir, src, src_len, dst,
	    dst_len, add, add_len, c_len);

	if (dir == QAT_COMPRESS)
		zio_data_buf_free(add, add_len);

	return (ret);
}

/*
 * Setter for the zfs_qat_compress_disable module parameter.  After
 * storing the new value, a value of 0 triggers QAT initialization if it
 * has not happened yet; should that fail, the parameter is forced back
 * to 1 and the error is returned to the writer.
 */
static int
param_set_qat_compress(const char *val, zfs_kernel_param_t *kp)
{
	int ret;
	int *pvalue = kp->arg;
	ret = param_set_int(val, kp);
	if (ret)
		return (ret);
	/*
	 * zfs_qat_compress_disable = 0: enable qat compress
	 * try to initialize qat instance if it has not been done
	 */
	if (*pvalue == 0 && !qat_dc_init_done) {
		ret = qat_dc_init();
		if (ret != 0) {
			zfs_qat_compress_disable = 1;
			return (ret);
		}
	}
	return (ret);
}

module_param_call(zfs_qat_compress_disable, param_set_qat_compress,
    param_get_int, &zfs_qat_compress_disable, 0644);
MODULE_PARM_DESC(zfs_qat_compress_disable, "Enable/Disable QAT compression");

#endif