Path: blob/master/drivers/crypto/hisilicon/zip/zip_crypto.c
26292 views
// SPDX-License-Identifier: GPL-2.01/* Copyright (c) 2019 HiSilicon Limited. */2#include <crypto/internal/acompress.h>3#include <linux/bitfield.h>4#include <linux/bitmap.h>5#include <linux/dma-mapping.h>6#include <linux/scatterlist.h>7#include "zip.h"89/* hisi_zip_sqe dw3 */10#define HZIP_BD_STATUS_M GENMASK(7, 0)11/* hisi_zip_sqe dw7 */12#define HZIP_IN_SGE_DATA_OFFSET_M GENMASK(23, 0)13#define HZIP_SQE_TYPE_M GENMASK(31, 28)14/* hisi_zip_sqe dw8 */15#define HZIP_OUT_SGE_DATA_OFFSET_M GENMASK(23, 0)16/* hisi_zip_sqe dw9 */17#define HZIP_REQ_TYPE_M GENMASK(7, 0)18#define HZIP_ALG_TYPE_DEFLATE 0x0119#define HZIP_BUF_TYPE_M GENMASK(11, 8)20#define HZIP_SGL 0x12122#define HZIP_ALG_PRIORITY 30023#define HZIP_SGL_SGE_NR 102425#define HZIP_ALG_DEFLATE GENMASK(5, 4)2627static DEFINE_MUTEX(zip_algs_lock);28static unsigned int zip_available_devs;2930enum hisi_zip_alg_type {31HZIP_ALG_TYPE_COMP = 0,32HZIP_ALG_TYPE_DECOMP = 1,33};3435enum {36HZIP_QPC_COMP,37HZIP_QPC_DECOMP,38HZIP_CTX_Q_NUM39};4041#define COMP_NAME_TO_TYPE(alg_name) \42(!strcmp((alg_name), "deflate") ? HZIP_ALG_TYPE_DEFLATE : 0)4344struct hisi_zip_req {45struct acomp_req *req;46struct hisi_acc_hw_sgl *hw_src;47struct hisi_acc_hw_sgl *hw_dst;48dma_addr_t dma_src;49dma_addr_t dma_dst;50u16 req_id;51};5253struct hisi_zip_req_q {54struct hisi_zip_req *q;55unsigned long *req_bitmap;56spinlock_t req_lock;57u16 size;58};5960struct hisi_zip_qp_ctx {61struct hisi_qp *qp;62struct hisi_zip_req_q req_q;63struct hisi_acc_sgl_pool *sgl_pool;64struct hisi_zip *zip_dev;65struct hisi_zip_ctx *ctx;66};6768struct hisi_zip_sqe_ops {69u8 sqe_type;70void (*fill_addr)(struct hisi_zip_sqe *sqe, struct hisi_zip_req *req);71void (*fill_buf_size)(struct hisi_zip_sqe *sqe, struct hisi_zip_req *req);72void (*fill_buf_type)(struct hisi_zip_sqe *sqe, u8 buf_type);73void (*fill_req_type)(struct hisi_zip_sqe *sqe, u8 req_type);74void (*fill_tag)(struct hisi_zip_sqe *sqe, struct hisi_zip_req *req);75void (*fill_sqe_type)(struct hisi_zip_sqe *sqe, u8 sqe_type);76u32 (*get_tag)(struct hisi_zip_sqe *sqe);77u32 (*get_status)(struct hisi_zip_sqe *sqe);78u32 (*get_dstlen)(struct hisi_zip_sqe *sqe);79};8081struct hisi_zip_ctx {82struct hisi_zip_qp_ctx qp_ctx[HZIP_CTX_Q_NUM];83const struct hisi_zip_sqe_ops *ops;84};8586static int sgl_sge_nr_set(const char *val, const struct kernel_param *kp)87{88int ret;89u16 n;9091if (!val)92return -EINVAL;9394ret = kstrtou16(val, 10, &n);95if (ret || n == 0 || n > HISI_ACC_SGL_SGE_NR_MAX)96return -EINVAL;9798return param_set_ushort(val, kp);99}100101static const struct kernel_param_ops sgl_sge_nr_ops = {102.set = sgl_sge_nr_set,103.get = param_get_ushort,104};105106static u16 sgl_sge_nr = HZIP_SGL_SGE_NR;107module_param_cb(sgl_sge_nr, &sgl_sge_nr_ops, &sgl_sge_nr, 0444);108MODULE_PARM_DESC(sgl_sge_nr, "Number of sge in sgl(1-255)");109110static struct hisi_zip_req *hisi_zip_create_req(struct hisi_zip_qp_ctx *qp_ctx,111struct acomp_req *req)112{113struct hisi_zip_req_q *req_q = &qp_ctx->req_q;114struct hisi_zip_req *q = req_q->q;115struct hisi_zip_req *req_cache;116int req_id;117118spin_lock(&req_q->req_lock);119120req_id = find_first_zero_bit(req_q->req_bitmap, req_q->size);121if (req_id >= req_q->size) {122spin_unlock(&req_q->req_lock);123dev_dbg(&qp_ctx->qp->qm->pdev->dev, "req cache is full!\n");124return ERR_PTR(-EAGAIN);125}126set_bit(req_id, req_q->req_bitmap);127128spin_unlock(&req_q->req_lock);129130req_cache = q + req_id;131req_cache->req_id = req_id;132req_cache->req = req;133134return req_cache;135}136137static void hisi_zip_remove_req(struct hisi_zip_qp_ctx *qp_ctx,138struct hisi_zip_req *req)139{140struct hisi_zip_req_q *req_q = &qp_ctx->req_q;141142spin_lock(&req_q->req_lock);143clear_bit(req->req_id, req_q->req_bitmap);144spin_unlock(&req_q->req_lock);145}146147static void hisi_zip_fill_addr(struct hisi_zip_sqe *sqe, struct hisi_zip_req *req)148{149sqe->source_addr_l = lower_32_bits(req->dma_src);150sqe->source_addr_h = upper_32_bits(req->dma_src);151sqe->dest_addr_l = lower_32_bits(req->dma_dst);152sqe->dest_addr_h = upper_32_bits(req->dma_dst);153}154155static void hisi_zip_fill_buf_size(struct hisi_zip_sqe *sqe, struct hisi_zip_req *req)156{157struct acomp_req *a_req = req->req;158159sqe->input_data_length = a_req->slen;160sqe->dest_avail_out = a_req->dlen;161}162163static void hisi_zip_fill_buf_type(struct hisi_zip_sqe *sqe, u8 buf_type)164{165u32 val;166167val = sqe->dw9 & ~HZIP_BUF_TYPE_M;168val |= FIELD_PREP(HZIP_BUF_TYPE_M, buf_type);169sqe->dw9 = val;170}171172static void hisi_zip_fill_req_type(struct hisi_zip_sqe *sqe, u8 req_type)173{174u32 val;175176val = sqe->dw9 & ~HZIP_REQ_TYPE_M;177val |= FIELD_PREP(HZIP_REQ_TYPE_M, req_type);178sqe->dw9 = val;179}180181static void hisi_zip_fill_tag(struct hisi_zip_sqe *sqe, struct hisi_zip_req *req)182{183sqe->dw26 = req->req_id;184}185186static void hisi_zip_fill_sqe_type(struct hisi_zip_sqe *sqe, u8 sqe_type)187{188u32 val;189190val = sqe->dw7 & ~HZIP_SQE_TYPE_M;191val |= FIELD_PREP(HZIP_SQE_TYPE_M, sqe_type);192sqe->dw7 = val;193}194195static void hisi_zip_fill_sqe(struct hisi_zip_ctx *ctx, struct hisi_zip_sqe *sqe,196u8 req_type, struct hisi_zip_req *req)197{198const struct hisi_zip_sqe_ops *ops = ctx->ops;199200memset(sqe, 0, sizeof(struct hisi_zip_sqe));201202ops->fill_addr(sqe, req);203ops->fill_buf_size(sqe, req);204ops->fill_buf_type(sqe, HZIP_SGL);205ops->fill_req_type(sqe, req_type);206ops->fill_tag(sqe, req);207ops->fill_sqe_type(sqe, ops->sqe_type);208}209210static int hisi_zip_do_work(struct hisi_zip_qp_ctx *qp_ctx,211struct hisi_zip_req *req)212{213struct hisi_acc_sgl_pool *pool = qp_ctx->sgl_pool;214struct hisi_zip_dfx *dfx = &qp_ctx->zip_dev->dfx;215struct hisi_zip_req_q *req_q = &qp_ctx->req_q;216struct acomp_req *a_req = req->req;217struct hisi_qp *qp = qp_ctx->qp;218struct device *dev = &qp->qm->pdev->dev;219struct hisi_zip_sqe zip_sqe;220int ret;221222if (unlikely(!a_req->src || !a_req->slen || !a_req->dst || !a_req->dlen))223return -EINVAL;224225req->hw_src = hisi_acc_sg_buf_map_to_hw_sgl(dev, a_req->src, pool,226req->req_id << 1, &req->dma_src,227DMA_TO_DEVICE);228if (IS_ERR(req->hw_src)) {229dev_err(dev, "failed to map the src buffer to hw sgl (%ld)!\n",230PTR_ERR(req->hw_src));231return PTR_ERR(req->hw_src);232}233234req->hw_dst = hisi_acc_sg_buf_map_to_hw_sgl(dev, a_req->dst, pool,235(req->req_id << 1) + 1,236&req->dma_dst, DMA_FROM_DEVICE);237if (IS_ERR(req->hw_dst)) {238ret = PTR_ERR(req->hw_dst);239dev_err(dev, "failed to map the dst buffer to hw slg (%d)!\n",240ret);241goto err_unmap_input;242}243244hisi_zip_fill_sqe(qp_ctx->ctx, &zip_sqe, qp->req_type, req);245246/* send command to start a task */247atomic64_inc(&dfx->send_cnt);248spin_lock_bh(&req_q->req_lock);249ret = hisi_qp_send(qp, &zip_sqe);250spin_unlock_bh(&req_q->req_lock);251if (unlikely(ret < 0)) {252atomic64_inc(&dfx->send_busy_cnt);253ret = -EAGAIN;254dev_dbg_ratelimited(dev, "failed to send request!\n");255goto err_unmap_output;256}257258return -EINPROGRESS;259260err_unmap_output:261hisi_acc_sg_buf_unmap(dev, a_req->dst, req->hw_dst, DMA_FROM_DEVICE);262err_unmap_input:263hisi_acc_sg_buf_unmap(dev, a_req->src, req->hw_src, DMA_TO_DEVICE);264return ret;265}266267static u32 hisi_zip_get_tag(struct hisi_zip_sqe *sqe)268{269return sqe->dw26;270}271272static u32 hisi_zip_get_status(struct hisi_zip_sqe *sqe)273{274return sqe->dw3 & HZIP_BD_STATUS_M;275}276277static u32 hisi_zip_get_dstlen(struct hisi_zip_sqe *sqe)278{279return sqe->produced;280}281282static void hisi_zip_acomp_cb(struct hisi_qp *qp, void *data)283{284struct hisi_zip_qp_ctx *qp_ctx = qp->qp_ctx;285const struct hisi_zip_sqe_ops *ops = qp_ctx->ctx->ops;286struct hisi_zip_dfx *dfx = &qp_ctx->zip_dev->dfx;287struct hisi_zip_req_q *req_q = &qp_ctx->req_q;288struct device *dev = &qp->qm->pdev->dev;289struct hisi_zip_sqe *sqe = data;290u32 tag = ops->get_tag(sqe);291struct hisi_zip_req *req = req_q->q + tag;292struct acomp_req *acomp_req = req->req;293int err = 0;294u32 status;295296atomic64_inc(&dfx->recv_cnt);297status = ops->get_status(sqe);298if (unlikely(status != 0 && status != HZIP_NC_ERR)) {299dev_err(dev, "%scompress fail in qp%u: %u, output: %u\n",300(qp->alg_type == 0) ? "" : "de", qp->qp_id, status,301sqe->produced);302atomic64_inc(&dfx->err_bd_cnt);303err = -EIO;304}305306hisi_acc_sg_buf_unmap(dev, acomp_req->dst, req->hw_dst, DMA_FROM_DEVICE);307hisi_acc_sg_buf_unmap(dev, acomp_req->src, req->hw_src, DMA_TO_DEVICE);308309acomp_req->dlen = ops->get_dstlen(sqe);310311if (acomp_req->base.complete)312acomp_request_complete(acomp_req, err);313314hisi_zip_remove_req(qp_ctx, req);315}316317static int hisi_zip_acompress(struct acomp_req *acomp_req)318{319struct hisi_zip_ctx *ctx = crypto_tfm_ctx(acomp_req->base.tfm);320struct hisi_zip_qp_ctx *qp_ctx = &ctx->qp_ctx[HZIP_QPC_COMP];321struct device *dev = &qp_ctx->qp->qm->pdev->dev;322struct hisi_zip_req *req;323int ret;324325req = hisi_zip_create_req(qp_ctx, acomp_req);326if (IS_ERR(req))327return PTR_ERR(req);328329ret = hisi_zip_do_work(qp_ctx, req);330if (unlikely(ret != -EINPROGRESS)) {331dev_info_ratelimited(dev, "failed to do compress (%d)!\n", ret);332hisi_zip_remove_req(qp_ctx, req);333}334335return ret;336}337338static int hisi_zip_adecompress(struct acomp_req *acomp_req)339{340struct hisi_zip_ctx *ctx = crypto_tfm_ctx(acomp_req->base.tfm);341struct hisi_zip_qp_ctx *qp_ctx = &ctx->qp_ctx[HZIP_QPC_DECOMP];342struct device *dev = &qp_ctx->qp->qm->pdev->dev;343struct hisi_zip_req *req;344int ret;345346req = hisi_zip_create_req(qp_ctx, acomp_req);347if (IS_ERR(req))348return PTR_ERR(req);349350ret = hisi_zip_do_work(qp_ctx, req);351if (unlikely(ret != -EINPROGRESS)) {352dev_info_ratelimited(dev, "failed to do decompress (%d)!\n",353ret);354hisi_zip_remove_req(qp_ctx, req);355}356357return ret;358}359360static int hisi_zip_start_qp(struct hisi_qp *qp, struct hisi_zip_qp_ctx *qp_ctx,361int alg_type, int req_type)362{363struct device *dev = &qp->qm->pdev->dev;364int ret;365366qp->req_type = req_type;367qp->alg_type = alg_type;368qp->qp_ctx = qp_ctx;369370ret = hisi_qm_start_qp(qp, 0);371if (ret < 0) {372dev_err(dev, "failed to start qp (%d)!\n", ret);373return ret;374}375376qp_ctx->qp = qp;377378return 0;379}380381static void hisi_zip_release_qp(struct hisi_zip_qp_ctx *qp_ctx)382{383hisi_qm_stop_qp(qp_ctx->qp);384hisi_qm_free_qps(&qp_ctx->qp, 1);385}386387static const struct hisi_zip_sqe_ops hisi_zip_ops = {388.sqe_type = 0x3,389.fill_addr = hisi_zip_fill_addr,390.fill_buf_size = hisi_zip_fill_buf_size,391.fill_buf_type = hisi_zip_fill_buf_type,392.fill_req_type = hisi_zip_fill_req_type,393.fill_tag = hisi_zip_fill_tag,394.fill_sqe_type = hisi_zip_fill_sqe_type,395.get_tag = hisi_zip_get_tag,396.get_status = hisi_zip_get_status,397.get_dstlen = hisi_zip_get_dstlen,398};399400static int hisi_zip_ctx_init(struct hisi_zip_ctx *hisi_zip_ctx, u8 req_type, int node)401{402struct hisi_qp *qps[HZIP_CTX_Q_NUM] = { NULL };403struct hisi_zip_qp_ctx *qp_ctx;404struct hisi_zip *hisi_zip;405int ret, i, j;406407ret = zip_create_qps(qps, HZIP_CTX_Q_NUM, node);408if (ret) {409pr_err("failed to create zip qps (%d)!\n", ret);410return -ENODEV;411}412413hisi_zip = container_of(qps[0]->qm, struct hisi_zip, qm);414415for (i = 0; i < HZIP_CTX_Q_NUM; i++) {416/* alg_type = 0 for compress, 1 for decompress in hw sqe */417qp_ctx = &hisi_zip_ctx->qp_ctx[i];418qp_ctx->ctx = hisi_zip_ctx;419ret = hisi_zip_start_qp(qps[i], qp_ctx, i, req_type);420if (ret) {421for (j = i - 1; j >= 0; j--)422hisi_qm_stop_qp(hisi_zip_ctx->qp_ctx[j].qp);423424hisi_qm_free_qps(qps, HZIP_CTX_Q_NUM);425return ret;426}427428qp_ctx->zip_dev = hisi_zip;429}430431hisi_zip_ctx->ops = &hisi_zip_ops;432433return 0;434}435436static void hisi_zip_ctx_exit(struct hisi_zip_ctx *hisi_zip_ctx)437{438int i;439440for (i = 0; i < HZIP_CTX_Q_NUM; i++)441hisi_zip_release_qp(&hisi_zip_ctx->qp_ctx[i]);442}443444static int hisi_zip_create_req_q(struct hisi_zip_ctx *ctx)445{446u16 q_depth = ctx->qp_ctx[0].qp->sq_depth;447struct hisi_zip_req_q *req_q;448int i, ret;449450for (i = 0; i < HZIP_CTX_Q_NUM; i++) {451req_q = &ctx->qp_ctx[i].req_q;452req_q->size = q_depth;453454req_q->req_bitmap = bitmap_zalloc(req_q->size, GFP_KERNEL);455if (!req_q->req_bitmap) {456ret = -ENOMEM;457if (i == 0)458return ret;459460goto err_free_comp_q;461}462spin_lock_init(&req_q->req_lock);463464req_q->q = kcalloc(req_q->size, sizeof(struct hisi_zip_req),465GFP_KERNEL);466if (!req_q->q) {467ret = -ENOMEM;468if (i == 0)469goto err_free_comp_bitmap;470else471goto err_free_decomp_bitmap;472}473}474475return 0;476477err_free_decomp_bitmap:478bitmap_free(ctx->qp_ctx[HZIP_QPC_DECOMP].req_q.req_bitmap);479err_free_comp_q:480kfree(ctx->qp_ctx[HZIP_QPC_COMP].req_q.q);481err_free_comp_bitmap:482bitmap_free(ctx->qp_ctx[HZIP_QPC_COMP].req_q.req_bitmap);483return ret;484}485486static void hisi_zip_release_req_q(struct hisi_zip_ctx *ctx)487{488int i;489490for (i = 0; i < HZIP_CTX_Q_NUM; i++) {491kfree(ctx->qp_ctx[i].req_q.q);492bitmap_free(ctx->qp_ctx[i].req_q.req_bitmap);493}494}495496static int hisi_zip_create_sgl_pool(struct hisi_zip_ctx *ctx)497{498u16 q_depth = ctx->qp_ctx[0].qp->sq_depth;499struct hisi_zip_qp_ctx *tmp;500struct device *dev;501int i;502503for (i = 0; i < HZIP_CTX_Q_NUM; i++) {504tmp = &ctx->qp_ctx[i];505dev = &tmp->qp->qm->pdev->dev;506tmp->sgl_pool = hisi_acc_create_sgl_pool(dev, q_depth << 1,507sgl_sge_nr);508if (IS_ERR(tmp->sgl_pool)) {509if (i == 1)510goto err_free_sgl_pool0;511return -ENOMEM;512}513}514515return 0;516517err_free_sgl_pool0:518hisi_acc_free_sgl_pool(&ctx->qp_ctx[HZIP_QPC_COMP].qp->qm->pdev->dev,519ctx->qp_ctx[HZIP_QPC_COMP].sgl_pool);520return -ENOMEM;521}522523static void hisi_zip_release_sgl_pool(struct hisi_zip_ctx *ctx)524{525int i;526527for (i = 0; i < HZIP_CTX_Q_NUM; i++)528hisi_acc_free_sgl_pool(&ctx->qp_ctx[i].qp->qm->pdev->dev,529ctx->qp_ctx[i].sgl_pool);530}531532static void hisi_zip_set_acomp_cb(struct hisi_zip_ctx *ctx,533void (*fn)(struct hisi_qp *, void *))534{535int i;536537for (i = 0; i < HZIP_CTX_Q_NUM; i++)538ctx->qp_ctx[i].qp->req_cb = fn;539}540541static int hisi_zip_acomp_init(struct crypto_acomp *tfm)542{543const char *alg_name = crypto_tfm_alg_name(&tfm->base);544struct hisi_zip_ctx *ctx = crypto_tfm_ctx(&tfm->base);545struct device *dev;546int ret;547548ret = hisi_zip_ctx_init(ctx, COMP_NAME_TO_TYPE(alg_name), tfm->base.node);549if (ret) {550pr_err("failed to init ctx (%d)!\n", ret);551return ret;552}553554dev = &ctx->qp_ctx[0].qp->qm->pdev->dev;555556ret = hisi_zip_create_req_q(ctx);557if (ret) {558dev_err(dev, "failed to create request queue (%d)!\n", ret);559goto err_ctx_exit;560}561562ret = hisi_zip_create_sgl_pool(ctx);563if (ret) {564dev_err(dev, "failed to create sgl pool (%d)!\n", ret);565goto err_release_req_q;566}567568hisi_zip_set_acomp_cb(ctx, hisi_zip_acomp_cb);569570return 0;571572err_release_req_q:573hisi_zip_release_req_q(ctx);574err_ctx_exit:575hisi_zip_ctx_exit(ctx);576return ret;577}578579static void hisi_zip_acomp_exit(struct crypto_acomp *tfm)580{581struct hisi_zip_ctx *ctx = crypto_tfm_ctx(&tfm->base);582583hisi_zip_set_acomp_cb(ctx, NULL);584hisi_zip_release_sgl_pool(ctx);585hisi_zip_release_req_q(ctx);586hisi_zip_ctx_exit(ctx);587}588589static struct acomp_alg hisi_zip_acomp_deflate = {590.init = hisi_zip_acomp_init,591.exit = hisi_zip_acomp_exit,592.compress = hisi_zip_acompress,593.decompress = hisi_zip_adecompress,594.base = {595.cra_name = "deflate",596.cra_driver_name = "hisi-deflate-acomp",597.cra_flags = CRYPTO_ALG_ASYNC,598.cra_module = THIS_MODULE,599.cra_priority = HZIP_ALG_PRIORITY,600.cra_ctxsize = sizeof(struct hisi_zip_ctx),601}602};603604static int hisi_zip_register_deflate(struct hisi_qm *qm)605{606int ret;607608if (!hisi_zip_alg_support(qm, HZIP_ALG_DEFLATE))609return 0;610611ret = crypto_register_acomp(&hisi_zip_acomp_deflate);612if (ret)613dev_err(&qm->pdev->dev, "failed to register to deflate (%d)!\n", ret);614615return ret;616}617618static void hisi_zip_unregister_deflate(struct hisi_qm *qm)619{620if (!hisi_zip_alg_support(qm, HZIP_ALG_DEFLATE))621return;622623crypto_unregister_acomp(&hisi_zip_acomp_deflate);624}625626int hisi_zip_register_to_crypto(struct hisi_qm *qm)627{628int ret = 0;629630mutex_lock(&zip_algs_lock);631if (zip_available_devs++)632goto unlock;633634ret = hisi_zip_register_deflate(qm);635if (ret)636zip_available_devs--;637638unlock:639mutex_unlock(&zip_algs_lock);640return ret;641}642643void hisi_zip_unregister_from_crypto(struct hisi_qm *qm)644{645mutex_lock(&zip_algs_lock);646if (--zip_available_devs)647goto unlock;648649hisi_zip_unregister_deflate(qm);650651unlock:652mutex_unlock(&zip_algs_lock);653}654655656