blob: c42b235ba64f9574e43717e7700cc3c133be0f46 [file]
// SPDX-License-Identifier: (GPL-2.0+ OR MIT)
/*
* Copyright (c) 2019 Amlogic, Inc. All rights reserved.
*/
#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/slab.h>
#include <linux/err.h>
#include <linux/clk.h>
#include <linux/io.h>
#include <linux/hw_random.h>
#include <linux/platform_device.h>
#include <linux/pm_runtime.h>
#include <linux/of_device.h>
#include <linux/device.h>
#include <linux/init.h>
#include <linux/errno.h>
#include <linux/interrupt.h>
#include <linux/irq.h>
#include <linux/scatterlist.h>
#include <linux/dma-mapping.h>
#include <linux/delay.h>
#include <linux/crypto.h>
#include <crypto/scatterwalk.h>
#include <crypto/algapi.h>
#include <crypto/sm4.h>
#include <crypto/hash.h>
#include <crypto/internal/hash.h>
#include <linux/of_platform.h>
#include <crypto/skcipher.h>
#include "aml-crypto-dma.h"
#include <crypto/internal/skcipher.h>
/* SM4 flags */
#define SM4_FLAGS_MODE_MASK 0x07
#define SM4_FLAGS_ENCRYPT BIT(0)
#define SM4_FLAGS_CBC BIT(1)
#define SM4_FLAGS_CTR BIT(2)
#define SM4_FLAGS_INIT BIT(8)
#define SM4_FLAGS_DMA BIT(9)
#define SM4_FLAGS_FAST BIT(10)
#define SM4_FLAGS_BUSY BIT(11)
#define SM4_FLAGS_ERROR BIT(12)
#define AML_SM4_QUEUE_LENGTH 50
#define AML_SM4_DMA_THRESHOLD 16
#define DEFAULT_AUTOSUSPEND_DELAY 1000
struct aml_sm4_dev;
struct aml_sm4_ctx {
struct aml_sm4_dev *dd;
int keylen;
u32 key[SM4_KEY_SIZE / sizeof(u32)];
u16 block_size;
struct crypto_skcipher *fallback;
int kte;
};
struct aml_sm4_reqctx {
unsigned long mode;
};
struct aml_sm4_dev {
struct list_head list;
struct aml_sm4_ctx *ctx;
struct device *dev;
struct device *parent;
int irq;
unsigned long flags;
int err;
struct aml_dma_dev *dma;
u32 thread;
u32 status;
u8 link_mode;
struct crypto_queue queue;
struct tasklet_struct done_task;
struct tasklet_struct queue_task;
struct skcipher_request *req;
size_t total;
size_t fast_total;
struct scatterlist *in_sg;
size_t in_offset;
struct scatterlist *out_sg;
size_t out_offset;
size_t buflen;
size_t dma_size;
void *buf_in;
dma_addr_t dma_addr_in;
void *buf_out;
dma_addr_t dma_addr_out;
void *descriptor;
dma_addr_t dma_descript_tab;
void *sg_dsc_in;
dma_addr_t dma_sg_dsc_in;
void *sg_dsc_out;
dma_addr_t dma_sg_dsc_out;
u8 iv_swap;
};
struct aml_sm4_drv {
struct list_head dev_list;
spinlock_t lock; /* spinlock for device list */
};
struct aml_sm4_info {
struct skcipher_alg *algs;
u32 num_algs;
};
static struct aml_sm4_drv aml_sm4 = {
.dev_list = LIST_HEAD_INIT(aml_sm4.dev_list),
.lock = __SPIN_LOCK_UNLOCKED(aml_sm4.lock),
};
static int aml_sm4_crypt_dma_stop(struct aml_sm4_dev *dd);
static int set_sm4_kl_key_iv(struct aml_sm4_dev *dd, u32 *key,
u32 keylen, u32 *iv, u8 swap)
{
struct device *dev = dd->dev;
struct dma_dsc *dsc = dd->descriptor;
u32 *key_iv = kzalloc(DMA_KEY_IV_BUF_SIZE, GFP_ATOMIC);
s32 len = keylen;
dma_addr_t dma_addr_key = 0;
if (!key_iv) {
dev_err(dev, "error allocating key_iv buffer\n");
return -EINVAL;
}
if (iv) {
u32 *piv = key_iv; // + 8;
if (swap) {
*(piv + 3) = swap_ulong32(*iv);
*(piv + 2) = swap_ulong32(*(iv + 1));
*(piv + 1) = swap_ulong32(*(iv + 2));
*(piv + 0) = swap_ulong32(*(iv + 3));
} else {
memcpy(piv, iv, 16);
}
}
len = DMA_KEY_IV_BUF_SIZE; /* full key storage */
dma_addr_key = dma_map_single(dd->parent, key_iv,
DMA_KEY_IV_BUF_SIZE, DMA_TO_DEVICE);
if (dma_mapping_error(dd->parent, dma_addr_key)) {
dev_err(dev, "error mapping dma_addr_key\n");
kfree(key_iv);
return -EINVAL;
}
dsc[0].src_addr = (u32)(0xffffff00 | dd->ctx->kte);
dsc[0].tgt_addr = 0;
dsc[0].dsc_cfg.d32 = 0;
dsc[0].dsc_cfg.b.length = keylen;
dsc[0].dsc_cfg.b.mode = MODE_KEY;
dsc[0].dsc_cfg.b.eoc = 0;
dsc[0].dsc_cfg.b.owner = 1;
if (iv) {
dsc[1].src_addr = (u32)dma_addr_key;
dsc[1].tgt_addr = 32;
dsc[1].dsc_cfg.d32 = 0;
dsc[1].dsc_cfg.b.length = 16;
dsc[1].dsc_cfg.b.mode = MODE_KEY;
dsc[1].dsc_cfg.b.eoc = 1;
dsc[1].dsc_cfg.b.owner = 1;
} else {
dsc[0].dsc_cfg.b.eoc = 1;
}
aml_write_crypto_reg(dd->thread,
(uintptr_t)dd->dma_descript_tab | 2);
aml_dma_debug(dsc, 1, __func__, dd->thread, dd->status);
while (aml_read_crypto_reg(dd->status) == 0)
;
aml_write_crypto_reg(dd->status, 0xf);
dma_unmap_single(dd->parent, dma_addr_key,
DMA_KEY_IV_BUF_SIZE, DMA_TO_DEVICE);
kfree(key_iv);
return 0;
}
static int set_sm4_key_iv(struct aml_sm4_dev *dd, u32 *key,
u32 keylen, u32 *iv, u8 swap)
{
struct device *dev = dd->dev;
struct dma_dsc *dsc = dd->descriptor;
u32 *key_iv = kzalloc(DMA_KEY_IV_BUF_SIZE, GFP_ATOMIC);
s32 len = keylen;
dma_addr_t dma_addr_key = 0;
u8 status = 0;
int err = 0;
if (!key_iv) {
dev_err(dev, "error allocating key_iv buffer\n");
return -EINVAL;
}
if (key)
memcpy(key_iv, key, keylen);
if (iv) {
u32 *piv = key_iv + 8;
if (swap) {
*(piv + 3) = swap_ulong32(*iv);
*(piv + 2) = swap_ulong32(*(iv + 1));
*(piv + 1) = swap_ulong32(*(iv + 2));
*(piv + 0) = swap_ulong32(*(iv + 3));
} else {
memcpy(piv, iv, 16);
}
}
len = DMA_KEY_IV_BUF_SIZE; /* full key storage */
dma_addr_key = dma_map_single(dd->parent, key_iv,
DMA_KEY_IV_BUF_SIZE, DMA_TO_DEVICE);
if (dma_mapping_error(dd->parent, dma_addr_key)) {
dev_err(dev, "error mapping dma_addr_key\n");
kfree(key_iv);
return -EINVAL;
}
dsc[0].src_addr = (u32)dma_addr_key;
dsc[0].tgt_addr = 0;
dsc[0].dsc_cfg.d32 = 0;
dsc[0].dsc_cfg.b.length = len;
dsc[0].dsc_cfg.b.mode = MODE_KEY;
dsc[0].dsc_cfg.b.eoc = 1;
dsc[0].dsc_cfg.b.owner = 1;
aml_dma_debug(dsc, 1, __func__, dd->thread, dd->status);
#if DMA_IRQ_MODE
aml_write_crypto_reg(dd->thread,
(uintptr_t)dd->dma_descript_tab | 2);
while (aml_read_crypto_reg(dd->status) == 0)
;
status = aml_read_crypto_reg(dd->status);
if (status & DMA_STATUS_KEY_ERROR) {
dev_err(dev, "hw crypto failed.\n");
err = -EINVAL;
}
aml_write_crypto_reg(dd->status, 0xf);
#else
status = aml_dma_do_hw_crypto(dd->dma, dsc, 1, dd->dma_descript_tab,
1, DMA_FLAG_SM4_IN_USE);
aml_dma_debug(dsc, 1, "end sm4 keyiv", dd->thread, dd->status);
if (status & DMA_STATUS_KEY_ERROR) {
dev_err(dev, "hw crypto failed.\n");
err = -EINVAL;
}
#endif
dma_unmap_single(dd->parent, dma_addr_key,
DMA_KEY_IV_BUF_SIZE, DMA_TO_DEVICE);
kfree(key_iv);
return err;
}
static size_t aml_sm4_sg_copy(struct scatterlist **sg, size_t *offset,
void *buf, size_t buflen, size_t total, int out)
{
size_t count, off = 0;
while (buflen && total) {
count = min((*sg)->length - *offset, total);
count = min(count, buflen);
if (!count)
return off;
scatterwalk_map_and_copy(buf + off, *sg, *offset, count, out);
off += count;
buflen -= count;
*offset += count;
total -= count;
if (*offset == (*sg)->length) {
*sg = sg_next(*sg);
if (*sg)
*offset = 0;
else
total = 0;
}
}
return off;
}
static size_t aml_sm4_sg_dma(struct aml_sm4_dev *dd, struct dma_dsc *dsc,
size_t total)
{
struct device *dev = dd->dev;
u32 i = 0;
int err = 0;
struct scatterlist *in_sg = dd->in_sg;
struct scatterlist *out_sg = dd->out_sg;
u32 in_nents = 0, out_nents = 0;
struct dma_sg_dsc *sg_dsc = NULL;
in_nents = sg_nents(in_sg);
out_nents = sg_nents(out_sg);
if (dd->in_sg != dd->out_sg) {
err = dma_map_sg(dd->parent, dd->in_sg, in_nents, DMA_TO_DEVICE);
if (!err) {
dev_err(dev, "dma_map_sg() error\n");
return 0;
}
err = dma_map_sg(dd->parent, dd->out_sg, out_nents,
DMA_FROM_DEVICE);
if (!err) {
dev_err(dev, "dma_map_sg() error\n");
dma_unmap_sg(dd->parent, dd->in_sg, in_nents,
DMA_TO_DEVICE);
return 0;
}
} else {
err = dma_map_sg(dd->parent, dd->in_sg, in_nents,
DMA_BIDIRECTIONAL);
if (!err) {
dev_err(dev, "dma_map_sg() error\n");
return 0;
}
dma_sync_sg_for_device(dd->parent, dd->in_sg,
in_nents, DMA_TO_DEVICE);
}
#if DMA_IRQ_MODE
dd->sg_dsc_in = dma_alloc_coherent(dd->parent,
in_nents * sizeof(struct dma_sg_dsc),
&dd->dma_sg_dsc_in, GFP_ATOMIC | GFP_DMA);
if (!dd->sg_dsc_in) {
dev_err(dev, "dma_alloc_coherent() for input error\n");
return 0;
}
dd->sg_dsc_out = dma_alloc_coherent(dd->parent,
out_nents * sizeof(struct dma_sg_dsc),
&dd->dma_sg_dsc_out, GFP_ATOMIC | GFP_DMA);
if (!dd->dma_sg_dsc_out) {
dev_err(dev, "dma_alloc_coherent() for output error\n");
dma_free_coherent(dd->parent, in_nents * sizeof(struct dma_sg_dsc),
dd->sg_dsc_in, dd->dma_sg_dsc_in);
return 0;
}
#else
dd->sg_dsc_in = dma_alloc_coherent(dd->parent,
in_nents * sizeof(struct dma_sg_dsc),
&dd->dma_sg_dsc_in, GFP_KERNEL | GFP_DMA);
if (!dd->sg_dsc_in) {
dev_err(dev, "dma_alloc_coherent() for input error\n");
return 0;
}
dd->sg_dsc_out = dma_alloc_coherent(dd->parent,
out_nents * sizeof(struct dma_sg_dsc),
&dd->dma_sg_dsc_out, GFP_KERNEL | GFP_DMA);
if (!dd->dma_sg_dsc_out) {
dev_err(dev, "dma_alloc_coherent() for output error\n");
dma_free_coherent(dd->parent, in_nents * sizeof(struct dma_sg_dsc),
dd->sg_dsc_in, dd->dma_sg_dsc_in);
return 0;
}
#endif
sg_dsc = dd->sg_dsc_in;
in_sg = dd->in_sg;
for (i = 0; i < in_nents; i++) {
sg_dsc[i].dsc_cfg.d32 = 0;
sg_dsc[i].dsc_cfg.b.valid = 1;
sg_dsc[i].dsc_cfg.b.eoc = i == (in_nents - 1) ? 1 : 0;
sg_dsc[i].dsc_cfg.b.length = in_sg->length;
sg_dsc[i].addr = in_sg->dma_address;
in_sg = sg_next(in_sg);
}
WARN_ON(in_sg);
out_sg = dd->out_sg;
sg_dsc = dd->sg_dsc_out;
for (i = 0; i < out_nents; i++) {
sg_dsc[i].dsc_cfg.d32 = 0;
sg_dsc[i].dsc_cfg.b.valid = 1;
sg_dsc[i].dsc_cfg.b.eoc = i == (out_nents - 1) ? 1 : 0;
sg_dsc[i].dsc_cfg.b.length = out_sg->length;
sg_dsc[i].addr = out_sg->dma_address;
out_sg = sg_next(out_sg);
}
WARN_ON(out_sg);
aml_dma_link_debug(dd->sg_dsc_in, dd->dma_sg_dsc_in, in_nents, __func__);
aml_dma_link_debug(dd->sg_dsc_out, dd->dma_sg_dsc_out, in_nents, __func__);
dsc->src_addr = dd->dma_sg_dsc_in;
dsc->tgt_addr = dd->dma_sg_dsc_out;
dsc->dsc_cfg.d32 = 0;
dsc->dsc_cfg.b.length = total;
dsc->dsc_cfg.b.link_error = 1;
return total;
}
static struct aml_sm4_dev *aml_sm4_find_dev(struct aml_sm4_ctx *ctx)
{
struct aml_sm4_dev *sm4_dd = NULL;
struct aml_sm4_dev *tmp;
spin_lock_bh(&aml_sm4.lock);
if (!ctx->dd) {
list_for_each_entry(tmp, &aml_sm4.dev_list, list) {
sm4_dd = tmp;
break;
}
ctx->dd = sm4_dd;
} else {
sm4_dd = ctx->dd;
}
spin_unlock_bh(&aml_sm4.lock);
return sm4_dd;
}
static int aml_sm4_hw_init(struct aml_sm4_dev *dd)
{
if (!(dd->flags & SM4_FLAGS_INIT)) {
dd->flags |= SM4_FLAGS_INIT;
dd->err = 0;
}
return 0;
}
static void aml_sm4_finish_req(struct aml_sm4_dev *dd, s32 err)
{
#if DMA_IRQ_MODE
struct skcipher_request *req = dd->req;
#endif
unsigned long flags;
dd->flags &= ~SM4_FLAGS_BUSY;
spin_lock_irqsave(&dd->dma->dma_lock, flags);
dd->dma->dma_busy &= ~DMA_FLAG_MAY_OCCUPY;
spin_unlock_irqrestore(&dd->dma->dma_lock, flags);
#if DMA_IRQ_MODE
req->base.complete(&req->base, err);
#endif
}
static int aml_sm4_crypt_dma(struct aml_sm4_dev *dd, struct dma_dsc *dsc,
u32 nents)
{
u32 op_mode = OP_MODE_ECB;
u32 i = 0;
#if DMA_IRQ_MODE
unsigned long flags;
#else
int err = 0;
u8 status = 0;
#endif
if (dd->flags & SM4_FLAGS_CBC)
op_mode = OP_MODE_CBC;
else if (dd->flags & SM4_FLAGS_CTR)
op_mode = OP_MODE_CTR;
for (i = 0; i < nents; i++) {
dsc[i].dsc_cfg.b.enc_sha_only = dd->flags & SM4_FLAGS_ENCRYPT;
dsc[i].dsc_cfg.b.mode = MODE_SM4;
dsc[i].dsc_cfg.b.op_mode = op_mode;
dsc[i].dsc_cfg.b.eoc = (i == (nents - 1));
dsc[i].dsc_cfg.b.owner = 1;
}
aml_dma_debug(dsc, nents, __func__, dd->thread, dd->status);
/* Start DMA transfer */
#if DMA_IRQ_MODE
spin_lock_irqsave(&dd->dma->dma_lock, flags);
dd->dma->dma_busy |= DMA_FLAG_SM4_IN_USE;
spin_unlock_irqrestore(&dd->dma->dma_lock, flags);
dd->flags |= SM4_FLAGS_DMA;
aml_write_crypto_reg(dd->thread, dd->dma_descript_tab | 2);
return -EINPROGRESS;
#else
dd->flags |= SM4_FLAGS_DMA;
status = aml_dma_do_hw_crypto(dd->dma, dsc, nents, dd->dma_descript_tab,
1, DMA_FLAG_SM4_IN_USE);
if (status & DMA_STATUS_KEY_ERROR)
dd->flags |= SM4_FLAGS_ERROR;
aml_dma_debug(dsc, nents, "end sm4", dd->thread, dd->status);
err = aml_sm4_crypt_dma_stop(dd);
if (!err) {
err = dd->flags & SM4_FLAGS_ERROR;
dd->flags = (dd->flags & ~SM4_FLAGS_ERROR);
}
return err;
#endif
}
static int aml_sm4_crypt_dma_start(struct aml_sm4_dev *dd)
{
int err = 0;
size_t count = 0;
dma_addr_t addr_in, addr_out;
struct dma_dsc *dsc = dd->descriptor;
u32 nents;
/* slow dma */
/* use cache buffers */
count = aml_sm4_sg_copy(&dd->in_sg, &dd->in_offset,
dd->buf_in, dd->buflen, dd->total, 0);
addr_in = dd->dma_addr_in;
addr_out = dd->dma_addr_out;
dd->dma_size = count;
dma_sync_single_for_device(dd->parent, addr_in,
((dd->dma_size + SM4_BLOCK_SIZE - 1)
/ SM4_BLOCK_SIZE) * SM4_BLOCK_SIZE,
DMA_TO_DEVICE);
dsc->src_addr = (u32)addr_in;
dsc->tgt_addr = (u32)addr_out;
dsc->dsc_cfg.d32 = 0;
/* We align data to SM4_BLOCK_SIZE for old aml-dma devices */
dsc->dsc_cfg.b.length = ((count + SM4_BLOCK_SIZE - 1)
/ SM4_BLOCK_SIZE) * SM4_BLOCK_SIZE;
nents = 1;
dd->flags &= ~SM4_FLAGS_FAST;
dbgp(1, "use slow dma: cnt:%zd, len:%d\n",
count, dsc->dsc_cfg.b.length);
dd->total -= count;
err = aml_sm4_crypt_dma(dd, dsc, nents);
return err;
}
static int aml_sm4_crypt_dma_link_mode_start(struct aml_sm4_dev *dd)
{
int err = 0;
size_t count = 0;
struct dma_dsc *dsc = dd->descriptor;
count = aml_sm4_sg_dma(dd, dsc, dd->total);
dd->flags |= SM4_FLAGS_FAST;
dd->fast_total = count;
dd->total -= dd->fast_total;
/* install IV */
if ((dd->flags & SM4_FLAGS_CBC) && !(dd->flags & SM4_FLAGS_ENCRYPT))
scatterwalk_map_and_copy(dd->req->iv,
dd->in_sg,
dd->fast_total - 16,
16, 0);
/* using 1 entry in link mode */
err = aml_sm4_crypt_dma(dd, dsc, 1);
return err;
}
static int aml_sm4_write_ctrl(struct aml_sm4_dev *dd)
{
int err = 0;
u32 *iv = NULL;
u8 iv_swap = 0;
err = aml_sm4_hw_init(dd);
if (err)
return err;
if (dd->flags & SM4_FLAGS_CBC) {
iv = (u32 *)dd->req->iv;
} else if (dd->flags & SM4_FLAGS_CTR) {
iv = (u32 *)dd->req->iv;
iv_swap = dd->iv_swap;
}
if (dd->ctx->kte >= 0)
err = set_sm4_kl_key_iv(dd, dd->ctx->key, dd->ctx->keylen,
iv, iv_swap);
else
err = set_sm4_key_iv(dd, dd->ctx->key, dd->ctx->keylen,
iv, iv_swap);
return err;
}
static int aml_sm4_handle_queue(struct aml_sm4_dev *dd,
struct skcipher_request *req)
{
struct device *dev = dd->dev;
#if DMA_IRQ_MODE
struct crypto_async_request *async_req, *backlog;
#endif
struct aml_sm4_ctx *ctx;
struct aml_sm4_reqctx *rctx;
s32 err = 0;
#if DMA_IRQ_MODE
s32 ret = 0;
#endif
#if DMA_IRQ_MODE
unsigned long flags;
spin_lock_irqsave(&dd->dma->dma_lock, flags);
if (req)
ret = crypto_enqueue_request(&dd->queue, &req->base);
if ((dd->flags & SM4_FLAGS_BUSY) || dd->dma->dma_busy) {
spin_unlock_irqrestore(&dd->dma->dma_lock, flags);
return ret;
}
backlog = crypto_get_backlog(&dd->queue);
async_req = crypto_dequeue_request(&dd->queue);
if (async_req) {
dd->flags |= SM4_FLAGS_BUSY;
dd->dma->dma_busy |= DMA_FLAG_MAY_OCCUPY;
}
spin_unlock_irqrestore(&dd->dma->dma_lock, flags);
if (!async_req) {
pm_runtime_mark_last_busy(dd->parent);
pm_runtime_put_autosuspend(dd->parent);
return ret;
}
if (backlog)
backlog->complete(backlog, -EINPROGRESS);
req = skcipher_request_cast(async_req);
#endif
/* assign new request to device */
dd->req = req;
dd->total = req->cryptlen;
dd->in_offset = 0;
dd->in_sg = req->src;
dd->out_offset = 0;
dd->out_sg = req->dst;
rctx = skcipher_request_ctx(req);
ctx = crypto_skcipher_ctx(crypto_skcipher_reqtfm(req));
rctx->mode &= SM4_FLAGS_MODE_MASK;
dd->flags = (dd->flags & ~SM4_FLAGS_MODE_MASK) | rctx->mode;
dd->flags = (dd->flags & ~SM4_FLAGS_ERROR);
dd->ctx = ctx;
ctx->dd = dd;
err = aml_sm4_write_ctrl(dd);
if (!err) {
if (dd->total % AML_SM4_DMA_THRESHOLD == 0 ||
(dd->flags & SM4_FLAGS_CTR)) {
if (dd->link_mode && !disable_link_mode) {
err = aml_sm4_crypt_dma_link_mode_start(dd);
} else {
do {
err = aml_sm4_crypt_dma_start(dd);
} while (!err && dd->total);
}
} else {
dev_err(dev, "size %zd is not multiple of %d",
dd->total, AML_SM4_DMA_THRESHOLD);
err = -EINVAL;
}
}
if (err != -EINPROGRESS) {
/* sm4_task will not finish it, so do it here */
aml_sm4_finish_req(dd, err);
#if DMA_IRQ_MODE
tasklet_schedule(&dd->queue_task);
#endif
}
#if DMA_IRQ_MODE
return ret;
#else
if (err)
return -EAGAIN;
else
return 0;
#endif
}
int aml_sm4_process(struct skcipher_request *req)
{
struct aml_sm4_ctx *tctx = crypto_tfm_ctx(req->base.tfm);
struct aml_sm4_dev *dd = tctx->dd;
return aml_sm4_handle_queue(dd, req);
}
/* Increment 128-bit counter */
static void aml_sm4_ctr_update_iv(unsigned char *val, unsigned int value)
{
int i;
while (value > 0) {
for (i = 15; i >= 0; i--) {
val[i] = (val[i] + 1) & 0xff;
if (val[i])
break;
}
value--;
}
}
static int aml_sm4_crypt_dma_stop(struct aml_sm4_dev *dd)
{
struct device *dev = dd->dev;
int err = -EINVAL;
size_t count;
u32 in_nents = 0, out_nents = 0;
if (dd->flags & SM4_FLAGS_DMA) {
err = 0;
if (dd->flags & SM4_FLAGS_FAST) {
in_nents = sg_nents(dd->in_sg);
out_nents = sg_nents(dd->out_sg);
if (dd->in_sg != dd->out_sg) {
dma_unmap_sg(dd->parent, dd->in_sg, in_nents,
DMA_TO_DEVICE);
dma_unmap_sg(dd->parent, dd->out_sg, out_nents,
DMA_FROM_DEVICE);
} else {
dma_sync_sg_for_cpu(dd->parent, dd->in_sg, in_nents,
DMA_FROM_DEVICE);
dma_unmap_sg(dd->parent, dd->in_sg, in_nents,
DMA_BIDIRECTIONAL);
}
aml_dma_link_debug(dd->sg_dsc_in, dd->dma_sg_dsc_in, in_nents, __func__);
aml_dma_link_debug(dd->sg_dsc_out, dd->dma_sg_dsc_out, in_nents, __func__);
dma_free_coherent(dd->parent,
in_nents * sizeof(struct dma_sg_dsc),
dd->sg_dsc_in, dd->dma_sg_dsc_in);
dma_free_coherent(dd->parent,
out_nents * sizeof(struct dma_sg_dsc),
dd->sg_dsc_out, dd->dma_sg_dsc_out);
/* install IV */
if (dd->flags & SM4_FLAGS_CBC) {
u32 length = dd->fast_total - SM4_BLOCK_SIZE;
if (dd->flags & SM4_FLAGS_ENCRYPT) {
scatterwalk_map_and_copy(dd->req->iv,
dd->out_sg,
length,
SM4_BLOCK_SIZE,
0);
}
} else if (dd->flags & SM4_FLAGS_CTR) {
u32 dma_nblock =
(dd->fast_total + SM4_BLOCK_SIZE - 1)
/ SM4_BLOCK_SIZE;
aml_sm4_ctr_update_iv(dd->req->iv,
dma_nblock);
}
} else {
dma_sync_single_for_cpu(dd->parent,
dd->dma_addr_out,
((dd->dma_size +
SM4_BLOCK_SIZE - 1)
/ SM4_BLOCK_SIZE) *
SM4_BLOCK_SIZE,
DMA_FROM_DEVICE);
/* copy data */
count = aml_sm4_sg_copy(&dd->out_sg, &dd->out_offset,
dd->buf_out, dd->buflen,
dd->dma_size, 1);
if (count != dd->dma_size) {
err = -EINVAL;
dev_err(dev, "not all data converted: %zu\n",
count);
}
/* install IV */
if (dd->flags & SM4_FLAGS_CBC) {
if (dd->flags & SM4_FLAGS_ENCRYPT) {
memcpy(dd->req->iv, dd->buf_out +
dd->dma_size - SM4_BLOCK_SIZE,
SM4_BLOCK_SIZE);
} else {
memcpy(dd->req->iv, dd->buf_in +
dd->dma_size - SM4_BLOCK_SIZE,
SM4_BLOCK_SIZE);
}
} else if (dd->flags & SM4_FLAGS_CTR) {
u32 dma_nblock =
(dd->dma_size + SM4_BLOCK_SIZE - 1)
/ SM4_BLOCK_SIZE;
aml_sm4_ctr_update_iv(dd->req->iv,
dma_nblock);
}
}
dd->flags &= ~SM4_FLAGS_DMA;
}
return err;
}
static int aml_sm4_buff_init(struct aml_sm4_dev *dd)
{
struct device *dev = dd->dev;
int err = -ENOMEM;
dd->buf_in = (void *)__get_free_pages(GFP_KERNEL, 0);
dd->buf_out = (void *)__get_free_pages(GFP_KERNEL, 0);
dd->buflen = PAGE_SIZE;
dd->buflen &= ~(SM4_BLOCK_SIZE - 1);
if (!dd->buf_in || !dd->buf_out) {
dev_err(dev, "unable to alloc pages.\n");
goto err_alloc;
}
dd->descriptor =
dmam_alloc_coherent(dd->parent,
MAX_NUM_TABLES * sizeof(struct dma_dsc),
&dd->dma_descript_tab, GFP_KERNEL | GFP_DMA);
if (!dd->descriptor) {
dev_err(dev, "dma descriptor error\n");
err = -EINVAL;
goto err_map_in;
}
/* MAP here */
dd->dma_addr_in = dma_map_single(dd->parent, dd->buf_in,
dd->buflen, DMA_TO_DEVICE);
if (dma_mapping_error(dd->parent, dd->dma_addr_in)) {
dev_err(dev, "dma %zd bytes error\n", dd->buflen);
err = -EINVAL;
goto err_map_in;
}
dd->dma_addr_out = dma_map_single(dd->parent, dd->buf_out,
dd->buflen, DMA_FROM_DEVICE);
if (dma_mapping_error(dd->parent, dd->dma_addr_out)) {
dev_err(dev, "dma %zd bytes error\n", dd->buflen);
err = -EINVAL;
goto err_map_out;
}
return 0;
err_map_out:
dma_unmap_single(dd->parent, dd->dma_addr_in, dd->buflen,
DMA_TO_DEVICE);
err_map_in:
free_page((uintptr_t)dd->buf_out);
free_page((uintptr_t)dd->buf_in);
err_alloc:
if (err)
dev_err(dev, "error: %d\n", err);
return err;
}
static void aml_sm4_buff_cleanup(struct aml_sm4_dev *dd)
{
dma_unmap_single(dd->parent, dd->dma_addr_out, dd->buflen,
DMA_FROM_DEVICE);
dma_unmap_single(dd->parent, dd->dma_addr_in, dd->buflen,
DMA_TO_DEVICE);
dmam_free_coherent(dd->parent, MAX_NUM_TABLES * sizeof(struct dma_dsc),
dd->descriptor, dd->dma_descript_tab);
free_page((uintptr_t)dd->buf_out);
free_page((uintptr_t)dd->buf_in);
}
static int aml_sm4_crypt(struct skcipher_request *req, unsigned long mode)
{
struct aml_sm4_ctx *ctx =
crypto_skcipher_ctx(crypto_skcipher_reqtfm(req));
struct aml_sm4_reqctx *rctx = skcipher_request_ctx(req);
struct aml_sm4_dev *dd;
int ret;
if (!IS_ALIGNED(req->cryptlen, SM4_BLOCK_SIZE) &&
!(mode & SM4_FLAGS_CTR)) {
pr_err("request size is not exact amount of SM4 blocks\n");
return -EINVAL;
}
ctx->block_size = SM4_BLOCK_SIZE;
dd = aml_sm4_find_dev(ctx);
if (!dd)
return -ENODEV;
rctx->mode = mode;
if (pm_runtime_suspended(dd->parent)) {
ret = pm_runtime_get_sync(dd->parent);
if (ret < 0) {
dev_err(dd->parent, "%s: pm_runtime_get_sync fails: %d\n",
__func__, ret);
return ret;
}
}
#if DMA_IRQ_MODE
return aml_sm4_handle_queue(dd, req);
#else
return aml_dma_crypto_enqueue_req(dd->dma, &req->base);
#endif
}
static int aml_sm4_kl_setkey(struct crypto_skcipher *tfm, const u8 *key,
unsigned int keylen)
{
struct aml_sm4_ctx *ctx = crypto_skcipher_ctx(tfm);
int ret = 0;
/* key[0:3] = kte */
ctx->kte = *(uint32_t *)&key[0];
if (keylen != SM4_KEY_SIZE) {
//crypto_skcipher_set_flags(tfm, CRYPTO_TFM_RES_BAD_KEY_LEN);
pr_err("aml-sm4-lite:invalid keysize: %d\n", keylen);
return -EINVAL;
}
ctx->keylen = keylen;
return ret;
}
static int aml_sm4_ecb_encrypt(struct skcipher_request *req)
{
return aml_sm4_crypt(req,
SM4_FLAGS_ENCRYPT);
}
static int aml_sm4_ecb_decrypt(struct skcipher_request *req)
{
return aml_sm4_crypt(req,
0);
}
static int aml_sm4_cbc_encrypt(struct skcipher_request *req)
{
return aml_sm4_crypt(req,
SM4_FLAGS_ENCRYPT | SM4_FLAGS_CBC);
}
static int aml_sm4_cbc_decrypt(struct skcipher_request *req)
{
return aml_sm4_crypt(req,
SM4_FLAGS_CBC);
}
static int aml_sm4_ctr_encrypt(struct skcipher_request *req)
{
return aml_sm4_crypt(req,
SM4_FLAGS_ENCRYPT | SM4_FLAGS_CTR);
}
static int aml_sm4_ctr_decrypt(struct skcipher_request *req)
{
/* XXX: use encrypt to replace for decrypt */
return aml_sm4_crypt(req,
SM4_FLAGS_ENCRYPT | SM4_FLAGS_CTR);
}
static int aml_sm4_cra_init(struct crypto_skcipher *tfm)
{
struct aml_sm4_ctx *ctx = crypto_skcipher_ctx(tfm);
crypto_skcipher_set_reqsize(tfm, sizeof(struct aml_sm4_reqctx));
ctx->fallback = NULL;
return 0;
}
static void aml_sm4_cra_exit(struct crypto_skcipher *tfm)
{
}
static int aml_sm4_setkey(struct crypto_skcipher *tfm, const u8 *key,
unsigned int keylen)
{
struct aml_sm4_ctx *ctx = crypto_skcipher_ctx(tfm);
if (keylen != SM4_KEY_SIZE) {
//crypto_skcipher_set_flags(tfm, CRYPTO_TFM_RES_BAD_KEY_LEN);
pr_err("aml-sm4:invalid keysize: %d\n", keylen);
return -EINVAL;
}
memcpy(ctx->key, key, keylen);
ctx->keylen = keylen;
ctx->kte = -1;
return 0;
}
static struct skcipher_alg sm4_algs[] = {
{
.base.cra_name = "ecb(sm4-aml)",
.base.cra_driver_name = "ecb-sm4-aml",
.base.cra_priority = 100,
.base.cra_flags = CRYPTO_ALG_ASYNC,
.base.cra_blocksize = SM4_BLOCK_SIZE,
.base.cra_ctxsize = sizeof(struct aml_sm4_ctx),
.base.cra_alignmask = 0xf,
.base.cra_module = THIS_MODULE,
.init = aml_sm4_cra_init,
.exit = aml_sm4_cra_exit,
.min_keysize = SM4_KEY_SIZE,
.max_keysize = SM4_KEY_SIZE,
.ivsize = SM4_BLOCK_SIZE,
.setkey = aml_sm4_setkey,
.encrypt = aml_sm4_ecb_encrypt,
.decrypt = aml_sm4_ecb_decrypt,
},
{
.base.cra_name = "cbc(sm4-aml)",
.base.cra_driver_name = "cbc-sm4-aml",
.base.cra_priority = 100,
.base.cra_flags = CRYPTO_ALG_ASYNC,
.base.cra_blocksize = SM4_BLOCK_SIZE,
.base.cra_ctxsize = sizeof(struct aml_sm4_ctx),
.base.cra_alignmask = 0xf,
.base.cra_module = THIS_MODULE,
.init = aml_sm4_cra_init,
.exit = aml_sm4_cra_exit,
.min_keysize = SM4_KEY_SIZE,
.max_keysize = SM4_KEY_SIZE,
.ivsize = SM4_BLOCK_SIZE,
.setkey = aml_sm4_setkey,
.encrypt = aml_sm4_cbc_encrypt,
.decrypt = aml_sm4_cbc_decrypt,
},
{
.base.cra_name = "ctr(sm4-aml)",
.base.cra_driver_name = "ctr-sm4-aml",
.base.cra_priority = 100,
.base.cra_flags = CRYPTO_ALG_ASYNC,
.base.cra_blocksize = SM4_BLOCK_SIZE,
.base.cra_ctxsize = sizeof(struct aml_sm4_ctx),
.base.cra_alignmask = 0xf,
.base.cra_module = THIS_MODULE,
.init = aml_sm4_cra_init,
.exit = aml_sm4_cra_exit,
.min_keysize = SM4_KEY_SIZE,
.max_keysize = SM4_KEY_SIZE,
.ivsize = SM4_BLOCK_SIZE,
.setkey = aml_sm4_setkey,
.encrypt = aml_sm4_ctr_encrypt,
.decrypt = aml_sm4_ctr_decrypt,
},
{
.base.cra_name = "ecb(sm4-kl-aml)",
.base.cra_driver_name = "ecb-sm4-kl-aml",
.base.cra_priority = 100,
.base.cra_flags = CRYPTO_ALG_ASYNC,
.base.cra_blocksize = SM4_BLOCK_SIZE,
.base.cra_ctxsize = sizeof(struct aml_sm4_ctx),
.base.cra_alignmask = 0xf,
.base.cra_module = THIS_MODULE,
.init = aml_sm4_cra_init,
.exit = aml_sm4_cra_exit,
.min_keysize = SM4_KEY_SIZE,
.max_keysize = SM4_KEY_SIZE,
.setkey = aml_sm4_kl_setkey,
.encrypt = aml_sm4_ecb_encrypt,
.decrypt = aml_sm4_ecb_decrypt,
},
{
.base.cra_name = "cbc(sm4-kl-aml)",
.base.cra_driver_name = "cbc-sm4-kl-aml",
.base.cra_priority = 100,
.base.cra_flags = CRYPTO_ALG_ASYNC,
.base.cra_blocksize = SM4_BLOCK_SIZE,
.base.cra_ctxsize = sizeof(struct aml_sm4_ctx),
.base.cra_alignmask = 0xf,
.base.cra_module = THIS_MODULE,
.init = aml_sm4_cra_init,
.exit = aml_sm4_cra_exit,
.min_keysize = SM4_KEY_SIZE,
.max_keysize = SM4_KEY_SIZE,
.ivsize = SM4_BLOCK_SIZE,
.setkey = aml_sm4_kl_setkey,
.encrypt = aml_sm4_cbc_encrypt,
.decrypt = aml_sm4_cbc_decrypt,
},
{
.base.cra_name = "ctr(sm4-kl-aml)",
.base.cra_driver_name = "ctr-sm4-kl-aml",
.base.cra_priority = 100,
.base.cra_flags = CRYPTO_ALG_ASYNC,
.base.cra_blocksize = SM4_BLOCK_SIZE,
.base.cra_ctxsize = sizeof(struct aml_sm4_ctx),
.base.cra_alignmask = 0xf,
.base.cra_module = THIS_MODULE,
.init = aml_sm4_cra_init,
.exit = aml_sm4_cra_exit,
.min_keysize = SM4_KEY_SIZE,
.max_keysize = SM4_KEY_SIZE,
.ivsize = SM4_BLOCK_SIZE,
.setkey = aml_sm4_kl_setkey,
.encrypt = aml_sm4_ctr_encrypt,
.decrypt = aml_sm4_ctr_decrypt,
}
};
struct aml_sm4_info aml_sm4_data = {
.algs = sm4_algs,
.num_algs = ARRAY_SIZE(sm4_algs),
};
#ifdef CONFIG_OF
static const struct of_device_id aml_sm4_dt_match[] = {
{ .compatible = "amlogic,sm4_dma",
.data = &aml_sm4_data,
},
{},
};
#else
#define aml_sm4_dt_match NULL
#endif
#if DMA_IRQ_MODE
static void aml_sm4_queue_task(unsigned long data)
{
struct aml_sm4_dev *dd = (struct aml_sm4_dev *)data;
aml_sm4_handle_queue(dd, NULL);
}
static void aml_sm4_done_task(unsigned long data)
{
struct aml_sm4_dev *dd = (struct aml_sm4_dev *)data;
int err;
err = aml_sm4_crypt_dma_stop(dd);
if (!err) {
err = dd->flags & SM4_FLAGS_ERROR;
dd->flags = (dd->flags & ~SM4_FLAGS_ERROR);
}
aml_dma_debug(dd->descriptor, 1, __func__, dd->thread, dd->status);
err = dd->err ? dd->err : err;
if (dd->total && !err) {
if (!err)
err = aml_sm4_crypt_dma_start(dd);
if (err == -EINPROGRESS)
return; /* DMA started. Not finishing. */
}
if (dd->ctx->kte < 0)
err = set_sm4_key_iv(dd, NULL, 0, NULL, 0);
aml_sm4_finish_req(dd, err);
aml_sm4_handle_queue(dd, NULL);
}
static irqreturn_t aml_sm4_irq(int irq, void *dev_id)
{
struct aml_sm4_dev *sm4_dd = dev_id;
struct device *dev = sm4_dd->dev;
u8 status = aml_read_crypto_reg(sm4_dd->status);
if (status) {
if (status == 0x1)
dev_err(dev, "irq overwrite\n");
if (sm4_dd->dma->dma_busy == DMA_FLAG_MAY_OCCUPY)
return IRQ_HANDLED;
if ((sm4_dd->flags & SM4_FLAGS_DMA) &&
(sm4_dd->dma->dma_busy & DMA_FLAG_SM4_IN_USE)) {
if (status & DMA_STATUS_KEY_ERROR)
sm4_dd->flags |= SM4_FLAGS_ERROR;
aml_write_crypto_reg(sm4_dd->status, 0xf);
sm4_dd->dma->dma_busy &= ~DMA_FLAG_SM4_IN_USE;
tasklet_schedule(&sm4_dd->done_task);
return IRQ_HANDLED;
} else {
return IRQ_NONE;
}
}
return IRQ_NONE;
}
#endif
static void aml_sm4_unregister_algs(struct aml_sm4_dev *dd,
const struct aml_sm4_info *sm4_info)
{
int i;
for (i = 0; i < sm4_info->num_algs; i++)
crypto_unregister_skcipher(&sm4_info->algs[i]);
}
static int aml_sm4_register_algs(struct aml_sm4_dev *dd,
const struct aml_sm4_info *sm4_info)
{
int err, i, j;
for (i = 0; i < sm4_info->num_algs; i++) {
err = crypto_register_skcipher(&sm4_info->algs[i]);
if (err)
goto err_sm4_algs;
}
return 0;
err_sm4_algs:
for (j = 0; j < i; j++)
crypto_unregister_skcipher(&sm4_info->algs[j]);
return err;
}
static int aml_sm4_probe(struct platform_device *pdev)
{
struct aml_sm4_dev *sm4_dd;
struct device *dev = &pdev->dev;
const struct of_device_id *match;
int err = -EPERM;
const struct aml_sm4_info *sm4_info = NULL;
/* Set default iv_swap to 1 for backward compatible.
* It can be modified by specifying iv_swap in dts.
*/
u8 iv_swap = 1;
sm4_dd = devm_kzalloc(dev, sizeof(struct aml_sm4_dev), GFP_KERNEL);
if (!sm4_dd) {
err = -ENOMEM;
goto sm4_dd_err;
}
match = of_match_device(aml_sm4_dt_match, &pdev->dev);
if (!match) {
dev_err(dev, "%s: cannot find match dt\n", __func__);
err = -EINVAL;
goto sm4_dd_err;
}
of_property_read_u8(pdev->dev.of_node, "iv_swap", &iv_swap);
sm4_info = match->data;
sm4_dd->dev = dev;
sm4_dd->parent = dev->parent;
sm4_dd->dma = dev_get_drvdata(dev->parent);
sm4_dd->thread = sm4_dd->dma->thread;
sm4_dd->status = sm4_dd->dma->status;
sm4_dd->link_mode = sm4_dd->dma->link_mode;
sm4_dd->irq = sm4_dd->dma->irq;
sm4_dd->iv_swap = iv_swap;
platform_set_drvdata(pdev, sm4_dd);
INIT_LIST_HEAD(&sm4_dd->list);
#if DMA_IRQ_MODE
tasklet_init(&sm4_dd->done_task, aml_sm4_done_task,
(unsigned long)sm4_dd);
tasklet_init(&sm4_dd->queue_task, aml_sm4_queue_task,
(unsigned long)sm4_dd);
crypto_init_queue(&sm4_dd->queue, AML_SM4_QUEUE_LENGTH);
err = devm_request_irq(dev, sm4_dd->irq, aml_sm4_irq, IRQF_SHARED,
"aml-sm4", sm4_dd);
if (err) {
dev_err(dev, "unable to request sm4 irq.\n");
goto sm4_irq_err;
}
#endif
pm_runtime_use_autosuspend(dev);
pm_runtime_set_autosuspend_delay(dev, DEFAULT_AUTOSUSPEND_DELAY);
pm_runtime_enable(dev);
err = pm_runtime_get_sync(dev);
if (err < 0) {
dev_err(dev, "%s: pm_runtime_get_sync fails: %d\n",
__func__, err);
goto err_sm4_pm;
}
err = aml_sm4_hw_init(sm4_dd);
if (err)
goto err_sm4_buff;
err = aml_sm4_buff_init(sm4_dd);
if (err)
goto err_sm4_buff;
spin_lock(&aml_sm4.lock);
list_add_tail(&sm4_dd->list, &aml_sm4.dev_list);
spin_unlock(&aml_sm4.lock);
err = aml_sm4_register_algs(sm4_dd, sm4_info);
if (err)
goto err_algs;
dev_info(dev, "Aml SM4_dma\n");
pm_runtime_put_sync_autosuspend(dev);
return 0;
err_algs:
spin_lock(&aml_sm4.lock);
list_del(&sm4_dd->list);
spin_unlock(&aml_sm4.lock);
aml_sm4_buff_cleanup(sm4_dd);
err_sm4_buff:
err_sm4_pm:
pm_runtime_disable(dev);
#if DMA_IRQ_MODE
sm4_irq_err:
tasklet_kill(&sm4_dd->done_task);
tasklet_kill(&sm4_dd->queue_task);
#endif
sm4_dd_err:
dev_err(dev, "initialization failed.\n");
return err;
}
static int aml_sm4_remove(struct platform_device *pdev)
{
struct device *dev = &pdev->dev;
static struct aml_sm4_dev *sm4_dd;
const struct of_device_id *match;
const struct aml_sm4_info *sm4_info = NULL;
sm4_dd = platform_get_drvdata(pdev);
if (!sm4_dd)
return -ENODEV;
match = of_match_device(aml_sm4_dt_match, &pdev->dev);
if (!match) {
dev_err(dev, "%s: cannot find match dt\n", __func__);
return -EINVAL;
}
sm4_info = match->data;
spin_lock(&aml_sm4.lock);
list_del(&sm4_dd->list);
spin_unlock(&aml_sm4.lock);
aml_sm4_buff_cleanup(sm4_dd);
aml_sm4_unregister_algs(sm4_dd, sm4_info);
#if DMA_IRQ_MODE
tasklet_kill(&sm4_dd->done_task);
tasklet_kill(&sm4_dd->queue_task);
#endif
pm_runtime_disable(sm4_dd->parent);
return 0;
}
static struct platform_driver aml_sm4_driver = {
.probe = aml_sm4_probe,
.remove = aml_sm4_remove,
.driver = {
.name = "aml_sm4_dma",
.owner = THIS_MODULE,
.of_match_table = aml_sm4_dt_match,
},
};
int __init aml_sm4_driver_init(void)
{
return platform_driver_register(&aml_sm4_driver);
}
void aml_sm4_driver_exit(void)
{
platform_driver_unregister(&aml_sm4_driver);
}