xref: /OK3568_Linux_fs/kernel/drivers/crypto/allwinner/sun8i-ss/sun8i-ss-prng.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
/*
 * sun8i-ss-prng.c - hardware cryptographic offloader for
 * Allwinner A80/A83T SoC
 *
 * Copyright (C) 2015-2020 Corentin Labbe <clabbe@baylibre.com>
 *
 * This file handles the PRNG found in the SS
 *
 * You can find a link to the datasheet in Documentation/arm/sunxi.rst
 */
12*4882a593Smuzhiyun #include "sun8i-ss.h"
13*4882a593Smuzhiyun #include <linux/dma-mapping.h>
14*4882a593Smuzhiyun #include <linux/pm_runtime.h>
15*4882a593Smuzhiyun #include <crypto/internal/rng.h>
16*4882a593Smuzhiyun 
sun8i_ss_prng_seed(struct crypto_rng * tfm,const u8 * seed,unsigned int slen)17*4882a593Smuzhiyun int sun8i_ss_prng_seed(struct crypto_rng *tfm, const u8 *seed,
18*4882a593Smuzhiyun 		       unsigned int slen)
19*4882a593Smuzhiyun {
20*4882a593Smuzhiyun 	struct sun8i_ss_rng_tfm_ctx *ctx = crypto_rng_ctx(tfm);
21*4882a593Smuzhiyun 
22*4882a593Smuzhiyun 	if (ctx->seed && ctx->slen != slen) {
23*4882a593Smuzhiyun 		memzero_explicit(ctx->seed, ctx->slen);
24*4882a593Smuzhiyun 		kfree(ctx->seed);
25*4882a593Smuzhiyun 		ctx->slen = 0;
26*4882a593Smuzhiyun 		ctx->seed = NULL;
27*4882a593Smuzhiyun 	}
28*4882a593Smuzhiyun 	if (!ctx->seed)
29*4882a593Smuzhiyun 		ctx->seed = kmalloc(slen, GFP_KERNEL | GFP_DMA);
30*4882a593Smuzhiyun 	if (!ctx->seed)
31*4882a593Smuzhiyun 		return -ENOMEM;
32*4882a593Smuzhiyun 
33*4882a593Smuzhiyun 	memcpy(ctx->seed, seed, slen);
34*4882a593Smuzhiyun 	ctx->slen = slen;
35*4882a593Smuzhiyun 
36*4882a593Smuzhiyun 	return 0;
37*4882a593Smuzhiyun }
38*4882a593Smuzhiyun 
sun8i_ss_prng_init(struct crypto_tfm * tfm)39*4882a593Smuzhiyun int sun8i_ss_prng_init(struct crypto_tfm *tfm)
40*4882a593Smuzhiyun {
41*4882a593Smuzhiyun 	struct sun8i_ss_rng_tfm_ctx *ctx = crypto_tfm_ctx(tfm);
42*4882a593Smuzhiyun 
43*4882a593Smuzhiyun 	memset(ctx, 0, sizeof(struct sun8i_ss_rng_tfm_ctx));
44*4882a593Smuzhiyun 	return 0;
45*4882a593Smuzhiyun }
46*4882a593Smuzhiyun 
sun8i_ss_prng_exit(struct crypto_tfm * tfm)47*4882a593Smuzhiyun void sun8i_ss_prng_exit(struct crypto_tfm *tfm)
48*4882a593Smuzhiyun {
49*4882a593Smuzhiyun 	struct sun8i_ss_rng_tfm_ctx *ctx = crypto_tfm_ctx(tfm);
50*4882a593Smuzhiyun 
51*4882a593Smuzhiyun 	memzero_explicit(ctx->seed, ctx->slen);
52*4882a593Smuzhiyun 	kfree(ctx->seed);
53*4882a593Smuzhiyun 	ctx->seed = NULL;
54*4882a593Smuzhiyun 	ctx->slen = 0;
55*4882a593Smuzhiyun }
56*4882a593Smuzhiyun 
/*
 * sun8i_ss_prng_generate() - produce pseudo-random bytes with the SS PRNG
 * @tfm:  RNG transform; its context must hold a seed
 * @src:  additional input, not used by this implementation
 * @slen: length of @src, not used by this implementation
 * @dst:  buffer receiving the random bytes
 * @dlen: number of bytes to write to @dst
 *
 * A bounce buffer large enough for @dlen bytes plus a replacement seed is
 * filled by the hardware. The first @dlen bytes go to @dst, the bytes that
 * follow refresh the seed stored in the context.
 *
 * Return: 0 on success, -EINVAL if the PRNG is not seeded or @dlen is too
 * large, -ENOMEM if the bounce buffer cannot be allocated, -EFAULT on DMA
 * mapping failure or when the flow reports no completion, or the negative
 * error returned by pm_runtime_get_sync().
 */
int sun8i_ss_prng_generate(struct crypto_rng *tfm, const u8 *src,
			   unsigned int slen, u8 *dst, unsigned int dlen)
{
	struct sun8i_ss_rng_tfm_ctx *ctx = crypto_rng_ctx(tfm);
	struct rng_alg *alg = crypto_rng_alg(tfm);
	struct sun8i_ss_alg_template *algt;
	struct sun8i_ss_dev *ss;
	dma_addr_t dma_iv, dma_dst;
	unsigned int todo;
	unsigned int nseed;
	int err = 0;
	int flow;
	void *d;
	u32 v;

	algt = container_of(alg, struct sun8i_ss_alg_template, alg.rng);
	ss = algt->ss;

	if (ctx->slen == 0) {
		dev_err(ss->dev, "The PRNG is not seeded\n");
		return -EINVAL;
	}

	/* The SS does not give an updated seed, so we need to get a new one.
	 * So we will ask for an extra PRNG_SEED_SIZE data.
	 * We want dlen + seedsize rounded up to a multiple of PRNG_DATA_SIZE
	 */
	todo = dlen + PRNG_SEED_SIZE + PRNG_DATA_SIZE;
	/* The sum wrapped around: the buffer would be smaller than dlen */
	if (todo < dlen)
		return -EINVAL;
	todo -= todo % PRNG_DATA_SIZE;

	d = kzalloc(todo, GFP_KERNEL | GFP_DMA);
	if (!d)
		return -ENOMEM;

	flow = sun8i_ss_get_engine_number(ss);

#ifdef CONFIG_CRYPTO_DEV_SUN8I_SS_DEBUG
	algt->stat_req++;
	algt->stat_bytes += todo;
#endif

	v = SS_ALG_PRNG | SS_PRNG_CONTINUE | SS_START;
	if (flow)
		v |= SS_FLOW1;
	else
		v |= SS_FLOW0;

	dma_iv = dma_map_single(ss->dev, ctx->seed, ctx->slen, DMA_TO_DEVICE);
	if (dma_mapping_error(ss->dev, dma_iv)) {
		dev_err(ss->dev, "Cannot DMA MAP IV\n");
		err = -EFAULT;
		goto err_free;
	}

	dma_dst = dma_map_single(ss->dev, d, todo, DMA_FROM_DEVICE);
	if (dma_mapping_error(ss->dev, dma_dst)) {
		dev_err(ss->dev, "Cannot DMA MAP DST\n");
		err = -EFAULT;
		goto err_iv;
	}

	err = pm_runtime_get_sync(ss->dev);
	if (err < 0) {
		/* Drop the usage count taken by the failed get */
		pm_runtime_put_noidle(ss->dev);
		goto err_pm;
	}
	/* pm_runtime_get_sync() may return a positive value on success */
	err = 0;

	mutex_lock(&ss->mlock);
	writel(dma_iv, ss->base + SS_IV_ADR_REG);
	/* the PRNG acts badly (failing rngtest) without SS_KEY_ADR_REG set */
	writel(dma_iv, ss->base + SS_KEY_ADR_REG);
	writel(dma_dst, ss->base + SS_DST_ADR_REG);
	/* NOTE(review): presumably a length in 32-bit words - confirm */
	writel(todo / 4, ss->base + SS_LEN_ADR_REG);

	reinit_completion(&ss->flows[flow].complete);
	ss->flows[flow].status = 0;
	/* Be sure all data is written before enabling the task */
	wmb();

	writel(v, ss->base + SS_CTL_REG);

	/* The timeout is one millisecond per requested byte.
	 * NOTE(review): the return value of the wait is not examined; any
	 * wake-up that leaves status at 0 (timeout or, presumably, a signal)
	 * is reported below as a DMA timeout.
	 */
	wait_for_completion_interruptible_timeout(&ss->flows[flow].complete,
						  msecs_to_jiffies(todo));
	if (ss->flows[flow].status == 0) {
		dev_err(ss->dev, "DMA timeout for PRNG (size=%u)\n", todo);
		err = -EFAULT;
	}
	/* Since cipher and hash use the linux/cryptoengine and we have
	 * a cryptoengine per flow, we are sure that they will issue only one
	 * request per flow.
	 * Since the cryptoengine waits for completion before submitting a new
	 * one, the mlock could be released just after the final writel.
	 * But cryptoengine cannot handle crypto_rng, so we need to be sure
	 * nothing will use our flow.
	 * The easiest way is to hold mlock until the hardware ends our request.
	 * We could have used a per flow lock, but this would increase
	 * complexity.
	 * The drawback is that no request can be handled for the other flow.
	 */
	mutex_unlock(&ss->mlock);

	pm_runtime_put(ss->dev);

err_pm:
	dma_unmap_single(ss->dev, dma_dst, todo, DMA_FROM_DEVICE);
err_iv:
	dma_unmap_single(ss->dev, dma_iv, ctx->slen, DMA_TO_DEVICE);

	if (!err) {
		memcpy(dst, d, dlen);
		/* Update seed.
		 * Only todo - dlen bytes follow the caller's data in d, so
		 * never copy more than that even when the stored seed is
		 * longer.
		 */
		nseed = todo - dlen;
		if (nseed > ctx->slen)
			nseed = ctx->slen;
		memcpy(ctx->seed, d + dlen, nseed);
	}
	/* Do not leave random output or seed material behind in freed memory */
	memzero_explicit(d, todo);
err_free:
	kfree(d);

	return err;
}
176