// SPDX-License-Identifier: GPL-2.0
/*
 * sun8i-ss-prng.c - hardware cryptographic offloader for
 * Allwinner A80/A83T SoC
 *
 * Copyright (C) 2015-2020 Corentin Labbe <clabbe@baylibre.com>
 *
 * This file handles the PRNG found in the SS
 *
 * You can find a link to the datasheet in Documentation/arm/sunxi.rst
 */
12*4882a593Smuzhiyun #include "sun8i-ss.h"
13*4882a593Smuzhiyun #include <linux/dma-mapping.h>
14*4882a593Smuzhiyun #include <linux/pm_runtime.h>
15*4882a593Smuzhiyun #include <crypto/internal/rng.h>
16*4882a593Smuzhiyun
sun8i_ss_prng_seed(struct crypto_rng * tfm,const u8 * seed,unsigned int slen)17*4882a593Smuzhiyun int sun8i_ss_prng_seed(struct crypto_rng *tfm, const u8 *seed,
18*4882a593Smuzhiyun unsigned int slen)
19*4882a593Smuzhiyun {
20*4882a593Smuzhiyun struct sun8i_ss_rng_tfm_ctx *ctx = crypto_rng_ctx(tfm);
21*4882a593Smuzhiyun
22*4882a593Smuzhiyun if (ctx->seed && ctx->slen != slen) {
23*4882a593Smuzhiyun memzero_explicit(ctx->seed, ctx->slen);
24*4882a593Smuzhiyun kfree(ctx->seed);
25*4882a593Smuzhiyun ctx->slen = 0;
26*4882a593Smuzhiyun ctx->seed = NULL;
27*4882a593Smuzhiyun }
28*4882a593Smuzhiyun if (!ctx->seed)
29*4882a593Smuzhiyun ctx->seed = kmalloc(slen, GFP_KERNEL | GFP_DMA);
30*4882a593Smuzhiyun if (!ctx->seed)
31*4882a593Smuzhiyun return -ENOMEM;
32*4882a593Smuzhiyun
33*4882a593Smuzhiyun memcpy(ctx->seed, seed, slen);
34*4882a593Smuzhiyun ctx->slen = slen;
35*4882a593Smuzhiyun
36*4882a593Smuzhiyun return 0;
37*4882a593Smuzhiyun }
38*4882a593Smuzhiyun
sun8i_ss_prng_init(struct crypto_tfm * tfm)39*4882a593Smuzhiyun int sun8i_ss_prng_init(struct crypto_tfm *tfm)
40*4882a593Smuzhiyun {
41*4882a593Smuzhiyun struct sun8i_ss_rng_tfm_ctx *ctx = crypto_tfm_ctx(tfm);
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun memset(ctx, 0, sizeof(struct sun8i_ss_rng_tfm_ctx));
44*4882a593Smuzhiyun return 0;
45*4882a593Smuzhiyun }
46*4882a593Smuzhiyun
sun8i_ss_prng_exit(struct crypto_tfm * tfm)47*4882a593Smuzhiyun void sun8i_ss_prng_exit(struct crypto_tfm *tfm)
48*4882a593Smuzhiyun {
49*4882a593Smuzhiyun struct sun8i_ss_rng_tfm_ctx *ctx = crypto_tfm_ctx(tfm);
50*4882a593Smuzhiyun
51*4882a593Smuzhiyun memzero_explicit(ctx->seed, ctx->slen);
52*4882a593Smuzhiyun kfree(ctx->seed);
53*4882a593Smuzhiyun ctx->seed = NULL;
54*4882a593Smuzhiyun ctx->slen = 0;
55*4882a593Smuzhiyun }
56*4882a593Smuzhiyun
/**
 * sun8i_ss_prng_generate() - generate random bytes with the SS PRNG
 * @tfm:  RNG transform whose context holds the current seed
 * @src:  additional input, not used by this function
 * @slen: length of @src, not used by this function
 * @dst:  buffer receiving @dlen bytes on success
 * @dlen: number of bytes requested
 *
 * The hardware writes into a temporary DMA buffer that is large enough for
 * the requested data plus extra bytes used to refresh the stored seed.
 * On success the first @dlen bytes are copied to @dst and the following
 * bytes replace the stored seed. The temporary buffer is wiped before being
 * freed.
 *
 * Return: 0 on success, -EINVAL if no seed has been set, -ENOMEM if the
 * temporary buffer cannot be allocated, -EFAULT if a DMA mapping fails or
 * the flow status is still 0 after the wait, or the negative error returned
 * by pm_runtime_get_sync().
 */
int sun8i_ss_prng_generate(struct crypto_rng *tfm, const u8 *src,
			   unsigned int slen, u8 *dst, unsigned int dlen)
{
	struct sun8i_ss_rng_tfm_ctx *ctx = crypto_rng_ctx(tfm);
	struct rng_alg *alg = crypto_rng_alg(tfm);
	struct sun8i_ss_alg_template *algt;
	struct sun8i_ss_dev *ss;
	dma_addr_t dma_iv, dma_dst;
	unsigned int todo;
	int err = 0;
	int flow;
	void *d;
	u32 v;

	algt = container_of(alg, struct sun8i_ss_alg_template, alg.rng);
	ss = algt->ss;

	if (ctx->slen == 0) {
		dev_err(ss->dev, "The PRNG is not seeded\n");
		return -EINVAL;
	}

	/* The SS does not give an updated seed, so we need to get a new one.
	 * So we will ask for an extra PRNG_SEED_SIZE data.
	 * We want dlen + seedsize rounded up to a multiple of PRNG_DATA_SIZE
	 */
	todo = dlen + PRNG_SEED_SIZE + PRNG_DATA_SIZE;
	todo -= todo % PRNG_DATA_SIZE;

	d = kzalloc(todo, GFP_KERNEL | GFP_DMA);
	if (!d)
		return -ENOMEM;

	flow = sun8i_ss_get_engine_number(ss);

#ifdef CONFIG_CRYPTO_DEV_SUN8I_SS_DEBUG
	algt->stat_req++;
	algt->stat_bytes += todo;
#endif

	v = SS_ALG_PRNG | SS_PRNG_CONTINUE | SS_START;
	if (flow)
		v |= SS_FLOW1;
	else
		v |= SS_FLOW0;

	dma_iv = dma_map_single(ss->dev, ctx->seed, ctx->slen, DMA_TO_DEVICE);
	if (dma_mapping_error(ss->dev, dma_iv)) {
		dev_err(ss->dev, "Cannot DMA MAP IV\n");
		err = -EFAULT;
		goto err_free;
	}

	dma_dst = dma_map_single(ss->dev, d, todo, DMA_FROM_DEVICE);
	if (dma_mapping_error(ss->dev, dma_dst)) {
		dev_err(ss->dev, "Cannot DMA MAP DST\n");
		err = -EFAULT;
		goto err_iv;
	}

	err = pm_runtime_get_sync(ss->dev);
	if (err < 0) {
		/* get_sync took a usage reference even though it failed */
		pm_runtime_put_noidle(ss->dev);
		goto err_pm;
	}
	/* pm_runtime_get_sync() may return a positive value on success */
	err = 0;

	mutex_lock(&ss->mlock);
	writel(dma_iv, ss->base + SS_IV_ADR_REG);
	/* the PRNG act badly (failing rngtest) without SS_KEY_ADR_REG set */
	writel(dma_iv, ss->base + SS_KEY_ADR_REG);
	writel(dma_dst, ss->base + SS_DST_ADR_REG);
	/* The length register is programmed in 32-bit words */
	writel(todo / 4, ss->base + SS_LEN_ADR_REG);

	reinit_completion(&ss->flows[flow].complete);
	ss->flows[flow].status = 0;
	/* Be sure all data is written before enabling the task */
	wmb();

	writel(v, ss->base + SS_CTL_REG);

	/* NOTE(review): the return value of the wait is ignored, so a wait
	 * interrupted by a signal is reported below as a DMA timeout and the
	 * buffers are unmapped and freed right after - confirm the hardware
	 * cannot still be writing to them in that case.
	 */
	wait_for_completion_interruptible_timeout(&ss->flows[flow].complete,
						  msecs_to_jiffies(todo));
	if (ss->flows[flow].status == 0) {
		dev_err(ss->dev, "DMA timeout for PRNG (size=%u)\n", todo);
		err = -EFAULT;
	}
	/* Since cipher and hash use the linux/cryptoengine and that we have
	 * a cryptoengine per flow, we are sure that they will issue only one
	 * request per flow.
	 * Since the cryptoengine wait for completion before submitting a new
	 * one, the mlock could be left just after the final writel.
	 * But cryptoengine cannot handle crypto_rng, so we need to be sure
	 * nothing will use our flow.
	 * The easiest way is to grab mlock until the hardware end our requests.
	 * We could have used a per flow lock, but this would increase
	 * complexity.
	 * The drawback is that no request could be handled for the other flow.
	 */
	mutex_unlock(&ss->mlock);

	pm_runtime_put(ss->dev);

err_pm:
	dma_unmap_single(ss->dev, dma_dst, todo, DMA_FROM_DEVICE);
err_iv:
	dma_unmap_single(ss->dev, dma_iv, ctx->slen, DMA_TO_DEVICE);

	if (!err) {
		/* Only todo - dlen bytes follow the caller's data in the
		 * buffer, and the stored seed may be longer than that.
		 * Bound the copy so that refreshing the seed never reads
		 * past the end of the buffer.
		 */
		unsigned int seedlen = min_t(unsigned int, ctx->slen,
					     todo - dlen);

		memcpy(dst, d, dlen);
		/* Update seed */
		memcpy(ctx->seed, d + dlen, seedlen);
	}
	memzero_explicit(d, todo);
err_free:
	kfree(d);

	return err;
}
176