xref: /OK3568_Linux_fs/kernel/drivers/crypto/inside-secure/safexcel.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Copyright (C) 2017 Marvell
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * Antoine Tenart <antoine.tenart@free-electrons.com>
6*4882a593Smuzhiyun  */
7*4882a593Smuzhiyun 
8*4882a593Smuzhiyun #include <linux/clk.h>
9*4882a593Smuzhiyun #include <linux/device.h>
10*4882a593Smuzhiyun #include <linux/dma-mapping.h>
11*4882a593Smuzhiyun #include <linux/dmapool.h>
12*4882a593Smuzhiyun #include <linux/firmware.h>
13*4882a593Smuzhiyun #include <linux/interrupt.h>
14*4882a593Smuzhiyun #include <linux/module.h>
15*4882a593Smuzhiyun #include <linux/of_platform.h>
16*4882a593Smuzhiyun #include <linux/of_irq.h>
17*4882a593Smuzhiyun #include <linux/pci.h>
18*4882a593Smuzhiyun #include <linux/platform_device.h>
19*4882a593Smuzhiyun #include <linux/workqueue.h>
20*4882a593Smuzhiyun 
21*4882a593Smuzhiyun #include <crypto/internal/aead.h>
22*4882a593Smuzhiyun #include <crypto/internal/hash.h>
23*4882a593Smuzhiyun #include <crypto/internal/skcipher.h>
24*4882a593Smuzhiyun 
25*4882a593Smuzhiyun #include "safexcel.h"
26*4882a593Smuzhiyun 
27*4882a593Smuzhiyun static u32 max_rings = EIP197_MAX_RINGS;
28*4882a593Smuzhiyun module_param(max_rings, uint, 0644);
29*4882a593Smuzhiyun MODULE_PARM_DESC(max_rings, "Maximum number of rings to use.");
30*4882a593Smuzhiyun 
eip197_trc_cache_setupvirt(struct safexcel_crypto_priv * priv)31*4882a593Smuzhiyun static void eip197_trc_cache_setupvirt(struct safexcel_crypto_priv *priv)
32*4882a593Smuzhiyun {
33*4882a593Smuzhiyun 	int i;
34*4882a593Smuzhiyun 
35*4882a593Smuzhiyun 	/*
36*4882a593Smuzhiyun 	 * Map all interfaces/rings to register index 0
37*4882a593Smuzhiyun 	 * so they can share contexts. Without this, the EIP197 will
38*4882a593Smuzhiyun 	 * assume each interface/ring to be in its own memory domain
39*4882a593Smuzhiyun 	 * i.e. have its own subset of UNIQUE memory addresses.
40*4882a593Smuzhiyun 	 * Which would cause records with the SAME memory address to
41*4882a593Smuzhiyun 	 * use DIFFERENT cache buffers, causing both poor cache utilization
42*4882a593Smuzhiyun 	 * AND serious coherence/invalidation issues.
43*4882a593Smuzhiyun 	 */
44*4882a593Smuzhiyun 	for (i = 0; i < 4; i++)
45*4882a593Smuzhiyun 		writel(0, priv->base + EIP197_FLUE_IFC_LUT(i));
46*4882a593Smuzhiyun 
47*4882a593Smuzhiyun 	/*
48*4882a593Smuzhiyun 	 * Initialize other virtualization regs for cache
49*4882a593Smuzhiyun 	 * These may not be in their reset state ...
50*4882a593Smuzhiyun 	 */
51*4882a593Smuzhiyun 	for (i = 0; i < priv->config.rings; i++) {
52*4882a593Smuzhiyun 		writel(0, priv->base + EIP197_FLUE_CACHEBASE_LO(i));
53*4882a593Smuzhiyun 		writel(0, priv->base + EIP197_FLUE_CACHEBASE_HI(i));
54*4882a593Smuzhiyun 		writel(EIP197_FLUE_CONFIG_MAGIC,
55*4882a593Smuzhiyun 		       priv->base + EIP197_FLUE_CONFIG(i));
56*4882a593Smuzhiyun 	}
57*4882a593Smuzhiyun 	writel(0, priv->base + EIP197_FLUE_OFFSETS);
58*4882a593Smuzhiyun 	writel(0, priv->base + EIP197_FLUE_ARC4_OFFSET);
59*4882a593Smuzhiyun }
60*4882a593Smuzhiyun 
eip197_trc_cache_banksel(struct safexcel_crypto_priv * priv,u32 addrmid,int * actbank)61*4882a593Smuzhiyun static void eip197_trc_cache_banksel(struct safexcel_crypto_priv *priv,
62*4882a593Smuzhiyun 				     u32 addrmid, int *actbank)
63*4882a593Smuzhiyun {
64*4882a593Smuzhiyun 	u32 val;
65*4882a593Smuzhiyun 	int curbank;
66*4882a593Smuzhiyun 
67*4882a593Smuzhiyun 	curbank = addrmid >> 16;
68*4882a593Smuzhiyun 	if (curbank != *actbank) {
69*4882a593Smuzhiyun 		val = readl(priv->base + EIP197_CS_RAM_CTRL);
70*4882a593Smuzhiyun 		val = (val & ~EIP197_CS_BANKSEL_MASK) |
71*4882a593Smuzhiyun 		      (curbank << EIP197_CS_BANKSEL_OFS);
72*4882a593Smuzhiyun 		writel(val, priv->base + EIP197_CS_RAM_CTRL);
73*4882a593Smuzhiyun 		*actbank = curbank;
74*4882a593Smuzhiyun 	}
75*4882a593Smuzhiyun }
76*4882a593Smuzhiyun 
eip197_trc_cache_probe(struct safexcel_crypto_priv * priv,int maxbanks,u32 probemask,u32 stride)77*4882a593Smuzhiyun static u32 eip197_trc_cache_probe(struct safexcel_crypto_priv *priv,
78*4882a593Smuzhiyun 				  int maxbanks, u32 probemask, u32 stride)
79*4882a593Smuzhiyun {
80*4882a593Smuzhiyun 	u32 val, addrhi, addrlo, addrmid, addralias, delta, marker;
81*4882a593Smuzhiyun 	int actbank;
82*4882a593Smuzhiyun 
83*4882a593Smuzhiyun 	/*
84*4882a593Smuzhiyun 	 * And probe the actual size of the physically attached cache data RAM
85*4882a593Smuzhiyun 	 * Using a binary subdivision algorithm downto 32 byte cache lines.
86*4882a593Smuzhiyun 	 */
87*4882a593Smuzhiyun 	addrhi = 1 << (16 + maxbanks);
88*4882a593Smuzhiyun 	addrlo = 0;
89*4882a593Smuzhiyun 	actbank = min(maxbanks - 1, 0);
90*4882a593Smuzhiyun 	while ((addrhi - addrlo) > stride) {
91*4882a593Smuzhiyun 		/* write marker to lowest address in top half */
92*4882a593Smuzhiyun 		addrmid = (addrhi + addrlo) >> 1;
93*4882a593Smuzhiyun 		marker = (addrmid ^ 0xabadbabe) & probemask; /* Unique */
94*4882a593Smuzhiyun 		eip197_trc_cache_banksel(priv, addrmid, &actbank);
95*4882a593Smuzhiyun 		writel(marker,
96*4882a593Smuzhiyun 			priv->base + EIP197_CLASSIFICATION_RAMS +
97*4882a593Smuzhiyun 			(addrmid & 0xffff));
98*4882a593Smuzhiyun 
99*4882a593Smuzhiyun 		/* write invalid markers to possible aliases */
100*4882a593Smuzhiyun 		delta = 1 << __fls(addrmid);
101*4882a593Smuzhiyun 		while (delta >= stride) {
102*4882a593Smuzhiyun 			addralias = addrmid - delta;
103*4882a593Smuzhiyun 			eip197_trc_cache_banksel(priv, addralias, &actbank);
104*4882a593Smuzhiyun 			writel(~marker,
105*4882a593Smuzhiyun 			       priv->base + EIP197_CLASSIFICATION_RAMS +
106*4882a593Smuzhiyun 			       (addralias & 0xffff));
107*4882a593Smuzhiyun 			delta >>= 1;
108*4882a593Smuzhiyun 		}
109*4882a593Smuzhiyun 
110*4882a593Smuzhiyun 		/* read back marker from top half */
111*4882a593Smuzhiyun 		eip197_trc_cache_banksel(priv, addrmid, &actbank);
112*4882a593Smuzhiyun 		val = readl(priv->base + EIP197_CLASSIFICATION_RAMS +
113*4882a593Smuzhiyun 			    (addrmid & 0xffff));
114*4882a593Smuzhiyun 
115*4882a593Smuzhiyun 		if ((val & probemask) == marker)
116*4882a593Smuzhiyun 			/* read back correct, continue with top half */
117*4882a593Smuzhiyun 			addrlo = addrmid;
118*4882a593Smuzhiyun 		else
119*4882a593Smuzhiyun 			/* not read back correct, continue with bottom half */
120*4882a593Smuzhiyun 			addrhi = addrmid;
121*4882a593Smuzhiyun 	}
122*4882a593Smuzhiyun 	return addrhi;
123*4882a593Smuzhiyun }
124*4882a593Smuzhiyun 
eip197_trc_cache_clear(struct safexcel_crypto_priv * priv,int cs_rc_max,int cs_ht_wc)125*4882a593Smuzhiyun static void eip197_trc_cache_clear(struct safexcel_crypto_priv *priv,
126*4882a593Smuzhiyun 				   int cs_rc_max, int cs_ht_wc)
127*4882a593Smuzhiyun {
128*4882a593Smuzhiyun 	int i;
129*4882a593Smuzhiyun 	u32 htable_offset, val, offset;
130*4882a593Smuzhiyun 
131*4882a593Smuzhiyun 	/* Clear all records in administration RAM */
132*4882a593Smuzhiyun 	for (i = 0; i < cs_rc_max; i++) {
133*4882a593Smuzhiyun 		offset = EIP197_CLASSIFICATION_RAMS + i * EIP197_CS_RC_SIZE;
134*4882a593Smuzhiyun 
135*4882a593Smuzhiyun 		writel(EIP197_CS_RC_NEXT(EIP197_RC_NULL) |
136*4882a593Smuzhiyun 		       EIP197_CS_RC_PREV(EIP197_RC_NULL),
137*4882a593Smuzhiyun 		       priv->base + offset);
138*4882a593Smuzhiyun 
139*4882a593Smuzhiyun 		val = EIP197_CS_RC_NEXT(i + 1) | EIP197_CS_RC_PREV(i - 1);
140*4882a593Smuzhiyun 		if (i == 0)
141*4882a593Smuzhiyun 			val |= EIP197_CS_RC_PREV(EIP197_RC_NULL);
142*4882a593Smuzhiyun 		else if (i == cs_rc_max - 1)
143*4882a593Smuzhiyun 			val |= EIP197_CS_RC_NEXT(EIP197_RC_NULL);
144*4882a593Smuzhiyun 		writel(val, priv->base + offset + 4);
145*4882a593Smuzhiyun 		/* must also initialize the address key due to ECC! */
146*4882a593Smuzhiyun 		writel(0, priv->base + offset + 8);
147*4882a593Smuzhiyun 		writel(0, priv->base + offset + 12);
148*4882a593Smuzhiyun 	}
149*4882a593Smuzhiyun 
150*4882a593Smuzhiyun 	/* Clear the hash table entries */
151*4882a593Smuzhiyun 	htable_offset = cs_rc_max * EIP197_CS_RC_SIZE;
152*4882a593Smuzhiyun 	for (i = 0; i < cs_ht_wc; i++)
153*4882a593Smuzhiyun 		writel(GENMASK(29, 0),
154*4882a593Smuzhiyun 		       priv->base + EIP197_CLASSIFICATION_RAMS +
155*4882a593Smuzhiyun 		       htable_offset + i * sizeof(u32));
156*4882a593Smuzhiyun }
157*4882a593Smuzhiyun 
eip197_trc_cache_init(struct safexcel_crypto_priv * priv)158*4882a593Smuzhiyun static int eip197_trc_cache_init(struct safexcel_crypto_priv *priv)
159*4882a593Smuzhiyun {
160*4882a593Smuzhiyun 	u32 val, dsize, asize;
161*4882a593Smuzhiyun 	int cs_rc_max, cs_ht_wc, cs_trc_rec_wc, cs_trc_lg_rec_wc;
162*4882a593Smuzhiyun 	int cs_rc_abs_max, cs_ht_sz;
163*4882a593Smuzhiyun 	int maxbanks;
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun 	/* Setup (dummy) virtualization for cache */
166*4882a593Smuzhiyun 	eip197_trc_cache_setupvirt(priv);
167*4882a593Smuzhiyun 
168*4882a593Smuzhiyun 	/*
169*4882a593Smuzhiyun 	 * Enable the record cache memory access and
170*4882a593Smuzhiyun 	 * probe the bank select width
171*4882a593Smuzhiyun 	 */
172*4882a593Smuzhiyun 	val = readl(priv->base + EIP197_CS_RAM_CTRL);
173*4882a593Smuzhiyun 	val &= ~EIP197_TRC_ENABLE_MASK;
174*4882a593Smuzhiyun 	val |= EIP197_TRC_ENABLE_0 | EIP197_CS_BANKSEL_MASK;
175*4882a593Smuzhiyun 	writel(val, priv->base + EIP197_CS_RAM_CTRL);
176*4882a593Smuzhiyun 	val = readl(priv->base + EIP197_CS_RAM_CTRL);
177*4882a593Smuzhiyun 	maxbanks = ((val&EIP197_CS_BANKSEL_MASK)>>EIP197_CS_BANKSEL_OFS) + 1;
178*4882a593Smuzhiyun 
179*4882a593Smuzhiyun 	/* Clear all ECC errors */
180*4882a593Smuzhiyun 	writel(0, priv->base + EIP197_TRC_ECCCTRL);
181*4882a593Smuzhiyun 
182*4882a593Smuzhiyun 	/*
183*4882a593Smuzhiyun 	 * Make sure the cache memory is accessible by taking record cache into
184*4882a593Smuzhiyun 	 * reset. Need data memory access here, not admin access.
185*4882a593Smuzhiyun 	 */
186*4882a593Smuzhiyun 	val = readl(priv->base + EIP197_TRC_PARAMS);
187*4882a593Smuzhiyun 	val |= EIP197_TRC_PARAMS_SW_RESET | EIP197_TRC_PARAMS_DATA_ACCESS;
188*4882a593Smuzhiyun 	writel(val, priv->base + EIP197_TRC_PARAMS);
189*4882a593Smuzhiyun 
190*4882a593Smuzhiyun 	/* Probed data RAM size in bytes */
191*4882a593Smuzhiyun 	dsize = eip197_trc_cache_probe(priv, maxbanks, 0xffffffff, 32);
192*4882a593Smuzhiyun 
193*4882a593Smuzhiyun 	/*
194*4882a593Smuzhiyun 	 * Now probe the administration RAM size pretty much the same way
195*4882a593Smuzhiyun 	 * Except that only the lower 30 bits are writable and we don't need
196*4882a593Smuzhiyun 	 * bank selects
197*4882a593Smuzhiyun 	 */
198*4882a593Smuzhiyun 	val = readl(priv->base + EIP197_TRC_PARAMS);
199*4882a593Smuzhiyun 	/* admin access now */
200*4882a593Smuzhiyun 	val &= ~(EIP197_TRC_PARAMS_DATA_ACCESS | EIP197_CS_BANKSEL_MASK);
201*4882a593Smuzhiyun 	writel(val, priv->base + EIP197_TRC_PARAMS);
202*4882a593Smuzhiyun 
203*4882a593Smuzhiyun 	/* Probed admin RAM size in admin words */
204*4882a593Smuzhiyun 	asize = eip197_trc_cache_probe(priv, 0, 0x3fffffff, 16) >> 4;
205*4882a593Smuzhiyun 
206*4882a593Smuzhiyun 	/* Clear any ECC errors detected while probing! */
207*4882a593Smuzhiyun 	writel(0, priv->base + EIP197_TRC_ECCCTRL);
208*4882a593Smuzhiyun 
209*4882a593Smuzhiyun 	/* Sanity check probing results */
210*4882a593Smuzhiyun 	if (dsize < EIP197_MIN_DSIZE || asize < EIP197_MIN_ASIZE) {
211*4882a593Smuzhiyun 		dev_err(priv->dev, "Record cache probing failed (%d,%d).",
212*4882a593Smuzhiyun 			dsize, asize);
213*4882a593Smuzhiyun 		return -ENODEV;
214*4882a593Smuzhiyun 	}
215*4882a593Smuzhiyun 
216*4882a593Smuzhiyun 	/*
217*4882a593Smuzhiyun 	 * Determine optimal configuration from RAM sizes
218*4882a593Smuzhiyun 	 * Note that we assume that the physical RAM configuration is sane
219*4882a593Smuzhiyun 	 * Therefore, we don't do any parameter error checking here ...
220*4882a593Smuzhiyun 	 */
221*4882a593Smuzhiyun 
222*4882a593Smuzhiyun 	/* For now, just use a single record format covering everything */
223*4882a593Smuzhiyun 	cs_trc_rec_wc = EIP197_CS_TRC_REC_WC;
224*4882a593Smuzhiyun 	cs_trc_lg_rec_wc = EIP197_CS_TRC_REC_WC;
225*4882a593Smuzhiyun 
226*4882a593Smuzhiyun 	/*
227*4882a593Smuzhiyun 	 * Step #1: How many records will physically fit?
228*4882a593Smuzhiyun 	 * Hard upper limit is 1023!
229*4882a593Smuzhiyun 	 */
230*4882a593Smuzhiyun 	cs_rc_abs_max = min_t(uint, ((dsize >> 2) / cs_trc_lg_rec_wc), 1023);
231*4882a593Smuzhiyun 	/* Step #2: Need at least 2 words in the admin RAM per record */
232*4882a593Smuzhiyun 	cs_rc_max = min_t(uint, cs_rc_abs_max, (asize >> 1));
233*4882a593Smuzhiyun 	/* Step #3: Determine log2 of hash table size */
234*4882a593Smuzhiyun 	cs_ht_sz = __fls(asize - cs_rc_max) - 2;
235*4882a593Smuzhiyun 	/* Step #4: determine current size of hash table in dwords */
236*4882a593Smuzhiyun 	cs_ht_wc = 16 << cs_ht_sz; /* dwords, not admin words */
237*4882a593Smuzhiyun 	/* Step #5: add back excess words and see if we can fit more records */
238*4882a593Smuzhiyun 	cs_rc_max = min_t(uint, cs_rc_abs_max, asize - (cs_ht_wc >> 2));
239*4882a593Smuzhiyun 
240*4882a593Smuzhiyun 	/* Clear the cache RAMs */
241*4882a593Smuzhiyun 	eip197_trc_cache_clear(priv, cs_rc_max, cs_ht_wc);
242*4882a593Smuzhiyun 
243*4882a593Smuzhiyun 	/* Disable the record cache memory access */
244*4882a593Smuzhiyun 	val = readl(priv->base + EIP197_CS_RAM_CTRL);
245*4882a593Smuzhiyun 	val &= ~EIP197_TRC_ENABLE_MASK;
246*4882a593Smuzhiyun 	writel(val, priv->base + EIP197_CS_RAM_CTRL);
247*4882a593Smuzhiyun 
248*4882a593Smuzhiyun 	/* Write head and tail pointers of the record free chain */
249*4882a593Smuzhiyun 	val = EIP197_TRC_FREECHAIN_HEAD_PTR(0) |
250*4882a593Smuzhiyun 	      EIP197_TRC_FREECHAIN_TAIL_PTR(cs_rc_max - 1);
251*4882a593Smuzhiyun 	writel(val, priv->base + EIP197_TRC_FREECHAIN);
252*4882a593Smuzhiyun 
253*4882a593Smuzhiyun 	/* Configure the record cache #1 */
254*4882a593Smuzhiyun 	val = EIP197_TRC_PARAMS2_RC_SZ_SMALL(cs_trc_rec_wc) |
255*4882a593Smuzhiyun 	      EIP197_TRC_PARAMS2_HTABLE_PTR(cs_rc_max);
256*4882a593Smuzhiyun 	writel(val, priv->base + EIP197_TRC_PARAMS2);
257*4882a593Smuzhiyun 
258*4882a593Smuzhiyun 	/* Configure the record cache #2 */
259*4882a593Smuzhiyun 	val = EIP197_TRC_PARAMS_RC_SZ_LARGE(cs_trc_lg_rec_wc) |
260*4882a593Smuzhiyun 	      EIP197_TRC_PARAMS_BLK_TIMER_SPEED(1) |
261*4882a593Smuzhiyun 	      EIP197_TRC_PARAMS_HTABLE_SZ(cs_ht_sz);
262*4882a593Smuzhiyun 	writel(val, priv->base + EIP197_TRC_PARAMS);
263*4882a593Smuzhiyun 
264*4882a593Smuzhiyun 	dev_info(priv->dev, "TRC init: %dd,%da (%dr,%dh)\n",
265*4882a593Smuzhiyun 		 dsize, asize, cs_rc_max, cs_ht_wc + cs_ht_wc);
266*4882a593Smuzhiyun 	return 0;
267*4882a593Smuzhiyun }
268*4882a593Smuzhiyun 
eip197_init_firmware(struct safexcel_crypto_priv * priv)269*4882a593Smuzhiyun static void eip197_init_firmware(struct safexcel_crypto_priv *priv)
270*4882a593Smuzhiyun {
271*4882a593Smuzhiyun 	int pe, i;
272*4882a593Smuzhiyun 	u32 val;
273*4882a593Smuzhiyun 
274*4882a593Smuzhiyun 	for (pe = 0; pe < priv->config.pes; pe++) {
275*4882a593Smuzhiyun 		/* Configure the token FIFO's */
276*4882a593Smuzhiyun 		writel(3, EIP197_PE(priv) + EIP197_PE_ICE_PUTF_CTRL(pe));
277*4882a593Smuzhiyun 		writel(0, EIP197_PE(priv) + EIP197_PE_ICE_PPTF_CTRL(pe));
278*4882a593Smuzhiyun 
279*4882a593Smuzhiyun 		/* Clear the ICE scratchpad memory */
280*4882a593Smuzhiyun 		val = readl(EIP197_PE(priv) + EIP197_PE_ICE_SCRATCH_CTRL(pe));
281*4882a593Smuzhiyun 		val |= EIP197_PE_ICE_SCRATCH_CTRL_CHANGE_TIMER |
282*4882a593Smuzhiyun 		       EIP197_PE_ICE_SCRATCH_CTRL_TIMER_EN |
283*4882a593Smuzhiyun 		       EIP197_PE_ICE_SCRATCH_CTRL_SCRATCH_ACCESS |
284*4882a593Smuzhiyun 		       EIP197_PE_ICE_SCRATCH_CTRL_CHANGE_ACCESS;
285*4882a593Smuzhiyun 		writel(val, EIP197_PE(priv) + EIP197_PE_ICE_SCRATCH_CTRL(pe));
286*4882a593Smuzhiyun 
287*4882a593Smuzhiyun 		/* clear the scratchpad RAM using 32 bit writes only */
288*4882a593Smuzhiyun 		for (i = 0; i < EIP197_NUM_OF_SCRATCH_BLOCKS; i++)
289*4882a593Smuzhiyun 			writel(0, EIP197_PE(priv) +
290*4882a593Smuzhiyun 				  EIP197_PE_ICE_SCRATCH_RAM(pe) + (i << 2));
291*4882a593Smuzhiyun 
292*4882a593Smuzhiyun 		/* Reset the IFPP engine to make its program mem accessible */
293*4882a593Smuzhiyun 		writel(EIP197_PE_ICE_x_CTRL_SW_RESET |
294*4882a593Smuzhiyun 		       EIP197_PE_ICE_x_CTRL_CLR_ECC_CORR |
295*4882a593Smuzhiyun 		       EIP197_PE_ICE_x_CTRL_CLR_ECC_NON_CORR,
296*4882a593Smuzhiyun 		       EIP197_PE(priv) + EIP197_PE_ICE_FPP_CTRL(pe));
297*4882a593Smuzhiyun 
298*4882a593Smuzhiyun 		/* Reset the IPUE engine to make its program mem accessible */
299*4882a593Smuzhiyun 		writel(EIP197_PE_ICE_x_CTRL_SW_RESET |
300*4882a593Smuzhiyun 		       EIP197_PE_ICE_x_CTRL_CLR_ECC_CORR |
301*4882a593Smuzhiyun 		       EIP197_PE_ICE_x_CTRL_CLR_ECC_NON_CORR,
302*4882a593Smuzhiyun 		       EIP197_PE(priv) + EIP197_PE_ICE_PUE_CTRL(pe));
303*4882a593Smuzhiyun 
304*4882a593Smuzhiyun 		/* Enable access to all IFPP program memories */
305*4882a593Smuzhiyun 		writel(EIP197_PE_ICE_RAM_CTRL_FPP_PROG_EN,
306*4882a593Smuzhiyun 		       EIP197_PE(priv) + EIP197_PE_ICE_RAM_CTRL(pe));
307*4882a593Smuzhiyun 
308*4882a593Smuzhiyun 		/* bypass the OCE, if present */
309*4882a593Smuzhiyun 		if (priv->flags & EIP197_OCE)
310*4882a593Smuzhiyun 			writel(EIP197_DEBUG_OCE_BYPASS, EIP197_PE(priv) +
311*4882a593Smuzhiyun 							EIP197_PE_DEBUG(pe));
312*4882a593Smuzhiyun 	}
313*4882a593Smuzhiyun 
314*4882a593Smuzhiyun }
315*4882a593Smuzhiyun 
eip197_write_firmware(struct safexcel_crypto_priv * priv,const struct firmware * fw)316*4882a593Smuzhiyun static int eip197_write_firmware(struct safexcel_crypto_priv *priv,
317*4882a593Smuzhiyun 				  const struct firmware *fw)
318*4882a593Smuzhiyun {
319*4882a593Smuzhiyun 	const __be32 *data = (const __be32 *)fw->data;
320*4882a593Smuzhiyun 	int i;
321*4882a593Smuzhiyun 
322*4882a593Smuzhiyun 	/* Write the firmware */
323*4882a593Smuzhiyun 	for (i = 0; i < fw->size / sizeof(u32); i++)
324*4882a593Smuzhiyun 		writel(be32_to_cpu(data[i]),
325*4882a593Smuzhiyun 		       priv->base + EIP197_CLASSIFICATION_RAMS +
326*4882a593Smuzhiyun 		       i * sizeof(__be32));
327*4882a593Smuzhiyun 
328*4882a593Smuzhiyun 	/* Exclude final 2 NOPs from size */
329*4882a593Smuzhiyun 	return i - EIP197_FW_TERMINAL_NOPS;
330*4882a593Smuzhiyun }
331*4882a593Smuzhiyun 
332*4882a593Smuzhiyun /*
333*4882a593Smuzhiyun  * If FW is actual production firmware, then poll for its initialization
334*4882a593Smuzhiyun  * to complete and check if it is good for the HW, otherwise just return OK.
335*4882a593Smuzhiyun  */
poll_fw_ready(struct safexcel_crypto_priv * priv,int fpp)336*4882a593Smuzhiyun static bool poll_fw_ready(struct safexcel_crypto_priv *priv, int fpp)
337*4882a593Smuzhiyun {
338*4882a593Smuzhiyun 	int pe, pollcnt;
339*4882a593Smuzhiyun 	u32 base, pollofs;
340*4882a593Smuzhiyun 
341*4882a593Smuzhiyun 	if (fpp)
342*4882a593Smuzhiyun 		pollofs  = EIP197_FW_FPP_READY;
343*4882a593Smuzhiyun 	else
344*4882a593Smuzhiyun 		pollofs  = EIP197_FW_PUE_READY;
345*4882a593Smuzhiyun 
346*4882a593Smuzhiyun 	for (pe = 0; pe < priv->config.pes; pe++) {
347*4882a593Smuzhiyun 		base = EIP197_PE_ICE_SCRATCH_RAM(pe);
348*4882a593Smuzhiyun 		pollcnt = EIP197_FW_START_POLLCNT;
349*4882a593Smuzhiyun 		while (pollcnt &&
350*4882a593Smuzhiyun 		       (readl_relaxed(EIP197_PE(priv) + base +
351*4882a593Smuzhiyun 			      pollofs) != 1)) {
352*4882a593Smuzhiyun 			pollcnt--;
353*4882a593Smuzhiyun 		}
354*4882a593Smuzhiyun 		if (!pollcnt) {
355*4882a593Smuzhiyun 			dev_err(priv->dev, "FW(%d) for PE %d failed to start\n",
356*4882a593Smuzhiyun 				fpp, pe);
357*4882a593Smuzhiyun 			return false;
358*4882a593Smuzhiyun 		}
359*4882a593Smuzhiyun 	}
360*4882a593Smuzhiyun 	return true;
361*4882a593Smuzhiyun }
362*4882a593Smuzhiyun 
eip197_start_firmware(struct safexcel_crypto_priv * priv,int ipuesz,int ifppsz,int minifw)363*4882a593Smuzhiyun static bool eip197_start_firmware(struct safexcel_crypto_priv *priv,
364*4882a593Smuzhiyun 				  int ipuesz, int ifppsz, int minifw)
365*4882a593Smuzhiyun {
366*4882a593Smuzhiyun 	int pe;
367*4882a593Smuzhiyun 	u32 val;
368*4882a593Smuzhiyun 
369*4882a593Smuzhiyun 	for (pe = 0; pe < priv->config.pes; pe++) {
370*4882a593Smuzhiyun 		/* Disable access to all program memory */
371*4882a593Smuzhiyun 		writel(0, EIP197_PE(priv) + EIP197_PE_ICE_RAM_CTRL(pe));
372*4882a593Smuzhiyun 
373*4882a593Smuzhiyun 		/* Start IFPP microengines */
374*4882a593Smuzhiyun 		if (minifw)
375*4882a593Smuzhiyun 			val = 0;
376*4882a593Smuzhiyun 		else
377*4882a593Smuzhiyun 			val = EIP197_PE_ICE_UENG_START_OFFSET((ifppsz - 1) &
378*4882a593Smuzhiyun 					EIP197_PE_ICE_UENG_INIT_ALIGN_MASK) |
379*4882a593Smuzhiyun 				EIP197_PE_ICE_UENG_DEBUG_RESET;
380*4882a593Smuzhiyun 		writel(val, EIP197_PE(priv) + EIP197_PE_ICE_FPP_CTRL(pe));
381*4882a593Smuzhiyun 
382*4882a593Smuzhiyun 		/* Start IPUE microengines */
383*4882a593Smuzhiyun 		if (minifw)
384*4882a593Smuzhiyun 			val = 0;
385*4882a593Smuzhiyun 		else
386*4882a593Smuzhiyun 			val = EIP197_PE_ICE_UENG_START_OFFSET((ipuesz - 1) &
387*4882a593Smuzhiyun 					EIP197_PE_ICE_UENG_INIT_ALIGN_MASK) |
388*4882a593Smuzhiyun 				EIP197_PE_ICE_UENG_DEBUG_RESET;
389*4882a593Smuzhiyun 		writel(val, EIP197_PE(priv) + EIP197_PE_ICE_PUE_CTRL(pe));
390*4882a593Smuzhiyun 	}
391*4882a593Smuzhiyun 
392*4882a593Smuzhiyun 	/* For miniFW startup, there is no initialization, so always succeed */
393*4882a593Smuzhiyun 	if (minifw)
394*4882a593Smuzhiyun 		return true;
395*4882a593Smuzhiyun 
396*4882a593Smuzhiyun 	/* Wait until all the firmwares have properly started up */
397*4882a593Smuzhiyun 	if (!poll_fw_ready(priv, 1))
398*4882a593Smuzhiyun 		return false;
399*4882a593Smuzhiyun 	if (!poll_fw_ready(priv, 0))
400*4882a593Smuzhiyun 		return false;
401*4882a593Smuzhiyun 
402*4882a593Smuzhiyun 	return true;
403*4882a593Smuzhiyun }
404*4882a593Smuzhiyun 
eip197_load_firmwares(struct safexcel_crypto_priv * priv)405*4882a593Smuzhiyun static int eip197_load_firmwares(struct safexcel_crypto_priv *priv)
406*4882a593Smuzhiyun {
407*4882a593Smuzhiyun 	const char *fw_name[] = {"ifpp.bin", "ipue.bin"};
408*4882a593Smuzhiyun 	const struct firmware *fw[FW_NB];
409*4882a593Smuzhiyun 	char fw_path[37], *dir = NULL;
410*4882a593Smuzhiyun 	int i, j, ret = 0, pe;
411*4882a593Smuzhiyun 	int ipuesz, ifppsz, minifw = 0;
412*4882a593Smuzhiyun 
413*4882a593Smuzhiyun 	if (priv->version == EIP197D_MRVL)
414*4882a593Smuzhiyun 		dir = "eip197d";
415*4882a593Smuzhiyun 	else if (priv->version == EIP197B_MRVL ||
416*4882a593Smuzhiyun 		 priv->version == EIP197_DEVBRD)
417*4882a593Smuzhiyun 		dir = "eip197b";
418*4882a593Smuzhiyun 	else
419*4882a593Smuzhiyun 		return -ENODEV;
420*4882a593Smuzhiyun 
421*4882a593Smuzhiyun retry_fw:
422*4882a593Smuzhiyun 	for (i = 0; i < FW_NB; i++) {
423*4882a593Smuzhiyun 		snprintf(fw_path, 37, "inside-secure/%s/%s", dir, fw_name[i]);
424*4882a593Smuzhiyun 		ret = firmware_request_nowarn(&fw[i], fw_path, priv->dev);
425*4882a593Smuzhiyun 		if (ret) {
426*4882a593Smuzhiyun 			if (minifw || priv->version != EIP197B_MRVL)
427*4882a593Smuzhiyun 				goto release_fw;
428*4882a593Smuzhiyun 
429*4882a593Smuzhiyun 			/* Fallback to the old firmware location for the
430*4882a593Smuzhiyun 			 * EIP197b.
431*4882a593Smuzhiyun 			 */
432*4882a593Smuzhiyun 			ret = firmware_request_nowarn(&fw[i], fw_name[i],
433*4882a593Smuzhiyun 						      priv->dev);
434*4882a593Smuzhiyun 			if (ret)
435*4882a593Smuzhiyun 				goto release_fw;
436*4882a593Smuzhiyun 		}
437*4882a593Smuzhiyun 	}
438*4882a593Smuzhiyun 
439*4882a593Smuzhiyun 	eip197_init_firmware(priv);
440*4882a593Smuzhiyun 
441*4882a593Smuzhiyun 	ifppsz = eip197_write_firmware(priv, fw[FW_IFPP]);
442*4882a593Smuzhiyun 
443*4882a593Smuzhiyun 	/* Enable access to IPUE program memories */
444*4882a593Smuzhiyun 	for (pe = 0; pe < priv->config.pes; pe++)
445*4882a593Smuzhiyun 		writel(EIP197_PE_ICE_RAM_CTRL_PUE_PROG_EN,
446*4882a593Smuzhiyun 		       EIP197_PE(priv) + EIP197_PE_ICE_RAM_CTRL(pe));
447*4882a593Smuzhiyun 
448*4882a593Smuzhiyun 	ipuesz = eip197_write_firmware(priv, fw[FW_IPUE]);
449*4882a593Smuzhiyun 
450*4882a593Smuzhiyun 	if (eip197_start_firmware(priv, ipuesz, ifppsz, minifw)) {
451*4882a593Smuzhiyun 		dev_dbg(priv->dev, "Firmware loaded successfully\n");
452*4882a593Smuzhiyun 		return 0;
453*4882a593Smuzhiyun 	}
454*4882a593Smuzhiyun 
455*4882a593Smuzhiyun 	ret = -ENODEV;
456*4882a593Smuzhiyun 
457*4882a593Smuzhiyun release_fw:
458*4882a593Smuzhiyun 	for (j = 0; j < i; j++)
459*4882a593Smuzhiyun 		release_firmware(fw[j]);
460*4882a593Smuzhiyun 
461*4882a593Smuzhiyun 	if (!minifw) {
462*4882a593Smuzhiyun 		/* Retry with minifw path */
463*4882a593Smuzhiyun 		dev_dbg(priv->dev, "Firmware set not (fully) present or init failed, falling back to BCLA mode\n");
464*4882a593Smuzhiyun 		dir = "eip197_minifw";
465*4882a593Smuzhiyun 		minifw = 1;
466*4882a593Smuzhiyun 		goto retry_fw;
467*4882a593Smuzhiyun 	}
468*4882a593Smuzhiyun 
469*4882a593Smuzhiyun 	dev_dbg(priv->dev, "Firmware load failed.\n");
470*4882a593Smuzhiyun 
471*4882a593Smuzhiyun 	return ret;
472*4882a593Smuzhiyun }
473*4882a593Smuzhiyun 
safexcel_hw_setup_cdesc_rings(struct safexcel_crypto_priv * priv)474*4882a593Smuzhiyun static int safexcel_hw_setup_cdesc_rings(struct safexcel_crypto_priv *priv)
475*4882a593Smuzhiyun {
476*4882a593Smuzhiyun 	u32 cd_size_rnd, val;
477*4882a593Smuzhiyun 	int i, cd_fetch_cnt;
478*4882a593Smuzhiyun 
479*4882a593Smuzhiyun 	cd_size_rnd  = (priv->config.cd_size +
480*4882a593Smuzhiyun 			(BIT(priv->hwconfig.hwdataw) - 1)) >>
481*4882a593Smuzhiyun 		       priv->hwconfig.hwdataw;
482*4882a593Smuzhiyun 	/* determine number of CD's we can fetch into the CD FIFO as 1 block */
483*4882a593Smuzhiyun 	if (priv->flags & SAFEXCEL_HW_EIP197) {
484*4882a593Smuzhiyun 		/* EIP197: try to fetch enough in 1 go to keep all pipes busy */
485*4882a593Smuzhiyun 		cd_fetch_cnt = (1 << priv->hwconfig.hwcfsize) / cd_size_rnd;
486*4882a593Smuzhiyun 		cd_fetch_cnt = min_t(uint, cd_fetch_cnt,
487*4882a593Smuzhiyun 				     (priv->config.pes * EIP197_FETCH_DEPTH));
488*4882a593Smuzhiyun 	} else {
489*4882a593Smuzhiyun 		/* for the EIP97, just fetch all that fits minus 1 */
490*4882a593Smuzhiyun 		cd_fetch_cnt = ((1 << priv->hwconfig.hwcfsize) /
491*4882a593Smuzhiyun 				cd_size_rnd) - 1;
492*4882a593Smuzhiyun 	}
493*4882a593Smuzhiyun 	/*
494*4882a593Smuzhiyun 	 * Since we're using command desc's way larger than formally specified,
495*4882a593Smuzhiyun 	 * we need to check whether we can fit even 1 for low-end EIP196's!
496*4882a593Smuzhiyun 	 */
497*4882a593Smuzhiyun 	if (!cd_fetch_cnt) {
498*4882a593Smuzhiyun 		dev_err(priv->dev, "Unable to fit even 1 command desc!\n");
499*4882a593Smuzhiyun 		return -ENODEV;
500*4882a593Smuzhiyun 	}
501*4882a593Smuzhiyun 
502*4882a593Smuzhiyun 	for (i = 0; i < priv->config.rings; i++) {
503*4882a593Smuzhiyun 		/* ring base address */
504*4882a593Smuzhiyun 		writel(lower_32_bits(priv->ring[i].cdr.base_dma),
505*4882a593Smuzhiyun 		       EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_RING_BASE_ADDR_LO);
506*4882a593Smuzhiyun 		writel(upper_32_bits(priv->ring[i].cdr.base_dma),
507*4882a593Smuzhiyun 		       EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_RING_BASE_ADDR_HI);
508*4882a593Smuzhiyun 
509*4882a593Smuzhiyun 		writel(EIP197_xDR_DESC_MODE_64BIT | EIP197_CDR_DESC_MODE_ADCP |
510*4882a593Smuzhiyun 		       (priv->config.cd_offset << 14) | priv->config.cd_size,
511*4882a593Smuzhiyun 		       EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_DESC_SIZE);
512*4882a593Smuzhiyun 		writel(((cd_fetch_cnt *
513*4882a593Smuzhiyun 			 (cd_size_rnd << priv->hwconfig.hwdataw)) << 16) |
514*4882a593Smuzhiyun 		       (cd_fetch_cnt * (priv->config.cd_offset / sizeof(u32))),
515*4882a593Smuzhiyun 		       EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_CFG);
516*4882a593Smuzhiyun 
517*4882a593Smuzhiyun 		/* Configure DMA tx control */
518*4882a593Smuzhiyun 		val = EIP197_HIA_xDR_CFG_WR_CACHE(WR_CACHE_3BITS);
519*4882a593Smuzhiyun 		val |= EIP197_HIA_xDR_CFG_RD_CACHE(RD_CACHE_3BITS);
520*4882a593Smuzhiyun 		writel(val, EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_DMA_CFG);
521*4882a593Smuzhiyun 
522*4882a593Smuzhiyun 		/* clear any pending interrupt */
523*4882a593Smuzhiyun 		writel(GENMASK(5, 0),
524*4882a593Smuzhiyun 		       EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_STAT);
525*4882a593Smuzhiyun 	}
526*4882a593Smuzhiyun 
527*4882a593Smuzhiyun 	return 0;
528*4882a593Smuzhiyun }
529*4882a593Smuzhiyun 
safexcel_hw_setup_rdesc_rings(struct safexcel_crypto_priv * priv)530*4882a593Smuzhiyun static int safexcel_hw_setup_rdesc_rings(struct safexcel_crypto_priv *priv)
531*4882a593Smuzhiyun {
532*4882a593Smuzhiyun 	u32 rd_size_rnd, val;
533*4882a593Smuzhiyun 	int i, rd_fetch_cnt;
534*4882a593Smuzhiyun 
535*4882a593Smuzhiyun 	/* determine number of RD's we can fetch into the FIFO as one block */
536*4882a593Smuzhiyun 	rd_size_rnd = (EIP197_RD64_FETCH_SIZE +
537*4882a593Smuzhiyun 		       (BIT(priv->hwconfig.hwdataw) - 1)) >>
538*4882a593Smuzhiyun 		      priv->hwconfig.hwdataw;
539*4882a593Smuzhiyun 	if (priv->flags & SAFEXCEL_HW_EIP197) {
540*4882a593Smuzhiyun 		/* EIP197: try to fetch enough in 1 go to keep all pipes busy */
541*4882a593Smuzhiyun 		rd_fetch_cnt = (1 << priv->hwconfig.hwrfsize) / rd_size_rnd;
542*4882a593Smuzhiyun 		rd_fetch_cnt = min_t(uint, rd_fetch_cnt,
543*4882a593Smuzhiyun 				     (priv->config.pes * EIP197_FETCH_DEPTH));
544*4882a593Smuzhiyun 	} else {
545*4882a593Smuzhiyun 		/* for the EIP97, just fetch all that fits minus 1 */
546*4882a593Smuzhiyun 		rd_fetch_cnt = ((1 << priv->hwconfig.hwrfsize) /
547*4882a593Smuzhiyun 				rd_size_rnd) - 1;
548*4882a593Smuzhiyun 	}
549*4882a593Smuzhiyun 
550*4882a593Smuzhiyun 	for (i = 0; i < priv->config.rings; i++) {
551*4882a593Smuzhiyun 		/* ring base address */
552*4882a593Smuzhiyun 		writel(lower_32_bits(priv->ring[i].rdr.base_dma),
553*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_RING_BASE_ADDR_LO);
554*4882a593Smuzhiyun 		writel(upper_32_bits(priv->ring[i].rdr.base_dma),
555*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_RING_BASE_ADDR_HI);
556*4882a593Smuzhiyun 
557*4882a593Smuzhiyun 		writel(EIP197_xDR_DESC_MODE_64BIT | (priv->config.rd_offset << 14) |
558*4882a593Smuzhiyun 		       priv->config.rd_size,
559*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_DESC_SIZE);
560*4882a593Smuzhiyun 
561*4882a593Smuzhiyun 		writel(((rd_fetch_cnt *
562*4882a593Smuzhiyun 			 (rd_size_rnd << priv->hwconfig.hwdataw)) << 16) |
563*4882a593Smuzhiyun 		       (rd_fetch_cnt * (priv->config.rd_offset / sizeof(u32))),
564*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_CFG);
565*4882a593Smuzhiyun 
566*4882a593Smuzhiyun 		/* Configure DMA tx control */
567*4882a593Smuzhiyun 		val = EIP197_HIA_xDR_CFG_WR_CACHE(WR_CACHE_3BITS);
568*4882a593Smuzhiyun 		val |= EIP197_HIA_xDR_CFG_RD_CACHE(RD_CACHE_3BITS);
569*4882a593Smuzhiyun 		val |= EIP197_HIA_xDR_WR_RES_BUF | EIP197_HIA_xDR_WR_CTRL_BUF;
570*4882a593Smuzhiyun 		writel(val,
571*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_DMA_CFG);
572*4882a593Smuzhiyun 
573*4882a593Smuzhiyun 		/* clear any pending interrupt */
574*4882a593Smuzhiyun 		writel(GENMASK(7, 0),
575*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_STAT);
576*4882a593Smuzhiyun 
577*4882a593Smuzhiyun 		/* enable ring interrupt */
578*4882a593Smuzhiyun 		val = readl(EIP197_HIA_AIC_R(priv) + EIP197_HIA_AIC_R_ENABLE_CTRL(i));
579*4882a593Smuzhiyun 		val |= EIP197_RDR_IRQ(i);
580*4882a593Smuzhiyun 		writel(val, EIP197_HIA_AIC_R(priv) + EIP197_HIA_AIC_R_ENABLE_CTRL(i));
581*4882a593Smuzhiyun 	}
582*4882a593Smuzhiyun 
583*4882a593Smuzhiyun 	return 0;
584*4882a593Smuzhiyun }
585*4882a593Smuzhiyun 
safexcel_hw_init(struct safexcel_crypto_priv * priv)586*4882a593Smuzhiyun static int safexcel_hw_init(struct safexcel_crypto_priv *priv)
587*4882a593Smuzhiyun {
588*4882a593Smuzhiyun 	u32 val;
589*4882a593Smuzhiyun 	int i, ret, pe, opbuflo, opbufhi;
590*4882a593Smuzhiyun 
591*4882a593Smuzhiyun 	dev_dbg(priv->dev, "HW init: using %d pipe(s) and %d ring(s)\n",
592*4882a593Smuzhiyun 		priv->config.pes, priv->config.rings);
593*4882a593Smuzhiyun 
594*4882a593Smuzhiyun 	/*
595*4882a593Smuzhiyun 	 * For EIP197's only set maximum number of TX commands to 2^5 = 32
596*4882a593Smuzhiyun 	 * Skip for the EIP97 as it does not have this field.
597*4882a593Smuzhiyun 	 */
598*4882a593Smuzhiyun 	if (priv->flags & SAFEXCEL_HW_EIP197) {
599*4882a593Smuzhiyun 		val = readl(EIP197_HIA_AIC(priv) + EIP197_HIA_MST_CTRL);
600*4882a593Smuzhiyun 		val |= EIP197_MST_CTRL_TX_MAX_CMD(5);
601*4882a593Smuzhiyun 		writel(val, EIP197_HIA_AIC(priv) + EIP197_HIA_MST_CTRL);
602*4882a593Smuzhiyun 	}
603*4882a593Smuzhiyun 
604*4882a593Smuzhiyun 	/* Configure wr/rd cache values */
605*4882a593Smuzhiyun 	writel(EIP197_MST_CTRL_RD_CACHE(RD_CACHE_4BITS) |
606*4882a593Smuzhiyun 	       EIP197_MST_CTRL_WD_CACHE(WR_CACHE_4BITS),
607*4882a593Smuzhiyun 	       EIP197_HIA_GEN_CFG(priv) + EIP197_MST_CTRL);
608*4882a593Smuzhiyun 
609*4882a593Smuzhiyun 	/* Interrupts reset */
610*4882a593Smuzhiyun 
611*4882a593Smuzhiyun 	/* Disable all global interrupts */
612*4882a593Smuzhiyun 	writel(0, EIP197_HIA_AIC_G(priv) + EIP197_HIA_AIC_G_ENABLE_CTRL);
613*4882a593Smuzhiyun 
614*4882a593Smuzhiyun 	/* Clear any pending interrupt */
615*4882a593Smuzhiyun 	writel(GENMASK(31, 0), EIP197_HIA_AIC_G(priv) + EIP197_HIA_AIC_G_ACK);
616*4882a593Smuzhiyun 
617*4882a593Smuzhiyun 	/* Processing Engine configuration */
618*4882a593Smuzhiyun 	for (pe = 0; pe < priv->config.pes; pe++) {
619*4882a593Smuzhiyun 		/* Data Fetch Engine configuration */
620*4882a593Smuzhiyun 
621*4882a593Smuzhiyun 		/* Reset all DFE threads */
622*4882a593Smuzhiyun 		writel(EIP197_DxE_THR_CTRL_RESET_PE,
623*4882a593Smuzhiyun 		       EIP197_HIA_DFE_THR(priv) + EIP197_HIA_DFE_THR_CTRL(pe));
624*4882a593Smuzhiyun 
625*4882a593Smuzhiyun 		if (priv->flags & EIP197_PE_ARB)
626*4882a593Smuzhiyun 			/* Reset HIA input interface arbiter (if present) */
627*4882a593Smuzhiyun 			writel(EIP197_HIA_RA_PE_CTRL_RESET,
628*4882a593Smuzhiyun 			       EIP197_HIA_AIC(priv) + EIP197_HIA_RA_PE_CTRL(pe));
629*4882a593Smuzhiyun 
630*4882a593Smuzhiyun 		/* DMA transfer size to use */
631*4882a593Smuzhiyun 		val = EIP197_HIA_DFE_CFG_DIS_DEBUG;
632*4882a593Smuzhiyun 		val |= EIP197_HIA_DxE_CFG_MIN_DATA_SIZE(6) |
633*4882a593Smuzhiyun 		       EIP197_HIA_DxE_CFG_MAX_DATA_SIZE(9);
634*4882a593Smuzhiyun 		val |= EIP197_HIA_DxE_CFG_MIN_CTRL_SIZE(6) |
635*4882a593Smuzhiyun 		       EIP197_HIA_DxE_CFG_MAX_CTRL_SIZE(7);
636*4882a593Smuzhiyun 		val |= EIP197_HIA_DxE_CFG_DATA_CACHE_CTRL(RD_CACHE_3BITS);
637*4882a593Smuzhiyun 		val |= EIP197_HIA_DxE_CFG_CTRL_CACHE_CTRL(RD_CACHE_3BITS);
638*4882a593Smuzhiyun 		writel(val, EIP197_HIA_DFE(priv) + EIP197_HIA_DFE_CFG(pe));
639*4882a593Smuzhiyun 
640*4882a593Smuzhiyun 		/* Leave the DFE threads reset state */
641*4882a593Smuzhiyun 		writel(0, EIP197_HIA_DFE_THR(priv) + EIP197_HIA_DFE_THR_CTRL(pe));
642*4882a593Smuzhiyun 
643*4882a593Smuzhiyun 		/* Configure the processing engine thresholds */
644*4882a593Smuzhiyun 		writel(EIP197_PE_IN_xBUF_THRES_MIN(6) |
645*4882a593Smuzhiyun 		       EIP197_PE_IN_xBUF_THRES_MAX(9),
646*4882a593Smuzhiyun 		       EIP197_PE(priv) + EIP197_PE_IN_DBUF_THRES(pe));
647*4882a593Smuzhiyun 		writel(EIP197_PE_IN_xBUF_THRES_MIN(6) |
648*4882a593Smuzhiyun 		       EIP197_PE_IN_xBUF_THRES_MAX(7),
649*4882a593Smuzhiyun 		       EIP197_PE(priv) + EIP197_PE_IN_TBUF_THRES(pe));
650*4882a593Smuzhiyun 
651*4882a593Smuzhiyun 		if (priv->flags & SAFEXCEL_HW_EIP197)
652*4882a593Smuzhiyun 			/* enable HIA input interface arbiter and rings */
653*4882a593Smuzhiyun 			writel(EIP197_HIA_RA_PE_CTRL_EN |
654*4882a593Smuzhiyun 			       GENMASK(priv->config.rings - 1, 0),
655*4882a593Smuzhiyun 			       EIP197_HIA_AIC(priv) + EIP197_HIA_RA_PE_CTRL(pe));
656*4882a593Smuzhiyun 
657*4882a593Smuzhiyun 		/* Data Store Engine configuration */
658*4882a593Smuzhiyun 
659*4882a593Smuzhiyun 		/* Reset all DSE threads */
660*4882a593Smuzhiyun 		writel(EIP197_DxE_THR_CTRL_RESET_PE,
661*4882a593Smuzhiyun 		       EIP197_HIA_DSE_THR(priv) + EIP197_HIA_DSE_THR_CTRL(pe));
662*4882a593Smuzhiyun 
663*4882a593Smuzhiyun 		/* Wait for all DSE threads to complete */
664*4882a593Smuzhiyun 		while ((readl(EIP197_HIA_DSE_THR(priv) + EIP197_HIA_DSE_THR_STAT(pe)) &
665*4882a593Smuzhiyun 			GENMASK(15, 12)) != GENMASK(15, 12))
666*4882a593Smuzhiyun 			;
667*4882a593Smuzhiyun 
668*4882a593Smuzhiyun 		/* DMA transfer size to use */
669*4882a593Smuzhiyun 		if (priv->hwconfig.hwnumpes > 4) {
670*4882a593Smuzhiyun 			opbuflo = 9;
671*4882a593Smuzhiyun 			opbufhi = 10;
672*4882a593Smuzhiyun 		} else {
673*4882a593Smuzhiyun 			opbuflo = 7;
674*4882a593Smuzhiyun 			opbufhi = 8;
675*4882a593Smuzhiyun 		}
676*4882a593Smuzhiyun 		val = EIP197_HIA_DSE_CFG_DIS_DEBUG;
677*4882a593Smuzhiyun 		val |= EIP197_HIA_DxE_CFG_MIN_DATA_SIZE(opbuflo) |
678*4882a593Smuzhiyun 		       EIP197_HIA_DxE_CFG_MAX_DATA_SIZE(opbufhi);
679*4882a593Smuzhiyun 		val |= EIP197_HIA_DxE_CFG_DATA_CACHE_CTRL(WR_CACHE_3BITS);
680*4882a593Smuzhiyun 		val |= EIP197_HIA_DSE_CFG_ALWAYS_BUFFERABLE;
681*4882a593Smuzhiyun 		/* FIXME: instability issues can occur for EIP97 but disabling
682*4882a593Smuzhiyun 		 * it impacts performance.
683*4882a593Smuzhiyun 		 */
684*4882a593Smuzhiyun 		if (priv->flags & SAFEXCEL_HW_EIP197)
685*4882a593Smuzhiyun 			val |= EIP197_HIA_DSE_CFG_EN_SINGLE_WR;
686*4882a593Smuzhiyun 		writel(val, EIP197_HIA_DSE(priv) + EIP197_HIA_DSE_CFG(pe));
687*4882a593Smuzhiyun 
688*4882a593Smuzhiyun 		/* Leave the DSE threads reset state */
689*4882a593Smuzhiyun 		writel(0, EIP197_HIA_DSE_THR(priv) + EIP197_HIA_DSE_THR_CTRL(pe));
690*4882a593Smuzhiyun 
691*4882a593Smuzhiyun 		/* Configure the procesing engine thresholds */
692*4882a593Smuzhiyun 		writel(EIP197_PE_OUT_DBUF_THRES_MIN(opbuflo) |
693*4882a593Smuzhiyun 		       EIP197_PE_OUT_DBUF_THRES_MAX(opbufhi),
694*4882a593Smuzhiyun 		       EIP197_PE(priv) + EIP197_PE_OUT_DBUF_THRES(pe));
695*4882a593Smuzhiyun 
696*4882a593Smuzhiyun 		/* Processing Engine configuration */
697*4882a593Smuzhiyun 
698*4882a593Smuzhiyun 		/* Token & context configuration */
699*4882a593Smuzhiyun 		val = EIP197_PE_EIP96_TOKEN_CTRL_CTX_UPDATES |
700*4882a593Smuzhiyun 		      EIP197_PE_EIP96_TOKEN_CTRL_NO_TOKEN_WAIT |
701*4882a593Smuzhiyun 		      EIP197_PE_EIP96_TOKEN_CTRL_ENABLE_TIMEOUT;
702*4882a593Smuzhiyun 		writel(val, EIP197_PE(priv) + EIP197_PE_EIP96_TOKEN_CTRL(pe));
703*4882a593Smuzhiyun 
704*4882a593Smuzhiyun 		/* H/W capabilities selection: just enable everything */
705*4882a593Smuzhiyun 		writel(EIP197_FUNCTION_ALL,
706*4882a593Smuzhiyun 		       EIP197_PE(priv) + EIP197_PE_EIP96_FUNCTION_EN(pe));
707*4882a593Smuzhiyun 		writel(EIP197_FUNCTION_ALL,
708*4882a593Smuzhiyun 		       EIP197_PE(priv) + EIP197_PE_EIP96_FUNCTION2_EN(pe));
709*4882a593Smuzhiyun 	}
710*4882a593Smuzhiyun 
711*4882a593Smuzhiyun 	/* Command Descriptor Rings prepare */
712*4882a593Smuzhiyun 	for (i = 0; i < priv->config.rings; i++) {
713*4882a593Smuzhiyun 		/* Clear interrupts for this ring */
714*4882a593Smuzhiyun 		writel(GENMASK(31, 0),
715*4882a593Smuzhiyun 		       EIP197_HIA_AIC_R(priv) + EIP197_HIA_AIC_R_ENABLE_CLR(i));
716*4882a593Smuzhiyun 
717*4882a593Smuzhiyun 		/* Disable external triggering */
718*4882a593Smuzhiyun 		writel(0, EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_CFG);
719*4882a593Smuzhiyun 
720*4882a593Smuzhiyun 		/* Clear the pending prepared counter */
721*4882a593Smuzhiyun 		writel(EIP197_xDR_PREP_CLR_COUNT,
722*4882a593Smuzhiyun 		       EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_PREP_COUNT);
723*4882a593Smuzhiyun 
724*4882a593Smuzhiyun 		/* Clear the pending processed counter */
725*4882a593Smuzhiyun 		writel(EIP197_xDR_PROC_CLR_COUNT,
726*4882a593Smuzhiyun 		       EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_PROC_COUNT);
727*4882a593Smuzhiyun 
728*4882a593Smuzhiyun 		writel(0,
729*4882a593Smuzhiyun 		       EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_PREP_PNTR);
730*4882a593Smuzhiyun 		writel(0,
731*4882a593Smuzhiyun 		       EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_PROC_PNTR);
732*4882a593Smuzhiyun 
733*4882a593Smuzhiyun 		writel((EIP197_DEFAULT_RING_SIZE * priv->config.cd_offset),
734*4882a593Smuzhiyun 		       EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_RING_SIZE);
735*4882a593Smuzhiyun 	}
736*4882a593Smuzhiyun 
737*4882a593Smuzhiyun 	/* Result Descriptor Ring prepare */
738*4882a593Smuzhiyun 	for (i = 0; i < priv->config.rings; i++) {
739*4882a593Smuzhiyun 		/* Disable external triggering*/
740*4882a593Smuzhiyun 		writel(0, EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_CFG);
741*4882a593Smuzhiyun 
742*4882a593Smuzhiyun 		/* Clear the pending prepared counter */
743*4882a593Smuzhiyun 		writel(EIP197_xDR_PREP_CLR_COUNT,
744*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_PREP_COUNT);
745*4882a593Smuzhiyun 
746*4882a593Smuzhiyun 		/* Clear the pending processed counter */
747*4882a593Smuzhiyun 		writel(EIP197_xDR_PROC_CLR_COUNT,
748*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_PROC_COUNT);
749*4882a593Smuzhiyun 
750*4882a593Smuzhiyun 		writel(0,
751*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_PREP_PNTR);
752*4882a593Smuzhiyun 		writel(0,
753*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_PROC_PNTR);
754*4882a593Smuzhiyun 
755*4882a593Smuzhiyun 		/* Ring size */
756*4882a593Smuzhiyun 		writel((EIP197_DEFAULT_RING_SIZE * priv->config.rd_offset),
757*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_RING_SIZE);
758*4882a593Smuzhiyun 	}
759*4882a593Smuzhiyun 
760*4882a593Smuzhiyun 	for (pe = 0; pe < priv->config.pes; pe++) {
761*4882a593Smuzhiyun 		/* Enable command descriptor rings */
762*4882a593Smuzhiyun 		writel(EIP197_DxE_THR_CTRL_EN | GENMASK(priv->config.rings - 1, 0),
763*4882a593Smuzhiyun 		       EIP197_HIA_DFE_THR(priv) + EIP197_HIA_DFE_THR_CTRL(pe));
764*4882a593Smuzhiyun 
765*4882a593Smuzhiyun 		/* Enable result descriptor rings */
766*4882a593Smuzhiyun 		writel(EIP197_DxE_THR_CTRL_EN | GENMASK(priv->config.rings - 1, 0),
767*4882a593Smuzhiyun 		       EIP197_HIA_DSE_THR(priv) + EIP197_HIA_DSE_THR_CTRL(pe));
768*4882a593Smuzhiyun 	}
769*4882a593Smuzhiyun 
770*4882a593Smuzhiyun 	/* Clear any HIA interrupt */
771*4882a593Smuzhiyun 	writel(GENMASK(30, 20), EIP197_HIA_AIC_G(priv) + EIP197_HIA_AIC_G_ACK);
772*4882a593Smuzhiyun 
773*4882a593Smuzhiyun 	if (priv->flags & EIP197_SIMPLE_TRC) {
774*4882a593Smuzhiyun 		writel(EIP197_STRC_CONFIG_INIT |
775*4882a593Smuzhiyun 		       EIP197_STRC_CONFIG_LARGE_REC(EIP197_CS_TRC_REC_WC) |
776*4882a593Smuzhiyun 		       EIP197_STRC_CONFIG_SMALL_REC(EIP197_CS_TRC_REC_WC),
777*4882a593Smuzhiyun 		       priv->base + EIP197_STRC_CONFIG);
778*4882a593Smuzhiyun 		writel(EIP197_PE_EIP96_TOKEN_CTRL2_CTX_DONE,
779*4882a593Smuzhiyun 		       EIP197_PE(priv) + EIP197_PE_EIP96_TOKEN_CTRL2(0));
780*4882a593Smuzhiyun 	} else if (priv->flags & SAFEXCEL_HW_EIP197) {
781*4882a593Smuzhiyun 		ret = eip197_trc_cache_init(priv);
782*4882a593Smuzhiyun 		if (ret)
783*4882a593Smuzhiyun 			return ret;
784*4882a593Smuzhiyun 	}
785*4882a593Smuzhiyun 
786*4882a593Smuzhiyun 	if (priv->flags & EIP197_ICE) {
787*4882a593Smuzhiyun 		ret = eip197_load_firmwares(priv);
788*4882a593Smuzhiyun 		if (ret)
789*4882a593Smuzhiyun 			return ret;
790*4882a593Smuzhiyun 	}
791*4882a593Smuzhiyun 
792*4882a593Smuzhiyun 	return safexcel_hw_setup_cdesc_rings(priv) ?:
793*4882a593Smuzhiyun 	       safexcel_hw_setup_rdesc_rings(priv) ?:
794*4882a593Smuzhiyun 	       0;
795*4882a593Smuzhiyun }
796*4882a593Smuzhiyun 
797*4882a593Smuzhiyun /* Called with ring's lock taken */
safexcel_try_push_requests(struct safexcel_crypto_priv * priv,int ring)798*4882a593Smuzhiyun static void safexcel_try_push_requests(struct safexcel_crypto_priv *priv,
799*4882a593Smuzhiyun 				       int ring)
800*4882a593Smuzhiyun {
801*4882a593Smuzhiyun 	int coal = min_t(int, priv->ring[ring].requests, EIP197_MAX_BATCH_SZ);
802*4882a593Smuzhiyun 
803*4882a593Smuzhiyun 	if (!coal)
804*4882a593Smuzhiyun 		return;
805*4882a593Smuzhiyun 
806*4882a593Smuzhiyun 	/* Configure when we want an interrupt */
807*4882a593Smuzhiyun 	writel(EIP197_HIA_RDR_THRESH_PKT_MODE |
808*4882a593Smuzhiyun 	       EIP197_HIA_RDR_THRESH_PROC_PKT(coal),
809*4882a593Smuzhiyun 	       EIP197_HIA_RDR(priv, ring) + EIP197_HIA_xDR_THRESH);
810*4882a593Smuzhiyun }
811*4882a593Smuzhiyun 
safexcel_dequeue(struct safexcel_crypto_priv * priv,int ring)812*4882a593Smuzhiyun void safexcel_dequeue(struct safexcel_crypto_priv *priv, int ring)
813*4882a593Smuzhiyun {
814*4882a593Smuzhiyun 	struct crypto_async_request *req, *backlog;
815*4882a593Smuzhiyun 	struct safexcel_context *ctx;
816*4882a593Smuzhiyun 	int ret, nreq = 0, cdesc = 0, rdesc = 0, commands, results;
817*4882a593Smuzhiyun 
818*4882a593Smuzhiyun 	/* If a request wasn't properly dequeued because of a lack of resources,
819*4882a593Smuzhiyun 	 * proceeded it first,
820*4882a593Smuzhiyun 	 */
821*4882a593Smuzhiyun 	req = priv->ring[ring].req;
822*4882a593Smuzhiyun 	backlog = priv->ring[ring].backlog;
823*4882a593Smuzhiyun 	if (req)
824*4882a593Smuzhiyun 		goto handle_req;
825*4882a593Smuzhiyun 
826*4882a593Smuzhiyun 	while (true) {
827*4882a593Smuzhiyun 		spin_lock_bh(&priv->ring[ring].queue_lock);
828*4882a593Smuzhiyun 		backlog = crypto_get_backlog(&priv->ring[ring].queue);
829*4882a593Smuzhiyun 		req = crypto_dequeue_request(&priv->ring[ring].queue);
830*4882a593Smuzhiyun 		spin_unlock_bh(&priv->ring[ring].queue_lock);
831*4882a593Smuzhiyun 
832*4882a593Smuzhiyun 		if (!req) {
833*4882a593Smuzhiyun 			priv->ring[ring].req = NULL;
834*4882a593Smuzhiyun 			priv->ring[ring].backlog = NULL;
835*4882a593Smuzhiyun 			goto finalize;
836*4882a593Smuzhiyun 		}
837*4882a593Smuzhiyun 
838*4882a593Smuzhiyun handle_req:
839*4882a593Smuzhiyun 		ctx = crypto_tfm_ctx(req->tfm);
840*4882a593Smuzhiyun 		ret = ctx->send(req, ring, &commands, &results);
841*4882a593Smuzhiyun 		if (ret)
842*4882a593Smuzhiyun 			goto request_failed;
843*4882a593Smuzhiyun 
844*4882a593Smuzhiyun 		if (backlog)
845*4882a593Smuzhiyun 			backlog->complete(backlog, -EINPROGRESS);
846*4882a593Smuzhiyun 
847*4882a593Smuzhiyun 		/* In case the send() helper did not issue any command to push
848*4882a593Smuzhiyun 		 * to the engine because the input data was cached, continue to
849*4882a593Smuzhiyun 		 * dequeue other requests as this is valid and not an error.
850*4882a593Smuzhiyun 		 */
851*4882a593Smuzhiyun 		if (!commands && !results)
852*4882a593Smuzhiyun 			continue;
853*4882a593Smuzhiyun 
854*4882a593Smuzhiyun 		cdesc += commands;
855*4882a593Smuzhiyun 		rdesc += results;
856*4882a593Smuzhiyun 		nreq++;
857*4882a593Smuzhiyun 	}
858*4882a593Smuzhiyun 
859*4882a593Smuzhiyun request_failed:
860*4882a593Smuzhiyun 	/* Not enough resources to handle all the requests. Bail out and save
861*4882a593Smuzhiyun 	 * the request and the backlog for the next dequeue call (per-ring).
862*4882a593Smuzhiyun 	 */
863*4882a593Smuzhiyun 	priv->ring[ring].req = req;
864*4882a593Smuzhiyun 	priv->ring[ring].backlog = backlog;
865*4882a593Smuzhiyun 
866*4882a593Smuzhiyun finalize:
867*4882a593Smuzhiyun 	if (!nreq)
868*4882a593Smuzhiyun 		return;
869*4882a593Smuzhiyun 
870*4882a593Smuzhiyun 	spin_lock_bh(&priv->ring[ring].lock);
871*4882a593Smuzhiyun 
872*4882a593Smuzhiyun 	priv->ring[ring].requests += nreq;
873*4882a593Smuzhiyun 
874*4882a593Smuzhiyun 	if (!priv->ring[ring].busy) {
875*4882a593Smuzhiyun 		safexcel_try_push_requests(priv, ring);
876*4882a593Smuzhiyun 		priv->ring[ring].busy = true;
877*4882a593Smuzhiyun 	}
878*4882a593Smuzhiyun 
879*4882a593Smuzhiyun 	spin_unlock_bh(&priv->ring[ring].lock);
880*4882a593Smuzhiyun 
881*4882a593Smuzhiyun 	/* let the RDR know we have pending descriptors */
882*4882a593Smuzhiyun 	writel((rdesc * priv->config.rd_offset),
883*4882a593Smuzhiyun 	       EIP197_HIA_RDR(priv, ring) + EIP197_HIA_xDR_PREP_COUNT);
884*4882a593Smuzhiyun 
885*4882a593Smuzhiyun 	/* let the CDR know we have pending descriptors */
886*4882a593Smuzhiyun 	writel((cdesc * priv->config.cd_offset),
887*4882a593Smuzhiyun 	       EIP197_HIA_CDR(priv, ring) + EIP197_HIA_xDR_PREP_COUNT);
888*4882a593Smuzhiyun }
889*4882a593Smuzhiyun 
safexcel_rdesc_check_errors(struct safexcel_crypto_priv * priv,void * rdp)890*4882a593Smuzhiyun inline int safexcel_rdesc_check_errors(struct safexcel_crypto_priv *priv,
891*4882a593Smuzhiyun 				       void *rdp)
892*4882a593Smuzhiyun {
893*4882a593Smuzhiyun 	struct safexcel_result_desc *rdesc = rdp;
894*4882a593Smuzhiyun 	struct result_data_desc *result_data = rdp + priv->config.res_offset;
895*4882a593Smuzhiyun 
896*4882a593Smuzhiyun 	if (likely((!rdesc->last_seg) || /* Rest only valid if last seg! */
897*4882a593Smuzhiyun 		   ((!rdesc->descriptor_overflow) &&
898*4882a593Smuzhiyun 		    (!rdesc->buffer_overflow) &&
899*4882a593Smuzhiyun 		    (!result_data->error_code))))
900*4882a593Smuzhiyun 		return 0;
901*4882a593Smuzhiyun 
902*4882a593Smuzhiyun 	if (rdesc->descriptor_overflow)
903*4882a593Smuzhiyun 		dev_err(priv->dev, "Descriptor overflow detected");
904*4882a593Smuzhiyun 
905*4882a593Smuzhiyun 	if (rdesc->buffer_overflow)
906*4882a593Smuzhiyun 		dev_err(priv->dev, "Buffer overflow detected");
907*4882a593Smuzhiyun 
908*4882a593Smuzhiyun 	if (result_data->error_code & 0x4066) {
909*4882a593Smuzhiyun 		/* Fatal error (bits 1,2,5,6 & 14) */
910*4882a593Smuzhiyun 		dev_err(priv->dev,
911*4882a593Smuzhiyun 			"result descriptor error (%x)",
912*4882a593Smuzhiyun 			result_data->error_code);
913*4882a593Smuzhiyun 
914*4882a593Smuzhiyun 		return -EIO;
915*4882a593Smuzhiyun 	} else if (result_data->error_code &
916*4882a593Smuzhiyun 		   (BIT(7) | BIT(4) | BIT(3) | BIT(0))) {
917*4882a593Smuzhiyun 		/*
918*4882a593Smuzhiyun 		 * Give priority over authentication fails:
919*4882a593Smuzhiyun 		 * Blocksize, length & overflow errors,
920*4882a593Smuzhiyun 		 * something wrong with the input!
921*4882a593Smuzhiyun 		 */
922*4882a593Smuzhiyun 		return -EINVAL;
923*4882a593Smuzhiyun 	} else if (result_data->error_code & BIT(9)) {
924*4882a593Smuzhiyun 		/* Authentication failed */
925*4882a593Smuzhiyun 		return -EBADMSG;
926*4882a593Smuzhiyun 	}
927*4882a593Smuzhiyun 
928*4882a593Smuzhiyun 	/* All other non-fatal errors */
929*4882a593Smuzhiyun 	return -EINVAL;
930*4882a593Smuzhiyun }
931*4882a593Smuzhiyun 
safexcel_rdr_req_set(struct safexcel_crypto_priv * priv,int ring,struct safexcel_result_desc * rdesc,struct crypto_async_request * req)932*4882a593Smuzhiyun inline void safexcel_rdr_req_set(struct safexcel_crypto_priv *priv,
933*4882a593Smuzhiyun 				 int ring,
934*4882a593Smuzhiyun 				 struct safexcel_result_desc *rdesc,
935*4882a593Smuzhiyun 				 struct crypto_async_request *req)
936*4882a593Smuzhiyun {
937*4882a593Smuzhiyun 	int i = safexcel_ring_rdr_rdesc_index(priv, ring, rdesc);
938*4882a593Smuzhiyun 
939*4882a593Smuzhiyun 	priv->ring[ring].rdr_req[i] = req;
940*4882a593Smuzhiyun }
941*4882a593Smuzhiyun 
942*4882a593Smuzhiyun inline struct crypto_async_request *
safexcel_rdr_req_get(struct safexcel_crypto_priv * priv,int ring)943*4882a593Smuzhiyun safexcel_rdr_req_get(struct safexcel_crypto_priv *priv, int ring)
944*4882a593Smuzhiyun {
945*4882a593Smuzhiyun 	int i = safexcel_ring_first_rdr_index(priv, ring);
946*4882a593Smuzhiyun 
947*4882a593Smuzhiyun 	return priv->ring[ring].rdr_req[i];
948*4882a593Smuzhiyun }
949*4882a593Smuzhiyun 
safexcel_complete(struct safexcel_crypto_priv * priv,int ring)950*4882a593Smuzhiyun void safexcel_complete(struct safexcel_crypto_priv *priv, int ring)
951*4882a593Smuzhiyun {
952*4882a593Smuzhiyun 	struct safexcel_command_desc *cdesc;
953*4882a593Smuzhiyun 
954*4882a593Smuzhiyun 	/* Acknowledge the command descriptors */
955*4882a593Smuzhiyun 	do {
956*4882a593Smuzhiyun 		cdesc = safexcel_ring_next_rptr(priv, &priv->ring[ring].cdr);
957*4882a593Smuzhiyun 		if (IS_ERR(cdesc)) {
958*4882a593Smuzhiyun 			dev_err(priv->dev,
959*4882a593Smuzhiyun 				"Could not retrieve the command descriptor\n");
960*4882a593Smuzhiyun 			return;
961*4882a593Smuzhiyun 		}
962*4882a593Smuzhiyun 	} while (!cdesc->last_seg);
963*4882a593Smuzhiyun }
964*4882a593Smuzhiyun 
safexcel_inv_complete(struct crypto_async_request * req,int error)965*4882a593Smuzhiyun void safexcel_inv_complete(struct crypto_async_request *req, int error)
966*4882a593Smuzhiyun {
967*4882a593Smuzhiyun 	struct safexcel_inv_result *result = req->data;
968*4882a593Smuzhiyun 
969*4882a593Smuzhiyun 	if (error == -EINPROGRESS)
970*4882a593Smuzhiyun 		return;
971*4882a593Smuzhiyun 
972*4882a593Smuzhiyun 	result->error = error;
973*4882a593Smuzhiyun 	complete(&result->completion);
974*4882a593Smuzhiyun }
975*4882a593Smuzhiyun 
safexcel_invalidate_cache(struct crypto_async_request * async,struct safexcel_crypto_priv * priv,dma_addr_t ctxr_dma,int ring)976*4882a593Smuzhiyun int safexcel_invalidate_cache(struct crypto_async_request *async,
977*4882a593Smuzhiyun 			      struct safexcel_crypto_priv *priv,
978*4882a593Smuzhiyun 			      dma_addr_t ctxr_dma, int ring)
979*4882a593Smuzhiyun {
980*4882a593Smuzhiyun 	struct safexcel_command_desc *cdesc;
981*4882a593Smuzhiyun 	struct safexcel_result_desc *rdesc;
982*4882a593Smuzhiyun 	struct safexcel_token  *dmmy;
983*4882a593Smuzhiyun 	int ret = 0;
984*4882a593Smuzhiyun 
985*4882a593Smuzhiyun 	/* Prepare command descriptor */
986*4882a593Smuzhiyun 	cdesc = safexcel_add_cdesc(priv, ring, true, true, 0, 0, 0, ctxr_dma,
987*4882a593Smuzhiyun 				   &dmmy);
988*4882a593Smuzhiyun 	if (IS_ERR(cdesc))
989*4882a593Smuzhiyun 		return PTR_ERR(cdesc);
990*4882a593Smuzhiyun 
991*4882a593Smuzhiyun 	cdesc->control_data.type = EIP197_TYPE_EXTENDED;
992*4882a593Smuzhiyun 	cdesc->control_data.options = 0;
993*4882a593Smuzhiyun 	cdesc->control_data.context_lo &= ~EIP197_CONTEXT_SIZE_MASK;
994*4882a593Smuzhiyun 	cdesc->control_data.control0 = CONTEXT_CONTROL_INV_TR;
995*4882a593Smuzhiyun 
996*4882a593Smuzhiyun 	/* Prepare result descriptor */
997*4882a593Smuzhiyun 	rdesc = safexcel_add_rdesc(priv, ring, true, true, 0, 0);
998*4882a593Smuzhiyun 
999*4882a593Smuzhiyun 	if (IS_ERR(rdesc)) {
1000*4882a593Smuzhiyun 		ret = PTR_ERR(rdesc);
1001*4882a593Smuzhiyun 		goto cdesc_rollback;
1002*4882a593Smuzhiyun 	}
1003*4882a593Smuzhiyun 
1004*4882a593Smuzhiyun 	safexcel_rdr_req_set(priv, ring, rdesc, async);
1005*4882a593Smuzhiyun 
1006*4882a593Smuzhiyun 	return ret;
1007*4882a593Smuzhiyun 
1008*4882a593Smuzhiyun cdesc_rollback:
1009*4882a593Smuzhiyun 	safexcel_ring_rollback_wptr(priv, &priv->ring[ring].cdr);
1010*4882a593Smuzhiyun 
1011*4882a593Smuzhiyun 	return ret;
1012*4882a593Smuzhiyun }
1013*4882a593Smuzhiyun 
safexcel_handle_result_descriptor(struct safexcel_crypto_priv * priv,int ring)1014*4882a593Smuzhiyun static inline void safexcel_handle_result_descriptor(struct safexcel_crypto_priv *priv,
1015*4882a593Smuzhiyun 						     int ring)
1016*4882a593Smuzhiyun {
1017*4882a593Smuzhiyun 	struct crypto_async_request *req;
1018*4882a593Smuzhiyun 	struct safexcel_context *ctx;
1019*4882a593Smuzhiyun 	int ret, i, nreq, ndesc, tot_descs, handled = 0;
1020*4882a593Smuzhiyun 	bool should_complete;
1021*4882a593Smuzhiyun 
1022*4882a593Smuzhiyun handle_results:
1023*4882a593Smuzhiyun 	tot_descs = 0;
1024*4882a593Smuzhiyun 
1025*4882a593Smuzhiyun 	nreq = readl(EIP197_HIA_RDR(priv, ring) + EIP197_HIA_xDR_PROC_COUNT);
1026*4882a593Smuzhiyun 	nreq >>= EIP197_xDR_PROC_xD_PKT_OFFSET;
1027*4882a593Smuzhiyun 	nreq &= EIP197_xDR_PROC_xD_PKT_MASK;
1028*4882a593Smuzhiyun 	if (!nreq)
1029*4882a593Smuzhiyun 		goto requests_left;
1030*4882a593Smuzhiyun 
1031*4882a593Smuzhiyun 	for (i = 0; i < nreq; i++) {
1032*4882a593Smuzhiyun 		req = safexcel_rdr_req_get(priv, ring);
1033*4882a593Smuzhiyun 
1034*4882a593Smuzhiyun 		ctx = crypto_tfm_ctx(req->tfm);
1035*4882a593Smuzhiyun 		ndesc = ctx->handle_result(priv, ring, req,
1036*4882a593Smuzhiyun 					   &should_complete, &ret);
1037*4882a593Smuzhiyun 		if (ndesc < 0) {
1038*4882a593Smuzhiyun 			dev_err(priv->dev, "failed to handle result (%d)\n",
1039*4882a593Smuzhiyun 				ndesc);
1040*4882a593Smuzhiyun 			goto acknowledge;
1041*4882a593Smuzhiyun 		}
1042*4882a593Smuzhiyun 
1043*4882a593Smuzhiyun 		if (should_complete) {
1044*4882a593Smuzhiyun 			local_bh_disable();
1045*4882a593Smuzhiyun 			req->complete(req, ret);
1046*4882a593Smuzhiyun 			local_bh_enable();
1047*4882a593Smuzhiyun 		}
1048*4882a593Smuzhiyun 
1049*4882a593Smuzhiyun 		tot_descs += ndesc;
1050*4882a593Smuzhiyun 		handled++;
1051*4882a593Smuzhiyun 	}
1052*4882a593Smuzhiyun 
1053*4882a593Smuzhiyun acknowledge:
1054*4882a593Smuzhiyun 	if (i)
1055*4882a593Smuzhiyun 		writel(EIP197_xDR_PROC_xD_PKT(i) |
1056*4882a593Smuzhiyun 		       (tot_descs * priv->config.rd_offset),
1057*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, ring) + EIP197_HIA_xDR_PROC_COUNT);
1058*4882a593Smuzhiyun 
1059*4882a593Smuzhiyun 	/* If the number of requests overflowed the counter, try to proceed more
1060*4882a593Smuzhiyun 	 * requests.
1061*4882a593Smuzhiyun 	 */
1062*4882a593Smuzhiyun 	if (nreq == EIP197_xDR_PROC_xD_PKT_MASK)
1063*4882a593Smuzhiyun 		goto handle_results;
1064*4882a593Smuzhiyun 
1065*4882a593Smuzhiyun requests_left:
1066*4882a593Smuzhiyun 	spin_lock_bh(&priv->ring[ring].lock);
1067*4882a593Smuzhiyun 
1068*4882a593Smuzhiyun 	priv->ring[ring].requests -= handled;
1069*4882a593Smuzhiyun 	safexcel_try_push_requests(priv, ring);
1070*4882a593Smuzhiyun 
1071*4882a593Smuzhiyun 	if (!priv->ring[ring].requests)
1072*4882a593Smuzhiyun 		priv->ring[ring].busy = false;
1073*4882a593Smuzhiyun 
1074*4882a593Smuzhiyun 	spin_unlock_bh(&priv->ring[ring].lock);
1075*4882a593Smuzhiyun }
1076*4882a593Smuzhiyun 
safexcel_dequeue_work(struct work_struct * work)1077*4882a593Smuzhiyun static void safexcel_dequeue_work(struct work_struct *work)
1078*4882a593Smuzhiyun {
1079*4882a593Smuzhiyun 	struct safexcel_work_data *data =
1080*4882a593Smuzhiyun 			container_of(work, struct safexcel_work_data, work);
1081*4882a593Smuzhiyun 
1082*4882a593Smuzhiyun 	safexcel_dequeue(data->priv, data->ring);
1083*4882a593Smuzhiyun }
1084*4882a593Smuzhiyun 
1085*4882a593Smuzhiyun struct safexcel_ring_irq_data {
1086*4882a593Smuzhiyun 	struct safexcel_crypto_priv *priv;
1087*4882a593Smuzhiyun 	int ring;
1088*4882a593Smuzhiyun };
1089*4882a593Smuzhiyun 
safexcel_irq_ring(int irq,void * data)1090*4882a593Smuzhiyun static irqreturn_t safexcel_irq_ring(int irq, void *data)
1091*4882a593Smuzhiyun {
1092*4882a593Smuzhiyun 	struct safexcel_ring_irq_data *irq_data = data;
1093*4882a593Smuzhiyun 	struct safexcel_crypto_priv *priv = irq_data->priv;
1094*4882a593Smuzhiyun 	int ring = irq_data->ring, rc = IRQ_NONE;
1095*4882a593Smuzhiyun 	u32 status, stat;
1096*4882a593Smuzhiyun 
1097*4882a593Smuzhiyun 	status = readl(EIP197_HIA_AIC_R(priv) + EIP197_HIA_AIC_R_ENABLED_STAT(ring));
1098*4882a593Smuzhiyun 	if (!status)
1099*4882a593Smuzhiyun 		return rc;
1100*4882a593Smuzhiyun 
1101*4882a593Smuzhiyun 	/* RDR interrupts */
1102*4882a593Smuzhiyun 	if (status & EIP197_RDR_IRQ(ring)) {
1103*4882a593Smuzhiyun 		stat = readl(EIP197_HIA_RDR(priv, ring) + EIP197_HIA_xDR_STAT);
1104*4882a593Smuzhiyun 
1105*4882a593Smuzhiyun 		if (unlikely(stat & EIP197_xDR_ERR)) {
1106*4882a593Smuzhiyun 			/*
1107*4882a593Smuzhiyun 			 * Fatal error, the RDR is unusable and must be
1108*4882a593Smuzhiyun 			 * reinitialized. This should not happen under
1109*4882a593Smuzhiyun 			 * normal circumstances.
1110*4882a593Smuzhiyun 			 */
1111*4882a593Smuzhiyun 			dev_err(priv->dev, "RDR: fatal error.\n");
1112*4882a593Smuzhiyun 		} else if (likely(stat & EIP197_xDR_THRESH)) {
1113*4882a593Smuzhiyun 			rc = IRQ_WAKE_THREAD;
1114*4882a593Smuzhiyun 		}
1115*4882a593Smuzhiyun 
1116*4882a593Smuzhiyun 		/* ACK the interrupts */
1117*4882a593Smuzhiyun 		writel(stat & 0xff,
1118*4882a593Smuzhiyun 		       EIP197_HIA_RDR(priv, ring) + EIP197_HIA_xDR_STAT);
1119*4882a593Smuzhiyun 	}
1120*4882a593Smuzhiyun 
1121*4882a593Smuzhiyun 	/* ACK the interrupts */
1122*4882a593Smuzhiyun 	writel(status, EIP197_HIA_AIC_R(priv) + EIP197_HIA_AIC_R_ACK(ring));
1123*4882a593Smuzhiyun 
1124*4882a593Smuzhiyun 	return rc;
1125*4882a593Smuzhiyun }
1126*4882a593Smuzhiyun 
safexcel_irq_ring_thread(int irq,void * data)1127*4882a593Smuzhiyun static irqreturn_t safexcel_irq_ring_thread(int irq, void *data)
1128*4882a593Smuzhiyun {
1129*4882a593Smuzhiyun 	struct safexcel_ring_irq_data *irq_data = data;
1130*4882a593Smuzhiyun 	struct safexcel_crypto_priv *priv = irq_data->priv;
1131*4882a593Smuzhiyun 	int ring = irq_data->ring;
1132*4882a593Smuzhiyun 
1133*4882a593Smuzhiyun 	safexcel_handle_result_descriptor(priv, ring);
1134*4882a593Smuzhiyun 
1135*4882a593Smuzhiyun 	queue_work(priv->ring[ring].workqueue,
1136*4882a593Smuzhiyun 		   &priv->ring[ring].work_data.work);
1137*4882a593Smuzhiyun 
1138*4882a593Smuzhiyun 	return IRQ_HANDLED;
1139*4882a593Smuzhiyun }
1140*4882a593Smuzhiyun 
safexcel_request_ring_irq(void * pdev,int irqid,int is_pci_dev,int ring_id,irq_handler_t handler,irq_handler_t threaded_handler,struct safexcel_ring_irq_data * ring_irq_priv)1141*4882a593Smuzhiyun static int safexcel_request_ring_irq(void *pdev, int irqid,
1142*4882a593Smuzhiyun 				     int is_pci_dev,
1143*4882a593Smuzhiyun 				     int ring_id,
1144*4882a593Smuzhiyun 				     irq_handler_t handler,
1145*4882a593Smuzhiyun 				     irq_handler_t threaded_handler,
1146*4882a593Smuzhiyun 				     struct safexcel_ring_irq_data *ring_irq_priv)
1147*4882a593Smuzhiyun {
1148*4882a593Smuzhiyun 	int ret, irq, cpu;
1149*4882a593Smuzhiyun 	struct device *dev;
1150*4882a593Smuzhiyun 
1151*4882a593Smuzhiyun 	if (IS_ENABLED(CONFIG_PCI) && is_pci_dev) {
1152*4882a593Smuzhiyun 		struct pci_dev *pci_pdev = pdev;
1153*4882a593Smuzhiyun 
1154*4882a593Smuzhiyun 		dev = &pci_pdev->dev;
1155*4882a593Smuzhiyun 		irq = pci_irq_vector(pci_pdev, irqid);
1156*4882a593Smuzhiyun 		if (irq < 0) {
1157*4882a593Smuzhiyun 			dev_err(dev, "unable to get device MSI IRQ %d (err %d)\n",
1158*4882a593Smuzhiyun 				irqid, irq);
1159*4882a593Smuzhiyun 			return irq;
1160*4882a593Smuzhiyun 		}
1161*4882a593Smuzhiyun 	} else if (IS_ENABLED(CONFIG_OF)) {
1162*4882a593Smuzhiyun 		struct platform_device *plf_pdev = pdev;
1163*4882a593Smuzhiyun 		char irq_name[6] = {0}; /* "ringX\0" */
1164*4882a593Smuzhiyun 
1165*4882a593Smuzhiyun 		snprintf(irq_name, 6, "ring%d", irqid);
1166*4882a593Smuzhiyun 		dev = &plf_pdev->dev;
1167*4882a593Smuzhiyun 		irq = platform_get_irq_byname(plf_pdev, irq_name);
1168*4882a593Smuzhiyun 
1169*4882a593Smuzhiyun 		if (irq < 0) {
1170*4882a593Smuzhiyun 			dev_err(dev, "unable to get IRQ '%s' (err %d)\n",
1171*4882a593Smuzhiyun 				irq_name, irq);
1172*4882a593Smuzhiyun 			return irq;
1173*4882a593Smuzhiyun 		}
1174*4882a593Smuzhiyun 	} else {
1175*4882a593Smuzhiyun 		return -ENXIO;
1176*4882a593Smuzhiyun 	}
1177*4882a593Smuzhiyun 
1178*4882a593Smuzhiyun 	ret = devm_request_threaded_irq(dev, irq, handler,
1179*4882a593Smuzhiyun 					threaded_handler, IRQF_ONESHOT,
1180*4882a593Smuzhiyun 					dev_name(dev), ring_irq_priv);
1181*4882a593Smuzhiyun 	if (ret) {
1182*4882a593Smuzhiyun 		dev_err(dev, "unable to request IRQ %d\n", irq);
1183*4882a593Smuzhiyun 		return ret;
1184*4882a593Smuzhiyun 	}
1185*4882a593Smuzhiyun 
1186*4882a593Smuzhiyun 	/* Set affinity */
1187*4882a593Smuzhiyun 	cpu = cpumask_local_spread(ring_id, NUMA_NO_NODE);
1188*4882a593Smuzhiyun 	irq_set_affinity_hint(irq, get_cpu_mask(cpu));
1189*4882a593Smuzhiyun 
1190*4882a593Smuzhiyun 	return irq;
1191*4882a593Smuzhiyun }
1192*4882a593Smuzhiyun 
1193*4882a593Smuzhiyun static struct safexcel_alg_template *safexcel_algs[] = {
1194*4882a593Smuzhiyun 	&safexcel_alg_ecb_des,
1195*4882a593Smuzhiyun 	&safexcel_alg_cbc_des,
1196*4882a593Smuzhiyun 	&safexcel_alg_ecb_des3_ede,
1197*4882a593Smuzhiyun 	&safexcel_alg_cbc_des3_ede,
1198*4882a593Smuzhiyun 	&safexcel_alg_ecb_aes,
1199*4882a593Smuzhiyun 	&safexcel_alg_cbc_aes,
1200*4882a593Smuzhiyun 	&safexcel_alg_cfb_aes,
1201*4882a593Smuzhiyun 	&safexcel_alg_ofb_aes,
1202*4882a593Smuzhiyun 	&safexcel_alg_ctr_aes,
1203*4882a593Smuzhiyun 	&safexcel_alg_md5,
1204*4882a593Smuzhiyun 	&safexcel_alg_sha1,
1205*4882a593Smuzhiyun 	&safexcel_alg_sha224,
1206*4882a593Smuzhiyun 	&safexcel_alg_sha256,
1207*4882a593Smuzhiyun 	&safexcel_alg_sha384,
1208*4882a593Smuzhiyun 	&safexcel_alg_sha512,
1209*4882a593Smuzhiyun 	&safexcel_alg_hmac_md5,
1210*4882a593Smuzhiyun 	&safexcel_alg_hmac_sha1,
1211*4882a593Smuzhiyun 	&safexcel_alg_hmac_sha224,
1212*4882a593Smuzhiyun 	&safexcel_alg_hmac_sha256,
1213*4882a593Smuzhiyun 	&safexcel_alg_hmac_sha384,
1214*4882a593Smuzhiyun 	&safexcel_alg_hmac_sha512,
1215*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha1_cbc_aes,
1216*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha224_cbc_aes,
1217*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha256_cbc_aes,
1218*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha384_cbc_aes,
1219*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha512_cbc_aes,
1220*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha1_cbc_des3_ede,
1221*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha1_ctr_aes,
1222*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha224_ctr_aes,
1223*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha256_ctr_aes,
1224*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha384_ctr_aes,
1225*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha512_ctr_aes,
1226*4882a593Smuzhiyun 	&safexcel_alg_xts_aes,
1227*4882a593Smuzhiyun 	&safexcel_alg_gcm,
1228*4882a593Smuzhiyun 	&safexcel_alg_ccm,
1229*4882a593Smuzhiyun 	&safexcel_alg_crc32,
1230*4882a593Smuzhiyun 	&safexcel_alg_cbcmac,
1231*4882a593Smuzhiyun 	&safexcel_alg_xcbcmac,
1232*4882a593Smuzhiyun 	&safexcel_alg_cmac,
1233*4882a593Smuzhiyun 	&safexcel_alg_chacha20,
1234*4882a593Smuzhiyun 	&safexcel_alg_chachapoly,
1235*4882a593Smuzhiyun 	&safexcel_alg_chachapoly_esp,
1236*4882a593Smuzhiyun 	&safexcel_alg_sm3,
1237*4882a593Smuzhiyun 	&safexcel_alg_hmac_sm3,
1238*4882a593Smuzhiyun 	&safexcel_alg_ecb_sm4,
1239*4882a593Smuzhiyun 	&safexcel_alg_cbc_sm4,
1240*4882a593Smuzhiyun 	&safexcel_alg_ofb_sm4,
1241*4882a593Smuzhiyun 	&safexcel_alg_cfb_sm4,
1242*4882a593Smuzhiyun 	&safexcel_alg_ctr_sm4,
1243*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha1_cbc_sm4,
1244*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sm3_cbc_sm4,
1245*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha1_ctr_sm4,
1246*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sm3_ctr_sm4,
1247*4882a593Smuzhiyun 	&safexcel_alg_sha3_224,
1248*4882a593Smuzhiyun 	&safexcel_alg_sha3_256,
1249*4882a593Smuzhiyun 	&safexcel_alg_sha3_384,
1250*4882a593Smuzhiyun 	&safexcel_alg_sha3_512,
1251*4882a593Smuzhiyun 	&safexcel_alg_hmac_sha3_224,
1252*4882a593Smuzhiyun 	&safexcel_alg_hmac_sha3_256,
1253*4882a593Smuzhiyun 	&safexcel_alg_hmac_sha3_384,
1254*4882a593Smuzhiyun 	&safexcel_alg_hmac_sha3_512,
1255*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha1_cbc_des,
1256*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha256_cbc_des3_ede,
1257*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha224_cbc_des3_ede,
1258*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha512_cbc_des3_ede,
1259*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha384_cbc_des3_ede,
1260*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha256_cbc_des,
1261*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha224_cbc_des,
1262*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha512_cbc_des,
1263*4882a593Smuzhiyun 	&safexcel_alg_authenc_hmac_sha384_cbc_des,
1264*4882a593Smuzhiyun 	&safexcel_alg_rfc4106_gcm,
1265*4882a593Smuzhiyun 	&safexcel_alg_rfc4543_gcm,
1266*4882a593Smuzhiyun 	&safexcel_alg_rfc4309_ccm,
1267*4882a593Smuzhiyun };
1268*4882a593Smuzhiyun 
safexcel_register_algorithms(struct safexcel_crypto_priv * priv)1269*4882a593Smuzhiyun static int safexcel_register_algorithms(struct safexcel_crypto_priv *priv)
1270*4882a593Smuzhiyun {
1271*4882a593Smuzhiyun 	int i, j, ret = 0;
1272*4882a593Smuzhiyun 
1273*4882a593Smuzhiyun 	for (i = 0; i < ARRAY_SIZE(safexcel_algs); i++) {
1274*4882a593Smuzhiyun 		safexcel_algs[i]->priv = priv;
1275*4882a593Smuzhiyun 
1276*4882a593Smuzhiyun 		/* Do we have all required base algorithms available? */
1277*4882a593Smuzhiyun 		if ((safexcel_algs[i]->algo_mask & priv->hwconfig.algo_flags) !=
1278*4882a593Smuzhiyun 		    safexcel_algs[i]->algo_mask)
1279*4882a593Smuzhiyun 			/* No, so don't register this ciphersuite */
1280*4882a593Smuzhiyun 			continue;
1281*4882a593Smuzhiyun 
1282*4882a593Smuzhiyun 		if (safexcel_algs[i]->type == SAFEXCEL_ALG_TYPE_SKCIPHER)
1283*4882a593Smuzhiyun 			ret = crypto_register_skcipher(&safexcel_algs[i]->alg.skcipher);
1284*4882a593Smuzhiyun 		else if (safexcel_algs[i]->type == SAFEXCEL_ALG_TYPE_AEAD)
1285*4882a593Smuzhiyun 			ret = crypto_register_aead(&safexcel_algs[i]->alg.aead);
1286*4882a593Smuzhiyun 		else
1287*4882a593Smuzhiyun 			ret = crypto_register_ahash(&safexcel_algs[i]->alg.ahash);
1288*4882a593Smuzhiyun 
1289*4882a593Smuzhiyun 		if (ret)
1290*4882a593Smuzhiyun 			goto fail;
1291*4882a593Smuzhiyun 	}
1292*4882a593Smuzhiyun 
1293*4882a593Smuzhiyun 	return 0;
1294*4882a593Smuzhiyun 
1295*4882a593Smuzhiyun fail:
1296*4882a593Smuzhiyun 	for (j = 0; j < i; j++) {
1297*4882a593Smuzhiyun 		/* Do we have all required base algorithms available? */
1298*4882a593Smuzhiyun 		if ((safexcel_algs[j]->algo_mask & priv->hwconfig.algo_flags) !=
1299*4882a593Smuzhiyun 		    safexcel_algs[j]->algo_mask)
1300*4882a593Smuzhiyun 			/* No, so don't unregister this ciphersuite */
1301*4882a593Smuzhiyun 			continue;
1302*4882a593Smuzhiyun 
1303*4882a593Smuzhiyun 		if (safexcel_algs[j]->type == SAFEXCEL_ALG_TYPE_SKCIPHER)
1304*4882a593Smuzhiyun 			crypto_unregister_skcipher(&safexcel_algs[j]->alg.skcipher);
1305*4882a593Smuzhiyun 		else if (safexcel_algs[j]->type == SAFEXCEL_ALG_TYPE_AEAD)
1306*4882a593Smuzhiyun 			crypto_unregister_aead(&safexcel_algs[j]->alg.aead);
1307*4882a593Smuzhiyun 		else
1308*4882a593Smuzhiyun 			crypto_unregister_ahash(&safexcel_algs[j]->alg.ahash);
1309*4882a593Smuzhiyun 	}
1310*4882a593Smuzhiyun 
1311*4882a593Smuzhiyun 	return ret;
1312*4882a593Smuzhiyun }
1313*4882a593Smuzhiyun 
safexcel_unregister_algorithms(struct safexcel_crypto_priv * priv)1314*4882a593Smuzhiyun static void safexcel_unregister_algorithms(struct safexcel_crypto_priv *priv)
1315*4882a593Smuzhiyun {
1316*4882a593Smuzhiyun 	int i;
1317*4882a593Smuzhiyun 
1318*4882a593Smuzhiyun 	for (i = 0; i < ARRAY_SIZE(safexcel_algs); i++) {
1319*4882a593Smuzhiyun 		/* Do we have all required base algorithms available? */
1320*4882a593Smuzhiyun 		if ((safexcel_algs[i]->algo_mask & priv->hwconfig.algo_flags) !=
1321*4882a593Smuzhiyun 		    safexcel_algs[i]->algo_mask)
1322*4882a593Smuzhiyun 			/* No, so don't unregister this ciphersuite */
1323*4882a593Smuzhiyun 			continue;
1324*4882a593Smuzhiyun 
1325*4882a593Smuzhiyun 		if (safexcel_algs[i]->type == SAFEXCEL_ALG_TYPE_SKCIPHER)
1326*4882a593Smuzhiyun 			crypto_unregister_skcipher(&safexcel_algs[i]->alg.skcipher);
1327*4882a593Smuzhiyun 		else if (safexcel_algs[i]->type == SAFEXCEL_ALG_TYPE_AEAD)
1328*4882a593Smuzhiyun 			crypto_unregister_aead(&safexcel_algs[i]->alg.aead);
1329*4882a593Smuzhiyun 		else
1330*4882a593Smuzhiyun 			crypto_unregister_ahash(&safexcel_algs[i]->alg.ahash);
1331*4882a593Smuzhiyun 	}
1332*4882a593Smuzhiyun }
1333*4882a593Smuzhiyun 
safexcel_configure(struct safexcel_crypto_priv * priv)1334*4882a593Smuzhiyun static void safexcel_configure(struct safexcel_crypto_priv *priv)
1335*4882a593Smuzhiyun {
1336*4882a593Smuzhiyun 	u32 mask = BIT(priv->hwconfig.hwdataw) - 1;
1337*4882a593Smuzhiyun 
1338*4882a593Smuzhiyun 	priv->config.pes = priv->hwconfig.hwnumpes;
1339*4882a593Smuzhiyun 	priv->config.rings = min_t(u32, priv->hwconfig.hwnumrings, max_rings);
1340*4882a593Smuzhiyun 	/* Cannot currently support more rings than we have ring AICs! */
1341*4882a593Smuzhiyun 	priv->config.rings = min_t(u32, priv->config.rings,
1342*4882a593Smuzhiyun 					priv->hwconfig.hwnumraic);
1343*4882a593Smuzhiyun 
1344*4882a593Smuzhiyun 	priv->config.cd_size = EIP197_CD64_FETCH_SIZE;
1345*4882a593Smuzhiyun 	priv->config.cd_offset = (priv->config.cd_size + mask) & ~mask;
1346*4882a593Smuzhiyun 	priv->config.cdsh_offset = (EIP197_MAX_TOKENS + mask) & ~mask;
1347*4882a593Smuzhiyun 
1348*4882a593Smuzhiyun 	/* res token is behind the descr, but ofs must be rounded to buswdth */
1349*4882a593Smuzhiyun 	priv->config.res_offset = (EIP197_RD64_FETCH_SIZE + mask) & ~mask;
1350*4882a593Smuzhiyun 	/* now the size of the descr is this 1st part plus the result struct */
1351*4882a593Smuzhiyun 	priv->config.rd_size    = priv->config.res_offset +
1352*4882a593Smuzhiyun 				  EIP197_RD64_RESULT_SIZE;
1353*4882a593Smuzhiyun 	priv->config.rd_offset = (priv->config.rd_size + mask) & ~mask;
1354*4882a593Smuzhiyun 
1355*4882a593Smuzhiyun 	/* convert dwords to bytes */
1356*4882a593Smuzhiyun 	priv->config.cd_offset *= sizeof(u32);
1357*4882a593Smuzhiyun 	priv->config.cdsh_offset *= sizeof(u32);
1358*4882a593Smuzhiyun 	priv->config.rd_offset *= sizeof(u32);
1359*4882a593Smuzhiyun 	priv->config.res_offset *= sizeof(u32);
1360*4882a593Smuzhiyun }
1361*4882a593Smuzhiyun 
safexcel_init_register_offsets(struct safexcel_crypto_priv * priv)1362*4882a593Smuzhiyun static void safexcel_init_register_offsets(struct safexcel_crypto_priv *priv)
1363*4882a593Smuzhiyun {
1364*4882a593Smuzhiyun 	struct safexcel_register_offsets *offsets = &priv->offsets;
1365*4882a593Smuzhiyun 
1366*4882a593Smuzhiyun 	if (priv->flags & SAFEXCEL_HW_EIP197) {
1367*4882a593Smuzhiyun 		offsets->hia_aic	= EIP197_HIA_AIC_BASE;
1368*4882a593Smuzhiyun 		offsets->hia_aic_g	= EIP197_HIA_AIC_G_BASE;
1369*4882a593Smuzhiyun 		offsets->hia_aic_r	= EIP197_HIA_AIC_R_BASE;
1370*4882a593Smuzhiyun 		offsets->hia_aic_xdr	= EIP197_HIA_AIC_xDR_BASE;
1371*4882a593Smuzhiyun 		offsets->hia_dfe	= EIP197_HIA_DFE_BASE;
1372*4882a593Smuzhiyun 		offsets->hia_dfe_thr	= EIP197_HIA_DFE_THR_BASE;
1373*4882a593Smuzhiyun 		offsets->hia_dse	= EIP197_HIA_DSE_BASE;
1374*4882a593Smuzhiyun 		offsets->hia_dse_thr	= EIP197_HIA_DSE_THR_BASE;
1375*4882a593Smuzhiyun 		offsets->hia_gen_cfg	= EIP197_HIA_GEN_CFG_BASE;
1376*4882a593Smuzhiyun 		offsets->pe		= EIP197_PE_BASE;
1377*4882a593Smuzhiyun 		offsets->global		= EIP197_GLOBAL_BASE;
1378*4882a593Smuzhiyun 	} else {
1379*4882a593Smuzhiyun 		offsets->hia_aic	= EIP97_HIA_AIC_BASE;
1380*4882a593Smuzhiyun 		offsets->hia_aic_g	= EIP97_HIA_AIC_G_BASE;
1381*4882a593Smuzhiyun 		offsets->hia_aic_r	= EIP97_HIA_AIC_R_BASE;
1382*4882a593Smuzhiyun 		offsets->hia_aic_xdr	= EIP97_HIA_AIC_xDR_BASE;
1383*4882a593Smuzhiyun 		offsets->hia_dfe	= EIP97_HIA_DFE_BASE;
1384*4882a593Smuzhiyun 		offsets->hia_dfe_thr	= EIP97_HIA_DFE_THR_BASE;
1385*4882a593Smuzhiyun 		offsets->hia_dse	= EIP97_HIA_DSE_BASE;
1386*4882a593Smuzhiyun 		offsets->hia_dse_thr	= EIP97_HIA_DSE_THR_BASE;
1387*4882a593Smuzhiyun 		offsets->hia_gen_cfg	= EIP97_HIA_GEN_CFG_BASE;
1388*4882a593Smuzhiyun 		offsets->pe		= EIP97_PE_BASE;
1389*4882a593Smuzhiyun 		offsets->global		= EIP97_GLOBAL_BASE;
1390*4882a593Smuzhiyun 	}
1391*4882a593Smuzhiyun }
1392*4882a593Smuzhiyun 
1393*4882a593Smuzhiyun /*
1394*4882a593Smuzhiyun  * Generic part of probe routine, shared by platform and PCI driver
1395*4882a593Smuzhiyun  *
1396*4882a593Smuzhiyun  * Assumes IO resources have been mapped, private data mem has been allocated,
1397*4882a593Smuzhiyun  * clocks have been enabled, device pointer has been assigned etc.
1398*4882a593Smuzhiyun  *
1399*4882a593Smuzhiyun  */
safexcel_probe_generic(void * pdev,struct safexcel_crypto_priv * priv,int is_pci_dev)1400*4882a593Smuzhiyun static int safexcel_probe_generic(void *pdev,
1401*4882a593Smuzhiyun 				  struct safexcel_crypto_priv *priv,
1402*4882a593Smuzhiyun 				  int is_pci_dev)
1403*4882a593Smuzhiyun {
1404*4882a593Smuzhiyun 	struct device *dev = priv->dev;
1405*4882a593Smuzhiyun 	u32 peid, version, mask, val, hiaopt, hwopt, peopt;
1406*4882a593Smuzhiyun 	int i, ret, hwctg;
1407*4882a593Smuzhiyun 
1408*4882a593Smuzhiyun 	priv->context_pool = dmam_pool_create("safexcel-context", dev,
1409*4882a593Smuzhiyun 					      sizeof(struct safexcel_context_record),
1410*4882a593Smuzhiyun 					      1, 0);
1411*4882a593Smuzhiyun 	if (!priv->context_pool)
1412*4882a593Smuzhiyun 		return -ENOMEM;
1413*4882a593Smuzhiyun 
1414*4882a593Smuzhiyun 	/*
1415*4882a593Smuzhiyun 	 * First try the EIP97 HIA version regs
1416*4882a593Smuzhiyun 	 * For the EIP197, this is guaranteed to NOT return any of the test
1417*4882a593Smuzhiyun 	 * values
1418*4882a593Smuzhiyun 	 */
1419*4882a593Smuzhiyun 	version = readl(priv->base + EIP97_HIA_AIC_BASE + EIP197_HIA_VERSION);
1420*4882a593Smuzhiyun 
1421*4882a593Smuzhiyun 	mask = 0;  /* do not swap */
1422*4882a593Smuzhiyun 	if (EIP197_REG_LO16(version) == EIP197_HIA_VERSION_LE) {
1423*4882a593Smuzhiyun 		priv->hwconfig.hiaver = EIP197_VERSION_MASK(version);
1424*4882a593Smuzhiyun 	} else if (EIP197_REG_HI16(version) == EIP197_HIA_VERSION_BE) {
1425*4882a593Smuzhiyun 		/* read back byte-swapped, so complement byte swap bits */
1426*4882a593Smuzhiyun 		mask = EIP197_MST_CTRL_BYTE_SWAP_BITS;
1427*4882a593Smuzhiyun 		priv->hwconfig.hiaver = EIP197_VERSION_SWAP(version);
1428*4882a593Smuzhiyun 	} else {
1429*4882a593Smuzhiyun 		/* So it wasn't an EIP97 ... maybe it's an EIP197? */
1430*4882a593Smuzhiyun 		version = readl(priv->base + EIP197_HIA_AIC_BASE +
1431*4882a593Smuzhiyun 				EIP197_HIA_VERSION);
1432*4882a593Smuzhiyun 		if (EIP197_REG_LO16(version) == EIP197_HIA_VERSION_LE) {
1433*4882a593Smuzhiyun 			priv->hwconfig.hiaver = EIP197_VERSION_MASK(version);
1434*4882a593Smuzhiyun 			priv->flags |= SAFEXCEL_HW_EIP197;
1435*4882a593Smuzhiyun 		} else if (EIP197_REG_HI16(version) ==
1436*4882a593Smuzhiyun 			   EIP197_HIA_VERSION_BE) {
1437*4882a593Smuzhiyun 			/* read back byte-swapped, so complement swap bits */
1438*4882a593Smuzhiyun 			mask = EIP197_MST_CTRL_BYTE_SWAP_BITS;
1439*4882a593Smuzhiyun 			priv->hwconfig.hiaver = EIP197_VERSION_SWAP(version);
1440*4882a593Smuzhiyun 			priv->flags |= SAFEXCEL_HW_EIP197;
1441*4882a593Smuzhiyun 		} else {
1442*4882a593Smuzhiyun 			return -ENODEV;
1443*4882a593Smuzhiyun 		}
1444*4882a593Smuzhiyun 	}
1445*4882a593Smuzhiyun 
1446*4882a593Smuzhiyun 	/* Now initialize the reg offsets based on the probing info so far */
1447*4882a593Smuzhiyun 	safexcel_init_register_offsets(priv);
1448*4882a593Smuzhiyun 
1449*4882a593Smuzhiyun 	/*
1450*4882a593Smuzhiyun 	 * If the version was read byte-swapped, we need to flip the device
1451*4882a593Smuzhiyun 	 * swapping Keep in mind here, though, that what we write will also be
1452*4882a593Smuzhiyun 	 * byte-swapped ...
1453*4882a593Smuzhiyun 	 */
1454*4882a593Smuzhiyun 	if (mask) {
1455*4882a593Smuzhiyun 		val = readl(EIP197_HIA_AIC(priv) + EIP197_HIA_MST_CTRL);
1456*4882a593Smuzhiyun 		val = val ^ (mask >> 24); /* toggle byte swap bits */
1457*4882a593Smuzhiyun 		writel(val, EIP197_HIA_AIC(priv) + EIP197_HIA_MST_CTRL);
1458*4882a593Smuzhiyun 	}
1459*4882a593Smuzhiyun 
1460*4882a593Smuzhiyun 	/*
1461*4882a593Smuzhiyun 	 * We're not done probing yet! We may fall through to here if no HIA
1462*4882a593Smuzhiyun 	 * was found at all. So, with the endianness presumably correct now and
1463*4882a593Smuzhiyun 	 * the offsets setup, *really* probe for the EIP97/EIP197.
1464*4882a593Smuzhiyun 	 */
1465*4882a593Smuzhiyun 	version = readl(EIP197_GLOBAL(priv) + EIP197_VERSION);
1466*4882a593Smuzhiyun 	if (((priv->flags & SAFEXCEL_HW_EIP197) &&
1467*4882a593Smuzhiyun 	     (EIP197_REG_LO16(version) != EIP197_VERSION_LE) &&
1468*4882a593Smuzhiyun 	     (EIP197_REG_LO16(version) != EIP196_VERSION_LE)) ||
1469*4882a593Smuzhiyun 	    ((!(priv->flags & SAFEXCEL_HW_EIP197) &&
1470*4882a593Smuzhiyun 	     (EIP197_REG_LO16(version) != EIP97_VERSION_LE)))) {
1471*4882a593Smuzhiyun 		/*
1472*4882a593Smuzhiyun 		 * We did not find the device that matched our initial probing
1473*4882a593Smuzhiyun 		 * (or our initial probing failed) Report appropriate error.
1474*4882a593Smuzhiyun 		 */
1475*4882a593Smuzhiyun 		dev_err(priv->dev, "Probing for EIP97/EIP19x failed - no such device (read %08x)\n",
1476*4882a593Smuzhiyun 			version);
1477*4882a593Smuzhiyun 		return -ENODEV;
1478*4882a593Smuzhiyun 	}
1479*4882a593Smuzhiyun 
1480*4882a593Smuzhiyun 	priv->hwconfig.hwver = EIP197_VERSION_MASK(version);
1481*4882a593Smuzhiyun 	hwctg = version >> 28;
1482*4882a593Smuzhiyun 	peid = version & 255;
1483*4882a593Smuzhiyun 
1484*4882a593Smuzhiyun 	/* Detect EIP206 processing pipe */
1485*4882a593Smuzhiyun 	version = readl(EIP197_PE(priv) + + EIP197_PE_VERSION(0));
1486*4882a593Smuzhiyun 	if (EIP197_REG_LO16(version) != EIP206_VERSION_LE) {
1487*4882a593Smuzhiyun 		dev_err(priv->dev, "EIP%d: EIP206 not detected\n", peid);
1488*4882a593Smuzhiyun 		return -ENODEV;
1489*4882a593Smuzhiyun 	}
1490*4882a593Smuzhiyun 	priv->hwconfig.ppver = EIP197_VERSION_MASK(version);
1491*4882a593Smuzhiyun 
1492*4882a593Smuzhiyun 	/* Detect EIP96 packet engine and version */
1493*4882a593Smuzhiyun 	version = readl(EIP197_PE(priv) + EIP197_PE_EIP96_VERSION(0));
1494*4882a593Smuzhiyun 	if (EIP197_REG_LO16(version) != EIP96_VERSION_LE) {
1495*4882a593Smuzhiyun 		dev_err(dev, "EIP%d: EIP96 not detected.\n", peid);
1496*4882a593Smuzhiyun 		return -ENODEV;
1497*4882a593Smuzhiyun 	}
1498*4882a593Smuzhiyun 	priv->hwconfig.pever = EIP197_VERSION_MASK(version);
1499*4882a593Smuzhiyun 
1500*4882a593Smuzhiyun 	hwopt = readl(EIP197_GLOBAL(priv) + EIP197_OPTIONS);
1501*4882a593Smuzhiyun 	hiaopt = readl(EIP197_HIA_AIC(priv) + EIP197_HIA_OPTIONS);
1502*4882a593Smuzhiyun 
1503*4882a593Smuzhiyun 	priv->hwconfig.icever = 0;
1504*4882a593Smuzhiyun 	priv->hwconfig.ocever = 0;
1505*4882a593Smuzhiyun 	priv->hwconfig.psever = 0;
1506*4882a593Smuzhiyun 	if (priv->flags & SAFEXCEL_HW_EIP197) {
1507*4882a593Smuzhiyun 		/* EIP197 */
1508*4882a593Smuzhiyun 		peopt = readl(EIP197_PE(priv) + EIP197_PE_OPTIONS(0));
1509*4882a593Smuzhiyun 
1510*4882a593Smuzhiyun 		priv->hwconfig.hwdataw  = (hiaopt >> EIP197_HWDATAW_OFFSET) &
1511*4882a593Smuzhiyun 					  EIP197_HWDATAW_MASK;
1512*4882a593Smuzhiyun 		priv->hwconfig.hwcfsize = ((hiaopt >> EIP197_CFSIZE_OFFSET) &
1513*4882a593Smuzhiyun 					   EIP197_CFSIZE_MASK) +
1514*4882a593Smuzhiyun 					  EIP197_CFSIZE_ADJUST;
1515*4882a593Smuzhiyun 		priv->hwconfig.hwrfsize = ((hiaopt >> EIP197_RFSIZE_OFFSET) &
1516*4882a593Smuzhiyun 					   EIP197_RFSIZE_MASK) +
1517*4882a593Smuzhiyun 					  EIP197_RFSIZE_ADJUST;
1518*4882a593Smuzhiyun 		priv->hwconfig.hwnumpes	= (hiaopt >> EIP197_N_PES_OFFSET) &
1519*4882a593Smuzhiyun 					  EIP197_N_PES_MASK;
1520*4882a593Smuzhiyun 		priv->hwconfig.hwnumrings = (hiaopt >> EIP197_N_RINGS_OFFSET) &
1521*4882a593Smuzhiyun 					    EIP197_N_RINGS_MASK;
1522*4882a593Smuzhiyun 		if (hiaopt & EIP197_HIA_OPT_HAS_PE_ARB)
1523*4882a593Smuzhiyun 			priv->flags |= EIP197_PE_ARB;
1524*4882a593Smuzhiyun 		if (EIP206_OPT_ICE_TYPE(peopt) == 1) {
1525*4882a593Smuzhiyun 			priv->flags |= EIP197_ICE;
1526*4882a593Smuzhiyun 			/* Detect ICE EIP207 class. engine and version */
1527*4882a593Smuzhiyun 			version = readl(EIP197_PE(priv) +
1528*4882a593Smuzhiyun 				  EIP197_PE_ICE_VERSION(0));
1529*4882a593Smuzhiyun 			if (EIP197_REG_LO16(version) != EIP207_VERSION_LE) {
1530*4882a593Smuzhiyun 				dev_err(dev, "EIP%d: ICE EIP207 not detected.\n",
1531*4882a593Smuzhiyun 					peid);
1532*4882a593Smuzhiyun 				return -ENODEV;
1533*4882a593Smuzhiyun 			}
1534*4882a593Smuzhiyun 			priv->hwconfig.icever = EIP197_VERSION_MASK(version);
1535*4882a593Smuzhiyun 		}
1536*4882a593Smuzhiyun 		if (EIP206_OPT_OCE_TYPE(peopt) == 1) {
1537*4882a593Smuzhiyun 			priv->flags |= EIP197_OCE;
1538*4882a593Smuzhiyun 			/* Detect EIP96PP packet stream editor and version */
1539*4882a593Smuzhiyun 			version = readl(EIP197_PE(priv) + EIP197_PE_PSE_VERSION(0));
1540*4882a593Smuzhiyun 			if (EIP197_REG_LO16(version) != EIP96_VERSION_LE) {
1541*4882a593Smuzhiyun 				dev_err(dev, "EIP%d: EIP96PP not detected.\n", peid);
1542*4882a593Smuzhiyun 				return -ENODEV;
1543*4882a593Smuzhiyun 			}
1544*4882a593Smuzhiyun 			priv->hwconfig.psever = EIP197_VERSION_MASK(version);
1545*4882a593Smuzhiyun 			/* Detect OCE EIP207 class. engine and version */
1546*4882a593Smuzhiyun 			version = readl(EIP197_PE(priv) +
1547*4882a593Smuzhiyun 				  EIP197_PE_ICE_VERSION(0));
1548*4882a593Smuzhiyun 			if (EIP197_REG_LO16(version) != EIP207_VERSION_LE) {
1549*4882a593Smuzhiyun 				dev_err(dev, "EIP%d: OCE EIP207 not detected.\n",
1550*4882a593Smuzhiyun 					peid);
1551*4882a593Smuzhiyun 				return -ENODEV;
1552*4882a593Smuzhiyun 			}
1553*4882a593Smuzhiyun 			priv->hwconfig.ocever = EIP197_VERSION_MASK(version);
1554*4882a593Smuzhiyun 		}
1555*4882a593Smuzhiyun 		/* If not a full TRC, then assume simple TRC */
1556*4882a593Smuzhiyun 		if (!(hwopt & EIP197_OPT_HAS_TRC))
1557*4882a593Smuzhiyun 			priv->flags |= EIP197_SIMPLE_TRC;
1558*4882a593Smuzhiyun 		/* EIP197 always has SOME form of TRC */
1559*4882a593Smuzhiyun 		priv->flags |= EIP197_TRC_CACHE;
1560*4882a593Smuzhiyun 	} else {
1561*4882a593Smuzhiyun 		/* EIP97 */
1562*4882a593Smuzhiyun 		priv->hwconfig.hwdataw  = (hiaopt >> EIP197_HWDATAW_OFFSET) &
1563*4882a593Smuzhiyun 					  EIP97_HWDATAW_MASK;
1564*4882a593Smuzhiyun 		priv->hwconfig.hwcfsize = (hiaopt >> EIP97_CFSIZE_OFFSET) &
1565*4882a593Smuzhiyun 					  EIP97_CFSIZE_MASK;
1566*4882a593Smuzhiyun 		priv->hwconfig.hwrfsize = (hiaopt >> EIP97_RFSIZE_OFFSET) &
1567*4882a593Smuzhiyun 					  EIP97_RFSIZE_MASK;
1568*4882a593Smuzhiyun 		priv->hwconfig.hwnumpes	= 1; /* by definition */
1569*4882a593Smuzhiyun 		priv->hwconfig.hwnumrings = (hiaopt >> EIP197_N_RINGS_OFFSET) &
1570*4882a593Smuzhiyun 					    EIP197_N_RINGS_MASK;
1571*4882a593Smuzhiyun 	}
1572*4882a593Smuzhiyun 
1573*4882a593Smuzhiyun 	/* Scan for ring AIC's */
1574*4882a593Smuzhiyun 	for (i = 0; i < EIP197_MAX_RING_AIC; i++) {
1575*4882a593Smuzhiyun 		version = readl(EIP197_HIA_AIC_R(priv) +
1576*4882a593Smuzhiyun 				EIP197_HIA_AIC_R_VERSION(i));
1577*4882a593Smuzhiyun 		if (EIP197_REG_LO16(version) != EIP201_VERSION_LE)
1578*4882a593Smuzhiyun 			break;
1579*4882a593Smuzhiyun 	}
1580*4882a593Smuzhiyun 	priv->hwconfig.hwnumraic = i;
1581*4882a593Smuzhiyun 	/* Low-end EIP196 may not have any ring AIC's ... */
1582*4882a593Smuzhiyun 	if (!priv->hwconfig.hwnumraic) {
1583*4882a593Smuzhiyun 		dev_err(priv->dev, "No ring interrupt controller present!\n");
1584*4882a593Smuzhiyun 		return -ENODEV;
1585*4882a593Smuzhiyun 	}
1586*4882a593Smuzhiyun 
1587*4882a593Smuzhiyun 	/* Get supported algorithms from EIP96 transform engine */
1588*4882a593Smuzhiyun 	priv->hwconfig.algo_flags = readl(EIP197_PE(priv) +
1589*4882a593Smuzhiyun 				    EIP197_PE_EIP96_OPTIONS(0));
1590*4882a593Smuzhiyun 
1591*4882a593Smuzhiyun 	/* Print single info line describing what we just detected */
1592*4882a593Smuzhiyun 	dev_info(priv->dev, "EIP%d:%x(%d,%d,%d,%d)-HIA:%x(%d,%d,%d),PE:%x/%x(alg:%08x)/%x/%x/%x\n",
1593*4882a593Smuzhiyun 		 peid, priv->hwconfig.hwver, hwctg, priv->hwconfig.hwnumpes,
1594*4882a593Smuzhiyun 		 priv->hwconfig.hwnumrings, priv->hwconfig.hwnumraic,
1595*4882a593Smuzhiyun 		 priv->hwconfig.hiaver, priv->hwconfig.hwdataw,
1596*4882a593Smuzhiyun 		 priv->hwconfig.hwcfsize, priv->hwconfig.hwrfsize,
1597*4882a593Smuzhiyun 		 priv->hwconfig.ppver, priv->hwconfig.pever,
1598*4882a593Smuzhiyun 		 priv->hwconfig.algo_flags, priv->hwconfig.icever,
1599*4882a593Smuzhiyun 		 priv->hwconfig.ocever, priv->hwconfig.psever);
1600*4882a593Smuzhiyun 
1601*4882a593Smuzhiyun 	safexcel_configure(priv);
1602*4882a593Smuzhiyun 
1603*4882a593Smuzhiyun 	if (IS_ENABLED(CONFIG_PCI) && priv->version == EIP197_DEVBRD) {
1604*4882a593Smuzhiyun 		/*
1605*4882a593Smuzhiyun 		 * Request MSI vectors for global + 1 per ring -
1606*4882a593Smuzhiyun 		 * or just 1 for older dev images
1607*4882a593Smuzhiyun 		 */
1608*4882a593Smuzhiyun 		struct pci_dev *pci_pdev = pdev;
1609*4882a593Smuzhiyun 
1610*4882a593Smuzhiyun 		ret = pci_alloc_irq_vectors(pci_pdev,
1611*4882a593Smuzhiyun 					    priv->config.rings + 1,
1612*4882a593Smuzhiyun 					    priv->config.rings + 1,
1613*4882a593Smuzhiyun 					    PCI_IRQ_MSI | PCI_IRQ_MSIX);
1614*4882a593Smuzhiyun 		if (ret < 0) {
1615*4882a593Smuzhiyun 			dev_err(dev, "Failed to allocate PCI MSI interrupts\n");
1616*4882a593Smuzhiyun 			return ret;
1617*4882a593Smuzhiyun 		}
1618*4882a593Smuzhiyun 	}
1619*4882a593Smuzhiyun 
1620*4882a593Smuzhiyun 	/* Register the ring IRQ handlers and configure the rings */
1621*4882a593Smuzhiyun 	priv->ring = devm_kcalloc(dev, priv->config.rings,
1622*4882a593Smuzhiyun 				  sizeof(*priv->ring),
1623*4882a593Smuzhiyun 				  GFP_KERNEL);
1624*4882a593Smuzhiyun 	if (!priv->ring)
1625*4882a593Smuzhiyun 		return -ENOMEM;
1626*4882a593Smuzhiyun 
1627*4882a593Smuzhiyun 	for (i = 0; i < priv->config.rings; i++) {
1628*4882a593Smuzhiyun 		char wq_name[9] = {0};
1629*4882a593Smuzhiyun 		int irq;
1630*4882a593Smuzhiyun 		struct safexcel_ring_irq_data *ring_irq;
1631*4882a593Smuzhiyun 
1632*4882a593Smuzhiyun 		ret = safexcel_init_ring_descriptors(priv,
1633*4882a593Smuzhiyun 						     &priv->ring[i].cdr,
1634*4882a593Smuzhiyun 						     &priv->ring[i].rdr);
1635*4882a593Smuzhiyun 		if (ret) {
1636*4882a593Smuzhiyun 			dev_err(dev, "Failed to initialize rings\n");
1637*4882a593Smuzhiyun 			return ret;
1638*4882a593Smuzhiyun 		}
1639*4882a593Smuzhiyun 
1640*4882a593Smuzhiyun 		priv->ring[i].rdr_req = devm_kcalloc(dev,
1641*4882a593Smuzhiyun 			EIP197_DEFAULT_RING_SIZE,
1642*4882a593Smuzhiyun 			sizeof(*priv->ring[i].rdr_req),
1643*4882a593Smuzhiyun 			GFP_KERNEL);
1644*4882a593Smuzhiyun 		if (!priv->ring[i].rdr_req)
1645*4882a593Smuzhiyun 			return -ENOMEM;
1646*4882a593Smuzhiyun 
1647*4882a593Smuzhiyun 		ring_irq = devm_kzalloc(dev, sizeof(*ring_irq), GFP_KERNEL);
1648*4882a593Smuzhiyun 		if (!ring_irq)
1649*4882a593Smuzhiyun 			return -ENOMEM;
1650*4882a593Smuzhiyun 
1651*4882a593Smuzhiyun 		ring_irq->priv = priv;
1652*4882a593Smuzhiyun 		ring_irq->ring = i;
1653*4882a593Smuzhiyun 
1654*4882a593Smuzhiyun 		irq = safexcel_request_ring_irq(pdev,
1655*4882a593Smuzhiyun 						EIP197_IRQ_NUMBER(i, is_pci_dev),
1656*4882a593Smuzhiyun 						is_pci_dev,
1657*4882a593Smuzhiyun 						i,
1658*4882a593Smuzhiyun 						safexcel_irq_ring,
1659*4882a593Smuzhiyun 						safexcel_irq_ring_thread,
1660*4882a593Smuzhiyun 						ring_irq);
1661*4882a593Smuzhiyun 		if (irq < 0) {
1662*4882a593Smuzhiyun 			dev_err(dev, "Failed to get IRQ ID for ring %d\n", i);
1663*4882a593Smuzhiyun 			return irq;
1664*4882a593Smuzhiyun 		}
1665*4882a593Smuzhiyun 
1666*4882a593Smuzhiyun 		priv->ring[i].irq = irq;
1667*4882a593Smuzhiyun 		priv->ring[i].work_data.priv = priv;
1668*4882a593Smuzhiyun 		priv->ring[i].work_data.ring = i;
1669*4882a593Smuzhiyun 		INIT_WORK(&priv->ring[i].work_data.work,
1670*4882a593Smuzhiyun 			  safexcel_dequeue_work);
1671*4882a593Smuzhiyun 
1672*4882a593Smuzhiyun 		snprintf(wq_name, 9, "wq_ring%d", i);
1673*4882a593Smuzhiyun 		priv->ring[i].workqueue =
1674*4882a593Smuzhiyun 			create_singlethread_workqueue(wq_name);
1675*4882a593Smuzhiyun 		if (!priv->ring[i].workqueue)
1676*4882a593Smuzhiyun 			return -ENOMEM;
1677*4882a593Smuzhiyun 
1678*4882a593Smuzhiyun 		priv->ring[i].requests = 0;
1679*4882a593Smuzhiyun 		priv->ring[i].busy = false;
1680*4882a593Smuzhiyun 
1681*4882a593Smuzhiyun 		crypto_init_queue(&priv->ring[i].queue,
1682*4882a593Smuzhiyun 				  EIP197_DEFAULT_RING_SIZE);
1683*4882a593Smuzhiyun 
1684*4882a593Smuzhiyun 		spin_lock_init(&priv->ring[i].lock);
1685*4882a593Smuzhiyun 		spin_lock_init(&priv->ring[i].queue_lock);
1686*4882a593Smuzhiyun 	}
1687*4882a593Smuzhiyun 
1688*4882a593Smuzhiyun 	atomic_set(&priv->ring_used, 0);
1689*4882a593Smuzhiyun 
1690*4882a593Smuzhiyun 	ret = safexcel_hw_init(priv);
1691*4882a593Smuzhiyun 	if (ret) {
1692*4882a593Smuzhiyun 		dev_err(dev, "HW init failed (%d)\n", ret);
1693*4882a593Smuzhiyun 		return ret;
1694*4882a593Smuzhiyun 	}
1695*4882a593Smuzhiyun 
1696*4882a593Smuzhiyun 	ret = safexcel_register_algorithms(priv);
1697*4882a593Smuzhiyun 	if (ret) {
1698*4882a593Smuzhiyun 		dev_err(dev, "Failed to register algorithms (%d)\n", ret);
1699*4882a593Smuzhiyun 		return ret;
1700*4882a593Smuzhiyun 	}
1701*4882a593Smuzhiyun 
1702*4882a593Smuzhiyun 	return 0;
1703*4882a593Smuzhiyun }
1704*4882a593Smuzhiyun 
safexcel_hw_reset_rings(struct safexcel_crypto_priv * priv)1705*4882a593Smuzhiyun static void safexcel_hw_reset_rings(struct safexcel_crypto_priv *priv)
1706*4882a593Smuzhiyun {
1707*4882a593Smuzhiyun 	int i;
1708*4882a593Smuzhiyun 
1709*4882a593Smuzhiyun 	for (i = 0; i < priv->config.rings; i++) {
1710*4882a593Smuzhiyun 		/* clear any pending interrupt */
1711*4882a593Smuzhiyun 		writel(GENMASK(5, 0), EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_STAT);
1712*4882a593Smuzhiyun 		writel(GENMASK(7, 0), EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_STAT);
1713*4882a593Smuzhiyun 
1714*4882a593Smuzhiyun 		/* Reset the CDR base address */
1715*4882a593Smuzhiyun 		writel(0, EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_RING_BASE_ADDR_LO);
1716*4882a593Smuzhiyun 		writel(0, EIP197_HIA_CDR(priv, i) + EIP197_HIA_xDR_RING_BASE_ADDR_HI);
1717*4882a593Smuzhiyun 
1718*4882a593Smuzhiyun 		/* Reset the RDR base address */
1719*4882a593Smuzhiyun 		writel(0, EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_RING_BASE_ADDR_LO);
1720*4882a593Smuzhiyun 		writel(0, EIP197_HIA_RDR(priv, i) + EIP197_HIA_xDR_RING_BASE_ADDR_HI);
1721*4882a593Smuzhiyun 	}
1722*4882a593Smuzhiyun }
1723*4882a593Smuzhiyun 
1724*4882a593Smuzhiyun /* for Device Tree platform driver */
1725*4882a593Smuzhiyun 
safexcel_probe(struct platform_device * pdev)1726*4882a593Smuzhiyun static int safexcel_probe(struct platform_device *pdev)
1727*4882a593Smuzhiyun {
1728*4882a593Smuzhiyun 	struct device *dev = &pdev->dev;
1729*4882a593Smuzhiyun 	struct safexcel_crypto_priv *priv;
1730*4882a593Smuzhiyun 	int ret;
1731*4882a593Smuzhiyun 
1732*4882a593Smuzhiyun 	priv = devm_kzalloc(dev, sizeof(*priv), GFP_KERNEL);
1733*4882a593Smuzhiyun 	if (!priv)
1734*4882a593Smuzhiyun 		return -ENOMEM;
1735*4882a593Smuzhiyun 
1736*4882a593Smuzhiyun 	priv->dev = dev;
1737*4882a593Smuzhiyun 	priv->version = (enum safexcel_eip_version)of_device_get_match_data(dev);
1738*4882a593Smuzhiyun 
1739*4882a593Smuzhiyun 	platform_set_drvdata(pdev, priv);
1740*4882a593Smuzhiyun 
1741*4882a593Smuzhiyun 	priv->base = devm_platform_ioremap_resource(pdev, 0);
1742*4882a593Smuzhiyun 	if (IS_ERR(priv->base)) {
1743*4882a593Smuzhiyun 		dev_err(dev, "failed to get resource\n");
1744*4882a593Smuzhiyun 		return PTR_ERR(priv->base);
1745*4882a593Smuzhiyun 	}
1746*4882a593Smuzhiyun 
1747*4882a593Smuzhiyun 	priv->clk = devm_clk_get(&pdev->dev, NULL);
1748*4882a593Smuzhiyun 	ret = PTR_ERR_OR_ZERO(priv->clk);
1749*4882a593Smuzhiyun 	/* The clock isn't mandatory */
1750*4882a593Smuzhiyun 	if  (ret != -ENOENT) {
1751*4882a593Smuzhiyun 		if (ret)
1752*4882a593Smuzhiyun 			return ret;
1753*4882a593Smuzhiyun 
1754*4882a593Smuzhiyun 		ret = clk_prepare_enable(priv->clk);
1755*4882a593Smuzhiyun 		if (ret) {
1756*4882a593Smuzhiyun 			dev_err(dev, "unable to enable clk (%d)\n", ret);
1757*4882a593Smuzhiyun 			return ret;
1758*4882a593Smuzhiyun 		}
1759*4882a593Smuzhiyun 	}
1760*4882a593Smuzhiyun 
1761*4882a593Smuzhiyun 	priv->reg_clk = devm_clk_get(&pdev->dev, "reg");
1762*4882a593Smuzhiyun 	ret = PTR_ERR_OR_ZERO(priv->reg_clk);
1763*4882a593Smuzhiyun 	/* The clock isn't mandatory */
1764*4882a593Smuzhiyun 	if  (ret != -ENOENT) {
1765*4882a593Smuzhiyun 		if (ret)
1766*4882a593Smuzhiyun 			goto err_core_clk;
1767*4882a593Smuzhiyun 
1768*4882a593Smuzhiyun 		ret = clk_prepare_enable(priv->reg_clk);
1769*4882a593Smuzhiyun 		if (ret) {
1770*4882a593Smuzhiyun 			dev_err(dev, "unable to enable reg clk (%d)\n", ret);
1771*4882a593Smuzhiyun 			goto err_core_clk;
1772*4882a593Smuzhiyun 		}
1773*4882a593Smuzhiyun 	}
1774*4882a593Smuzhiyun 
1775*4882a593Smuzhiyun 	ret = dma_set_mask_and_coherent(dev, DMA_BIT_MASK(64));
1776*4882a593Smuzhiyun 	if (ret)
1777*4882a593Smuzhiyun 		goto err_reg_clk;
1778*4882a593Smuzhiyun 
1779*4882a593Smuzhiyun 	/* Generic EIP97/EIP197 device probing */
1780*4882a593Smuzhiyun 	ret = safexcel_probe_generic(pdev, priv, 0);
1781*4882a593Smuzhiyun 	if (ret)
1782*4882a593Smuzhiyun 		goto err_reg_clk;
1783*4882a593Smuzhiyun 
1784*4882a593Smuzhiyun 	return 0;
1785*4882a593Smuzhiyun 
1786*4882a593Smuzhiyun err_reg_clk:
1787*4882a593Smuzhiyun 	clk_disable_unprepare(priv->reg_clk);
1788*4882a593Smuzhiyun err_core_clk:
1789*4882a593Smuzhiyun 	clk_disable_unprepare(priv->clk);
1790*4882a593Smuzhiyun 	return ret;
1791*4882a593Smuzhiyun }
1792*4882a593Smuzhiyun 
safexcel_remove(struct platform_device * pdev)1793*4882a593Smuzhiyun static int safexcel_remove(struct platform_device *pdev)
1794*4882a593Smuzhiyun {
1795*4882a593Smuzhiyun 	struct safexcel_crypto_priv *priv = platform_get_drvdata(pdev);
1796*4882a593Smuzhiyun 	int i;
1797*4882a593Smuzhiyun 
1798*4882a593Smuzhiyun 	safexcel_unregister_algorithms(priv);
1799*4882a593Smuzhiyun 	safexcel_hw_reset_rings(priv);
1800*4882a593Smuzhiyun 
1801*4882a593Smuzhiyun 	clk_disable_unprepare(priv->reg_clk);
1802*4882a593Smuzhiyun 	clk_disable_unprepare(priv->clk);
1803*4882a593Smuzhiyun 
1804*4882a593Smuzhiyun 	for (i = 0; i < priv->config.rings; i++) {
1805*4882a593Smuzhiyun 		irq_set_affinity_hint(priv->ring[i].irq, NULL);
1806*4882a593Smuzhiyun 		destroy_workqueue(priv->ring[i].workqueue);
1807*4882a593Smuzhiyun 	}
1808*4882a593Smuzhiyun 
1809*4882a593Smuzhiyun 	return 0;
1810*4882a593Smuzhiyun }
1811*4882a593Smuzhiyun 
1812*4882a593Smuzhiyun static const struct of_device_id safexcel_of_match_table[] = {
1813*4882a593Smuzhiyun 	{
1814*4882a593Smuzhiyun 		.compatible = "inside-secure,safexcel-eip97ies",
1815*4882a593Smuzhiyun 		.data = (void *)EIP97IES_MRVL,
1816*4882a593Smuzhiyun 	},
1817*4882a593Smuzhiyun 	{
1818*4882a593Smuzhiyun 		.compatible = "inside-secure,safexcel-eip197b",
1819*4882a593Smuzhiyun 		.data = (void *)EIP197B_MRVL,
1820*4882a593Smuzhiyun 	},
1821*4882a593Smuzhiyun 	{
1822*4882a593Smuzhiyun 		.compatible = "inside-secure,safexcel-eip197d",
1823*4882a593Smuzhiyun 		.data = (void *)EIP197D_MRVL,
1824*4882a593Smuzhiyun 	},
1825*4882a593Smuzhiyun 	/* For backward compatibility and intended for generic use */
1826*4882a593Smuzhiyun 	{
1827*4882a593Smuzhiyun 		.compatible = "inside-secure,safexcel-eip97",
1828*4882a593Smuzhiyun 		.data = (void *)EIP97IES_MRVL,
1829*4882a593Smuzhiyun 	},
1830*4882a593Smuzhiyun 	{
1831*4882a593Smuzhiyun 		.compatible = "inside-secure,safexcel-eip197",
1832*4882a593Smuzhiyun 		.data = (void *)EIP197B_MRVL,
1833*4882a593Smuzhiyun 	},
1834*4882a593Smuzhiyun 	{},
1835*4882a593Smuzhiyun };
1836*4882a593Smuzhiyun 
1837*4882a593Smuzhiyun MODULE_DEVICE_TABLE(of, safexcel_of_match_table);
1838*4882a593Smuzhiyun 
1839*4882a593Smuzhiyun static struct platform_driver  crypto_safexcel = {
1840*4882a593Smuzhiyun 	.probe		= safexcel_probe,
1841*4882a593Smuzhiyun 	.remove		= safexcel_remove,
1842*4882a593Smuzhiyun 	.driver		= {
1843*4882a593Smuzhiyun 		.name	= "crypto-safexcel",
1844*4882a593Smuzhiyun 		.of_match_table = safexcel_of_match_table,
1845*4882a593Smuzhiyun 	},
1846*4882a593Smuzhiyun };
1847*4882a593Smuzhiyun 
1848*4882a593Smuzhiyun /* PCIE devices - i.e. Inside Secure development boards */
1849*4882a593Smuzhiyun 
safexcel_pci_probe(struct pci_dev * pdev,const struct pci_device_id * ent)1850*4882a593Smuzhiyun static int safexcel_pci_probe(struct pci_dev *pdev,
1851*4882a593Smuzhiyun 			       const struct pci_device_id *ent)
1852*4882a593Smuzhiyun {
1853*4882a593Smuzhiyun 	struct device *dev = &pdev->dev;
1854*4882a593Smuzhiyun 	struct safexcel_crypto_priv *priv;
1855*4882a593Smuzhiyun 	void __iomem *pciebase;
1856*4882a593Smuzhiyun 	int rc;
1857*4882a593Smuzhiyun 	u32 val;
1858*4882a593Smuzhiyun 
1859*4882a593Smuzhiyun 	dev_dbg(dev, "Probing PCIE device: vendor %04x, device %04x, subv %04x, subdev %04x, ctxt %lx\n",
1860*4882a593Smuzhiyun 		ent->vendor, ent->device, ent->subvendor,
1861*4882a593Smuzhiyun 		ent->subdevice, ent->driver_data);
1862*4882a593Smuzhiyun 
1863*4882a593Smuzhiyun 	priv = kzalloc(sizeof(*priv), GFP_KERNEL);
1864*4882a593Smuzhiyun 	if (!priv)
1865*4882a593Smuzhiyun 		return -ENOMEM;
1866*4882a593Smuzhiyun 
1867*4882a593Smuzhiyun 	priv->dev = dev;
1868*4882a593Smuzhiyun 	priv->version = (enum safexcel_eip_version)ent->driver_data;
1869*4882a593Smuzhiyun 
1870*4882a593Smuzhiyun 	pci_set_drvdata(pdev, priv);
1871*4882a593Smuzhiyun 
1872*4882a593Smuzhiyun 	/* enable the device */
1873*4882a593Smuzhiyun 	rc = pcim_enable_device(pdev);
1874*4882a593Smuzhiyun 	if (rc) {
1875*4882a593Smuzhiyun 		dev_err(dev, "Failed to enable PCI device\n");
1876*4882a593Smuzhiyun 		return rc;
1877*4882a593Smuzhiyun 	}
1878*4882a593Smuzhiyun 
1879*4882a593Smuzhiyun 	/* take ownership of PCI BAR0 */
1880*4882a593Smuzhiyun 	rc = pcim_iomap_regions(pdev, 1, "crypto_safexcel");
1881*4882a593Smuzhiyun 	if (rc) {
1882*4882a593Smuzhiyun 		dev_err(dev, "Failed to map IO region for BAR0\n");
1883*4882a593Smuzhiyun 		return rc;
1884*4882a593Smuzhiyun 	}
1885*4882a593Smuzhiyun 	priv->base = pcim_iomap_table(pdev)[0];
1886*4882a593Smuzhiyun 
1887*4882a593Smuzhiyun 	if (priv->version == EIP197_DEVBRD) {
1888*4882a593Smuzhiyun 		dev_dbg(dev, "Device identified as FPGA based development board - applying HW reset\n");
1889*4882a593Smuzhiyun 
1890*4882a593Smuzhiyun 		rc = pcim_iomap_regions(pdev, 4, "crypto_safexcel");
1891*4882a593Smuzhiyun 		if (rc) {
1892*4882a593Smuzhiyun 			dev_err(dev, "Failed to map IO region for BAR4\n");
1893*4882a593Smuzhiyun 			return rc;
1894*4882a593Smuzhiyun 		}
1895*4882a593Smuzhiyun 
1896*4882a593Smuzhiyun 		pciebase = pcim_iomap_table(pdev)[2];
1897*4882a593Smuzhiyun 		val = readl(pciebase + EIP197_XLX_IRQ_BLOCK_ID_ADDR);
1898*4882a593Smuzhiyun 		if ((val >> 16) == EIP197_XLX_IRQ_BLOCK_ID_VALUE) {
1899*4882a593Smuzhiyun 			dev_dbg(dev, "Detected Xilinx PCIE IRQ block version %d, multiple MSI support enabled\n",
1900*4882a593Smuzhiyun 				(val & 0xff));
1901*4882a593Smuzhiyun 
1902*4882a593Smuzhiyun 			/* Setup MSI identity map mapping */
1903*4882a593Smuzhiyun 			writel(EIP197_XLX_USER_VECT_LUT0_IDENT,
1904*4882a593Smuzhiyun 			       pciebase + EIP197_XLX_USER_VECT_LUT0_ADDR);
1905*4882a593Smuzhiyun 			writel(EIP197_XLX_USER_VECT_LUT1_IDENT,
1906*4882a593Smuzhiyun 			       pciebase + EIP197_XLX_USER_VECT_LUT1_ADDR);
1907*4882a593Smuzhiyun 			writel(EIP197_XLX_USER_VECT_LUT2_IDENT,
1908*4882a593Smuzhiyun 			       pciebase + EIP197_XLX_USER_VECT_LUT2_ADDR);
1909*4882a593Smuzhiyun 			writel(EIP197_XLX_USER_VECT_LUT3_IDENT,
1910*4882a593Smuzhiyun 			       pciebase + EIP197_XLX_USER_VECT_LUT3_ADDR);
1911*4882a593Smuzhiyun 
1912*4882a593Smuzhiyun 			/* Enable all device interrupts */
1913*4882a593Smuzhiyun 			writel(GENMASK(31, 0),
1914*4882a593Smuzhiyun 			       pciebase + EIP197_XLX_USER_INT_ENB_MSK);
1915*4882a593Smuzhiyun 		} else {
1916*4882a593Smuzhiyun 			dev_err(dev, "Unrecognised IRQ block identifier %x\n",
1917*4882a593Smuzhiyun 				val);
1918*4882a593Smuzhiyun 			return -ENODEV;
1919*4882a593Smuzhiyun 		}
1920*4882a593Smuzhiyun 
1921*4882a593Smuzhiyun 		/* HW reset FPGA dev board */
1922*4882a593Smuzhiyun 		/* assert reset */
1923*4882a593Smuzhiyun 		writel(1, priv->base + EIP197_XLX_GPIO_BASE);
1924*4882a593Smuzhiyun 		wmb(); /* maintain strict ordering for accesses here */
1925*4882a593Smuzhiyun 		/* deassert reset */
1926*4882a593Smuzhiyun 		writel(0, priv->base + EIP197_XLX_GPIO_BASE);
1927*4882a593Smuzhiyun 		wmb(); /* maintain strict ordering for accesses here */
1928*4882a593Smuzhiyun 	}
1929*4882a593Smuzhiyun 
1930*4882a593Smuzhiyun 	/* enable bus mastering */
1931*4882a593Smuzhiyun 	pci_set_master(pdev);
1932*4882a593Smuzhiyun 
1933*4882a593Smuzhiyun 	/* Generic EIP97/EIP197 device probing */
1934*4882a593Smuzhiyun 	rc = safexcel_probe_generic(pdev, priv, 1);
1935*4882a593Smuzhiyun 	return rc;
1936*4882a593Smuzhiyun }
1937*4882a593Smuzhiyun 
safexcel_pci_remove(struct pci_dev * pdev)1938*4882a593Smuzhiyun static void safexcel_pci_remove(struct pci_dev *pdev)
1939*4882a593Smuzhiyun {
1940*4882a593Smuzhiyun 	struct safexcel_crypto_priv *priv = pci_get_drvdata(pdev);
1941*4882a593Smuzhiyun 	int i;
1942*4882a593Smuzhiyun 
1943*4882a593Smuzhiyun 	safexcel_unregister_algorithms(priv);
1944*4882a593Smuzhiyun 
1945*4882a593Smuzhiyun 	for (i = 0; i < priv->config.rings; i++)
1946*4882a593Smuzhiyun 		destroy_workqueue(priv->ring[i].workqueue);
1947*4882a593Smuzhiyun 
1948*4882a593Smuzhiyun 	safexcel_hw_reset_rings(priv);
1949*4882a593Smuzhiyun }
1950*4882a593Smuzhiyun 
1951*4882a593Smuzhiyun static const struct pci_device_id safexcel_pci_ids[] = {
1952*4882a593Smuzhiyun 	{
1953*4882a593Smuzhiyun 		PCI_DEVICE_SUB(PCI_VENDOR_ID_XILINX, 0x9038,
1954*4882a593Smuzhiyun 			       0x16ae, 0xc522),
1955*4882a593Smuzhiyun 		.driver_data = EIP197_DEVBRD,
1956*4882a593Smuzhiyun 	},
1957*4882a593Smuzhiyun 	{},
1958*4882a593Smuzhiyun };
1959*4882a593Smuzhiyun 
1960*4882a593Smuzhiyun MODULE_DEVICE_TABLE(pci, safexcel_pci_ids);
1961*4882a593Smuzhiyun 
1962*4882a593Smuzhiyun static struct pci_driver safexcel_pci_driver = {
1963*4882a593Smuzhiyun 	.name          = "crypto-safexcel",
1964*4882a593Smuzhiyun 	.id_table      = safexcel_pci_ids,
1965*4882a593Smuzhiyun 	.probe         = safexcel_pci_probe,
1966*4882a593Smuzhiyun 	.remove        = safexcel_pci_remove,
1967*4882a593Smuzhiyun };
1968*4882a593Smuzhiyun 
safexcel_init(void)1969*4882a593Smuzhiyun static int __init safexcel_init(void)
1970*4882a593Smuzhiyun {
1971*4882a593Smuzhiyun 	int ret;
1972*4882a593Smuzhiyun 
1973*4882a593Smuzhiyun 	/* Register PCI driver */
1974*4882a593Smuzhiyun 	ret = pci_register_driver(&safexcel_pci_driver);
1975*4882a593Smuzhiyun 
1976*4882a593Smuzhiyun 	/* Register platform driver */
1977*4882a593Smuzhiyun 	if (IS_ENABLED(CONFIG_OF) && !ret) {
1978*4882a593Smuzhiyun 		ret = platform_driver_register(&crypto_safexcel);
1979*4882a593Smuzhiyun 		if (ret)
1980*4882a593Smuzhiyun 			pci_unregister_driver(&safexcel_pci_driver);
1981*4882a593Smuzhiyun 	}
1982*4882a593Smuzhiyun 
1983*4882a593Smuzhiyun 	return ret;
1984*4882a593Smuzhiyun }
1985*4882a593Smuzhiyun 
safexcel_exit(void)1986*4882a593Smuzhiyun static void __exit safexcel_exit(void)
1987*4882a593Smuzhiyun {
1988*4882a593Smuzhiyun 	/* Unregister platform driver */
1989*4882a593Smuzhiyun 	if (IS_ENABLED(CONFIG_OF))
1990*4882a593Smuzhiyun 		platform_driver_unregister(&crypto_safexcel);
1991*4882a593Smuzhiyun 
1992*4882a593Smuzhiyun 	/* Unregister PCI driver if successfully registered before */
1993*4882a593Smuzhiyun 	pci_unregister_driver(&safexcel_pci_driver);
1994*4882a593Smuzhiyun }
1995*4882a593Smuzhiyun 
1996*4882a593Smuzhiyun module_init(safexcel_init);
1997*4882a593Smuzhiyun module_exit(safexcel_exit);
1998*4882a593Smuzhiyun 
1999*4882a593Smuzhiyun MODULE_AUTHOR("Antoine Tenart <antoine.tenart@free-electrons.com>");
2000*4882a593Smuzhiyun MODULE_AUTHOR("Ofer Heifetz <oferh@marvell.com>");
2001*4882a593Smuzhiyun MODULE_AUTHOR("Igal Liberman <igall@marvell.com>");
2002*4882a593Smuzhiyun MODULE_DESCRIPTION("Support for SafeXcel cryptographic engines: EIP97 & EIP197");
2003*4882a593Smuzhiyun MODULE_LICENSE("GPL v2");
2004*4882a593Smuzhiyun MODULE_IMPORT_NS(CRYPTO_INTERNAL);
2005