1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * Copyright 2008-2014 Freescale Semiconductor, Inc.
3*4882a593Smuzhiyun *
4*4882a593Smuzhiyun * SPDX-License-Identifier: GPL-2.0+
5*4882a593Smuzhiyun *
6*4882a593Smuzhiyun * Based on CAAM driver in drivers/crypto/caam in Linux
7*4882a593Smuzhiyun */
8*4882a593Smuzhiyun
9*4882a593Smuzhiyun #include <common.h>
10*4882a593Smuzhiyun #include <malloc.h>
11*4882a593Smuzhiyun #include "fsl_sec.h"
12*4882a593Smuzhiyun #include "jr.h"
13*4882a593Smuzhiyun #include "jobdesc.h"
14*4882a593Smuzhiyun #include "desc_constr.h"
15*4882a593Smuzhiyun #ifdef CONFIG_FSL_CORENET
16*4882a593Smuzhiyun #include <asm/fsl_pamu.h>
17*4882a593Smuzhiyun #endif
18*4882a593Smuzhiyun
19*4882a593Smuzhiyun #define CIRC_CNT(head, tail, size) (((head) - (tail)) & (size - 1))
20*4882a593Smuzhiyun #define CIRC_SPACE(head, tail, size) CIRC_CNT((tail), (head) + 1, (size))
21*4882a593Smuzhiyun
22*4882a593Smuzhiyun uint32_t sec_offset[CONFIG_SYS_FSL_MAX_NUM_OF_SEC] = {
23*4882a593Smuzhiyun 0,
24*4882a593Smuzhiyun #if defined(CONFIG_ARCH_C29X)
25*4882a593Smuzhiyun CONFIG_SYS_FSL_SEC_IDX_OFFSET,
26*4882a593Smuzhiyun 2 * CONFIG_SYS_FSL_SEC_IDX_OFFSET
27*4882a593Smuzhiyun #endif
28*4882a593Smuzhiyun };
29*4882a593Smuzhiyun
30*4882a593Smuzhiyun #define SEC_ADDR(idx) \
31*4882a593Smuzhiyun ((CONFIG_SYS_FSL_SEC_ADDR + sec_offset[idx]))
32*4882a593Smuzhiyun
33*4882a593Smuzhiyun #define SEC_JR0_ADDR(idx) \
34*4882a593Smuzhiyun (SEC_ADDR(idx) + \
35*4882a593Smuzhiyun (CONFIG_SYS_FSL_JR0_OFFSET - CONFIG_SYS_FSL_SEC_OFFSET))
36*4882a593Smuzhiyun
37*4882a593Smuzhiyun struct jobring jr0[CONFIG_SYS_FSL_MAX_NUM_OF_SEC];
38*4882a593Smuzhiyun
start_jr0(uint8_t sec_idx)39*4882a593Smuzhiyun static inline void start_jr0(uint8_t sec_idx)
40*4882a593Smuzhiyun {
41*4882a593Smuzhiyun ccsr_sec_t *sec = (void *)SEC_ADDR(sec_idx);
42*4882a593Smuzhiyun u32 ctpr_ms = sec_in32(&sec->ctpr_ms);
43*4882a593Smuzhiyun u32 scfgr = sec_in32(&sec->scfgr);
44*4882a593Smuzhiyun
45*4882a593Smuzhiyun if (ctpr_ms & SEC_CTPR_MS_VIRT_EN_INCL) {
46*4882a593Smuzhiyun /* VIRT_EN_INCL = 1 & VIRT_EN_POR = 1 or
47*4882a593Smuzhiyun * VIRT_EN_INCL = 1 & VIRT_EN_POR = 0 & SEC_SCFGR_VIRT_EN = 1
48*4882a593Smuzhiyun */
49*4882a593Smuzhiyun if ((ctpr_ms & SEC_CTPR_MS_VIRT_EN_POR) ||
50*4882a593Smuzhiyun (scfgr & SEC_SCFGR_VIRT_EN))
51*4882a593Smuzhiyun sec_out32(&sec->jrstartr, CONFIG_JRSTARTR_JR0);
52*4882a593Smuzhiyun } else {
53*4882a593Smuzhiyun /* VIRT_EN_INCL = 0 && VIRT_EN_POR_VALUE = 1 */
54*4882a593Smuzhiyun if (ctpr_ms & SEC_CTPR_MS_VIRT_EN_POR)
55*4882a593Smuzhiyun sec_out32(&sec->jrstartr, CONFIG_JRSTARTR_JR0);
56*4882a593Smuzhiyun }
57*4882a593Smuzhiyun }
58*4882a593Smuzhiyun
jr_reset_liodn(uint8_t sec_idx)59*4882a593Smuzhiyun static inline void jr_reset_liodn(uint8_t sec_idx)
60*4882a593Smuzhiyun {
61*4882a593Smuzhiyun ccsr_sec_t *sec = (void *)SEC_ADDR(sec_idx);
62*4882a593Smuzhiyun sec_out32(&sec->jrliodnr[0].ls, 0);
63*4882a593Smuzhiyun }
64*4882a593Smuzhiyun
jr_disable_irq(uint8_t sec_idx)65*4882a593Smuzhiyun static inline void jr_disable_irq(uint8_t sec_idx)
66*4882a593Smuzhiyun {
67*4882a593Smuzhiyun struct jr_regs *regs = (struct jr_regs *)SEC_JR0_ADDR(sec_idx);
68*4882a593Smuzhiyun uint32_t jrcfg = sec_in32(®s->jrcfg1);
69*4882a593Smuzhiyun
70*4882a593Smuzhiyun jrcfg = jrcfg | JR_INTMASK;
71*4882a593Smuzhiyun
72*4882a593Smuzhiyun sec_out32(®s->jrcfg1, jrcfg);
73*4882a593Smuzhiyun }
74*4882a593Smuzhiyun
jr_initregs(uint8_t sec_idx)75*4882a593Smuzhiyun static void jr_initregs(uint8_t sec_idx)
76*4882a593Smuzhiyun {
77*4882a593Smuzhiyun struct jr_regs *regs = (struct jr_regs *)SEC_JR0_ADDR(sec_idx);
78*4882a593Smuzhiyun struct jobring *jr = &jr0[sec_idx];
79*4882a593Smuzhiyun phys_addr_t ip_base = virt_to_phys((void *)jr->input_ring);
80*4882a593Smuzhiyun phys_addr_t op_base = virt_to_phys((void *)jr->output_ring);
81*4882a593Smuzhiyun
82*4882a593Smuzhiyun #ifdef CONFIG_PHYS_64BIT
83*4882a593Smuzhiyun sec_out32(®s->irba_h, ip_base >> 32);
84*4882a593Smuzhiyun #else
85*4882a593Smuzhiyun sec_out32(®s->irba_h, 0x0);
86*4882a593Smuzhiyun #endif
87*4882a593Smuzhiyun sec_out32(®s->irba_l, (uint32_t)ip_base);
88*4882a593Smuzhiyun #ifdef CONFIG_PHYS_64BIT
89*4882a593Smuzhiyun sec_out32(®s->orba_h, op_base >> 32);
90*4882a593Smuzhiyun #else
91*4882a593Smuzhiyun sec_out32(®s->orba_h, 0x0);
92*4882a593Smuzhiyun #endif
93*4882a593Smuzhiyun sec_out32(®s->orba_l, (uint32_t)op_base);
94*4882a593Smuzhiyun sec_out32(®s->ors, JR_SIZE);
95*4882a593Smuzhiyun sec_out32(®s->irs, JR_SIZE);
96*4882a593Smuzhiyun
97*4882a593Smuzhiyun if (!jr->irq)
98*4882a593Smuzhiyun jr_disable_irq(sec_idx);
99*4882a593Smuzhiyun }
100*4882a593Smuzhiyun
jr_init(uint8_t sec_idx)101*4882a593Smuzhiyun static int jr_init(uint8_t sec_idx)
102*4882a593Smuzhiyun {
103*4882a593Smuzhiyun struct jobring *jr = &jr0[sec_idx];
104*4882a593Smuzhiyun
105*4882a593Smuzhiyun memset(jr, 0, sizeof(struct jobring));
106*4882a593Smuzhiyun
107*4882a593Smuzhiyun jr->jq_id = DEFAULT_JR_ID;
108*4882a593Smuzhiyun jr->irq = DEFAULT_IRQ;
109*4882a593Smuzhiyun
110*4882a593Smuzhiyun #ifdef CONFIG_FSL_CORENET
111*4882a593Smuzhiyun jr->liodn = DEFAULT_JR_LIODN;
112*4882a593Smuzhiyun #endif
113*4882a593Smuzhiyun jr->size = JR_SIZE;
114*4882a593Smuzhiyun jr->input_ring = (dma_addr_t *)memalign(ARCH_DMA_MINALIGN,
115*4882a593Smuzhiyun JR_SIZE * sizeof(dma_addr_t));
116*4882a593Smuzhiyun if (!jr->input_ring)
117*4882a593Smuzhiyun return -1;
118*4882a593Smuzhiyun
119*4882a593Smuzhiyun jr->op_size = roundup(JR_SIZE * sizeof(struct op_ring),
120*4882a593Smuzhiyun ARCH_DMA_MINALIGN);
121*4882a593Smuzhiyun jr->output_ring =
122*4882a593Smuzhiyun (struct op_ring *)memalign(ARCH_DMA_MINALIGN, jr->op_size);
123*4882a593Smuzhiyun if (!jr->output_ring)
124*4882a593Smuzhiyun return -1;
125*4882a593Smuzhiyun
126*4882a593Smuzhiyun memset(jr->input_ring, 0, JR_SIZE * sizeof(dma_addr_t));
127*4882a593Smuzhiyun memset(jr->output_ring, 0, jr->op_size);
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun start_jr0(sec_idx);
130*4882a593Smuzhiyun
131*4882a593Smuzhiyun jr_initregs(sec_idx);
132*4882a593Smuzhiyun
133*4882a593Smuzhiyun return 0;
134*4882a593Smuzhiyun }
135*4882a593Smuzhiyun
jr_sw_cleanup(uint8_t sec_idx)136*4882a593Smuzhiyun static int jr_sw_cleanup(uint8_t sec_idx)
137*4882a593Smuzhiyun {
138*4882a593Smuzhiyun struct jobring *jr = &jr0[sec_idx];
139*4882a593Smuzhiyun
140*4882a593Smuzhiyun jr->head = 0;
141*4882a593Smuzhiyun jr->tail = 0;
142*4882a593Smuzhiyun jr->read_idx = 0;
143*4882a593Smuzhiyun jr->write_idx = 0;
144*4882a593Smuzhiyun memset(jr->info, 0, sizeof(jr->info));
145*4882a593Smuzhiyun memset(jr->input_ring, 0, jr->size * sizeof(dma_addr_t));
146*4882a593Smuzhiyun memset(jr->output_ring, 0, jr->size * sizeof(struct op_ring));
147*4882a593Smuzhiyun
148*4882a593Smuzhiyun return 0;
149*4882a593Smuzhiyun }
150*4882a593Smuzhiyun
jr_hw_reset(uint8_t sec_idx)151*4882a593Smuzhiyun static int jr_hw_reset(uint8_t sec_idx)
152*4882a593Smuzhiyun {
153*4882a593Smuzhiyun struct jr_regs *regs = (struct jr_regs *)SEC_JR0_ADDR(sec_idx);
154*4882a593Smuzhiyun uint32_t timeout = 100000;
155*4882a593Smuzhiyun uint32_t jrint, jrcr;
156*4882a593Smuzhiyun
157*4882a593Smuzhiyun sec_out32(®s->jrcr, JRCR_RESET);
158*4882a593Smuzhiyun do {
159*4882a593Smuzhiyun jrint = sec_in32(®s->jrint);
160*4882a593Smuzhiyun } while (((jrint & JRINT_ERR_HALT_MASK) ==
161*4882a593Smuzhiyun JRINT_ERR_HALT_INPROGRESS) && --timeout);
162*4882a593Smuzhiyun
163*4882a593Smuzhiyun jrint = sec_in32(®s->jrint);
164*4882a593Smuzhiyun if (((jrint & JRINT_ERR_HALT_MASK) !=
165*4882a593Smuzhiyun JRINT_ERR_HALT_INPROGRESS) && timeout == 0)
166*4882a593Smuzhiyun return -1;
167*4882a593Smuzhiyun
168*4882a593Smuzhiyun timeout = 100000;
169*4882a593Smuzhiyun sec_out32(®s->jrcr, JRCR_RESET);
170*4882a593Smuzhiyun do {
171*4882a593Smuzhiyun jrcr = sec_in32(®s->jrcr);
172*4882a593Smuzhiyun } while ((jrcr & JRCR_RESET) && --timeout);
173*4882a593Smuzhiyun
174*4882a593Smuzhiyun if (timeout == 0)
175*4882a593Smuzhiyun return -1;
176*4882a593Smuzhiyun
177*4882a593Smuzhiyun return 0;
178*4882a593Smuzhiyun }
179*4882a593Smuzhiyun
180*4882a593Smuzhiyun /* -1 --- error, can't enqueue -- no space available */
jr_enqueue(uint32_t * desc_addr,void (* callback)(uint32_t status,void * arg),void * arg,uint8_t sec_idx)181*4882a593Smuzhiyun static int jr_enqueue(uint32_t *desc_addr,
182*4882a593Smuzhiyun void (*callback)(uint32_t status, void *arg),
183*4882a593Smuzhiyun void *arg, uint8_t sec_idx)
184*4882a593Smuzhiyun {
185*4882a593Smuzhiyun struct jr_regs *regs = (struct jr_regs *)SEC_JR0_ADDR(sec_idx);
186*4882a593Smuzhiyun struct jobring *jr = &jr0[sec_idx];
187*4882a593Smuzhiyun int head = jr->head;
188*4882a593Smuzhiyun uint32_t desc_word;
189*4882a593Smuzhiyun int length = desc_len(desc_addr);
190*4882a593Smuzhiyun int i;
191*4882a593Smuzhiyun #ifdef CONFIG_PHYS_64BIT
192*4882a593Smuzhiyun uint32_t *addr_hi, *addr_lo;
193*4882a593Smuzhiyun #endif
194*4882a593Smuzhiyun
195*4882a593Smuzhiyun /* The descriptor must be submitted to SEC block as per endianness
196*4882a593Smuzhiyun * of the SEC Block.
197*4882a593Smuzhiyun * So, if the endianness of Core and SEC block is different, each word
198*4882a593Smuzhiyun * of the descriptor will be byte-swapped.
199*4882a593Smuzhiyun */
200*4882a593Smuzhiyun for (i = 0; i < length; i++) {
201*4882a593Smuzhiyun desc_word = desc_addr[i];
202*4882a593Smuzhiyun sec_out32((uint32_t *)&desc_addr[i], desc_word);
203*4882a593Smuzhiyun }
204*4882a593Smuzhiyun
205*4882a593Smuzhiyun phys_addr_t desc_phys_addr = virt_to_phys(desc_addr);
206*4882a593Smuzhiyun
207*4882a593Smuzhiyun jr->info[head].desc_phys_addr = desc_phys_addr;
208*4882a593Smuzhiyun jr->info[head].callback = (void *)callback;
209*4882a593Smuzhiyun jr->info[head].arg = arg;
210*4882a593Smuzhiyun jr->info[head].op_done = 0;
211*4882a593Smuzhiyun
212*4882a593Smuzhiyun unsigned long start = (unsigned long)&jr->info[head] &
213*4882a593Smuzhiyun ~(ARCH_DMA_MINALIGN - 1);
214*4882a593Smuzhiyun unsigned long end = ALIGN((unsigned long)&jr->info[head] +
215*4882a593Smuzhiyun sizeof(struct jr_info), ARCH_DMA_MINALIGN);
216*4882a593Smuzhiyun flush_dcache_range(start, end);
217*4882a593Smuzhiyun
218*4882a593Smuzhiyun #ifdef CONFIG_PHYS_64BIT
219*4882a593Smuzhiyun /* Write the 64 bit Descriptor address on Input Ring.
220*4882a593Smuzhiyun * The 32 bit hign and low part of the address will
221*4882a593Smuzhiyun * depend on endianness of SEC block.
222*4882a593Smuzhiyun */
223*4882a593Smuzhiyun #ifdef CONFIG_SYS_FSL_SEC_LE
224*4882a593Smuzhiyun addr_lo = (uint32_t *)(&jr->input_ring[head]);
225*4882a593Smuzhiyun addr_hi = (uint32_t *)(&jr->input_ring[head]) + 1;
226*4882a593Smuzhiyun #elif defined(CONFIG_SYS_FSL_SEC_BE)
227*4882a593Smuzhiyun addr_hi = (uint32_t *)(&jr->input_ring[head]);
228*4882a593Smuzhiyun addr_lo = (uint32_t *)(&jr->input_ring[head]) + 1;
229*4882a593Smuzhiyun #endif /* ifdef CONFIG_SYS_FSL_SEC_LE */
230*4882a593Smuzhiyun
231*4882a593Smuzhiyun sec_out32(addr_hi, (uint32_t)(desc_phys_addr >> 32));
232*4882a593Smuzhiyun sec_out32(addr_lo, (uint32_t)(desc_phys_addr));
233*4882a593Smuzhiyun
234*4882a593Smuzhiyun #else
235*4882a593Smuzhiyun /* Write the 32 bit Descriptor address on Input Ring. */
236*4882a593Smuzhiyun sec_out32(&jr->input_ring[head], desc_phys_addr);
237*4882a593Smuzhiyun #endif /* ifdef CONFIG_PHYS_64BIT */
238*4882a593Smuzhiyun
239*4882a593Smuzhiyun start = (unsigned long)&jr->input_ring[head] & ~(ARCH_DMA_MINALIGN - 1);
240*4882a593Smuzhiyun end = ALIGN((unsigned long)&jr->input_ring[head] +
241*4882a593Smuzhiyun sizeof(dma_addr_t), ARCH_DMA_MINALIGN);
242*4882a593Smuzhiyun flush_dcache_range(start, end);
243*4882a593Smuzhiyun
244*4882a593Smuzhiyun jr->head = (head + 1) & (jr->size - 1);
245*4882a593Smuzhiyun
246*4882a593Smuzhiyun /* Invalidate output ring */
247*4882a593Smuzhiyun start = (unsigned long)jr->output_ring &
248*4882a593Smuzhiyun ~(ARCH_DMA_MINALIGN - 1);
249*4882a593Smuzhiyun end = ALIGN((unsigned long)jr->output_ring + jr->op_size,
250*4882a593Smuzhiyun ARCH_DMA_MINALIGN);
251*4882a593Smuzhiyun invalidate_dcache_range(start, end);
252*4882a593Smuzhiyun
253*4882a593Smuzhiyun sec_out32(®s->irja, 1);
254*4882a593Smuzhiyun
255*4882a593Smuzhiyun return 0;
256*4882a593Smuzhiyun }
257*4882a593Smuzhiyun
jr_dequeue(int sec_idx)258*4882a593Smuzhiyun static int jr_dequeue(int sec_idx)
259*4882a593Smuzhiyun {
260*4882a593Smuzhiyun struct jr_regs *regs = (struct jr_regs *)SEC_JR0_ADDR(sec_idx);
261*4882a593Smuzhiyun struct jobring *jr = &jr0[sec_idx];
262*4882a593Smuzhiyun int head = jr->head;
263*4882a593Smuzhiyun int tail = jr->tail;
264*4882a593Smuzhiyun int idx, i, found;
265*4882a593Smuzhiyun void (*callback)(uint32_t status, void *arg);
266*4882a593Smuzhiyun void *arg = NULL;
267*4882a593Smuzhiyun #ifdef CONFIG_PHYS_64BIT
268*4882a593Smuzhiyun uint32_t *addr_hi, *addr_lo;
269*4882a593Smuzhiyun #else
270*4882a593Smuzhiyun uint32_t *addr;
271*4882a593Smuzhiyun #endif
272*4882a593Smuzhiyun
273*4882a593Smuzhiyun while (sec_in32(®s->orsf) && CIRC_CNT(jr->head, jr->tail,
274*4882a593Smuzhiyun jr->size)) {
275*4882a593Smuzhiyun
276*4882a593Smuzhiyun found = 0;
277*4882a593Smuzhiyun
278*4882a593Smuzhiyun phys_addr_t op_desc;
279*4882a593Smuzhiyun #ifdef CONFIG_PHYS_64BIT
280*4882a593Smuzhiyun /* Read the 64 bit Descriptor address from Output Ring.
281*4882a593Smuzhiyun * The 32 bit hign and low part of the address will
282*4882a593Smuzhiyun * depend on endianness of SEC block.
283*4882a593Smuzhiyun */
284*4882a593Smuzhiyun #ifdef CONFIG_SYS_FSL_SEC_LE
285*4882a593Smuzhiyun addr_lo = (uint32_t *)(&jr->output_ring[jr->tail].desc);
286*4882a593Smuzhiyun addr_hi = (uint32_t *)(&jr->output_ring[jr->tail].desc) + 1;
287*4882a593Smuzhiyun #elif defined(CONFIG_SYS_FSL_SEC_BE)
288*4882a593Smuzhiyun addr_hi = (uint32_t *)(&jr->output_ring[jr->tail].desc);
289*4882a593Smuzhiyun addr_lo = (uint32_t *)(&jr->output_ring[jr->tail].desc) + 1;
290*4882a593Smuzhiyun #endif /* ifdef CONFIG_SYS_FSL_SEC_LE */
291*4882a593Smuzhiyun
292*4882a593Smuzhiyun op_desc = ((u64)sec_in32(addr_hi) << 32) |
293*4882a593Smuzhiyun ((u64)sec_in32(addr_lo));
294*4882a593Smuzhiyun
295*4882a593Smuzhiyun #else
296*4882a593Smuzhiyun /* Read the 32 bit Descriptor address from Output Ring. */
297*4882a593Smuzhiyun addr = (uint32_t *)&jr->output_ring[jr->tail].desc;
298*4882a593Smuzhiyun op_desc = sec_in32(addr);
299*4882a593Smuzhiyun #endif /* ifdef CONFIG_PHYS_64BIT */
300*4882a593Smuzhiyun
301*4882a593Smuzhiyun uint32_t status = sec_in32(&jr->output_ring[jr->tail].status);
302*4882a593Smuzhiyun
303*4882a593Smuzhiyun for (i = 0; CIRC_CNT(head, tail + i, jr->size) >= 1; i++) {
304*4882a593Smuzhiyun idx = (tail + i) & (jr->size - 1);
305*4882a593Smuzhiyun if (op_desc == jr->info[idx].desc_phys_addr) {
306*4882a593Smuzhiyun found = 1;
307*4882a593Smuzhiyun break;
308*4882a593Smuzhiyun }
309*4882a593Smuzhiyun }
310*4882a593Smuzhiyun
311*4882a593Smuzhiyun /* Error condition if match not found */
312*4882a593Smuzhiyun if (!found)
313*4882a593Smuzhiyun return -1;
314*4882a593Smuzhiyun
315*4882a593Smuzhiyun jr->info[idx].op_done = 1;
316*4882a593Smuzhiyun callback = (void *)jr->info[idx].callback;
317*4882a593Smuzhiyun arg = jr->info[idx].arg;
318*4882a593Smuzhiyun
319*4882a593Smuzhiyun /* When the job on tail idx gets done, increment
320*4882a593Smuzhiyun * tail till the point where job completed out of oredr has
321*4882a593Smuzhiyun * been taken into account
322*4882a593Smuzhiyun */
323*4882a593Smuzhiyun if (idx == tail)
324*4882a593Smuzhiyun do {
325*4882a593Smuzhiyun tail = (tail + 1) & (jr->size - 1);
326*4882a593Smuzhiyun } while (jr->info[tail].op_done);
327*4882a593Smuzhiyun
328*4882a593Smuzhiyun jr->tail = tail;
329*4882a593Smuzhiyun jr->read_idx = (jr->read_idx + 1) & (jr->size - 1);
330*4882a593Smuzhiyun
331*4882a593Smuzhiyun sec_out32(®s->orjr, 1);
332*4882a593Smuzhiyun jr->info[idx].op_done = 0;
333*4882a593Smuzhiyun
334*4882a593Smuzhiyun callback(status, arg);
335*4882a593Smuzhiyun }
336*4882a593Smuzhiyun
337*4882a593Smuzhiyun return 0;
338*4882a593Smuzhiyun }
339*4882a593Smuzhiyun
desc_done(uint32_t status,void * arg)340*4882a593Smuzhiyun static void desc_done(uint32_t status, void *arg)
341*4882a593Smuzhiyun {
342*4882a593Smuzhiyun struct result *x = arg;
343*4882a593Smuzhiyun x->status = status;
344*4882a593Smuzhiyun #ifndef CONFIG_SPL_BUILD
345*4882a593Smuzhiyun caam_jr_strstatus(status);
346*4882a593Smuzhiyun #endif
347*4882a593Smuzhiyun x->done = 1;
348*4882a593Smuzhiyun }
349*4882a593Smuzhiyun
run_descriptor_jr_idx(uint32_t * desc,uint8_t sec_idx)350*4882a593Smuzhiyun static inline int run_descriptor_jr_idx(uint32_t *desc, uint8_t sec_idx)
351*4882a593Smuzhiyun {
352*4882a593Smuzhiyun unsigned long long timeval = get_ticks();
353*4882a593Smuzhiyun unsigned long long timeout = usec2ticks(CONFIG_SEC_DEQ_TIMEOUT);
354*4882a593Smuzhiyun struct result op;
355*4882a593Smuzhiyun int ret = 0;
356*4882a593Smuzhiyun
357*4882a593Smuzhiyun memset(&op, 0, sizeof(op));
358*4882a593Smuzhiyun
359*4882a593Smuzhiyun ret = jr_enqueue(desc, desc_done, &op, sec_idx);
360*4882a593Smuzhiyun if (ret) {
361*4882a593Smuzhiyun debug("Error in SEC enq\n");
362*4882a593Smuzhiyun ret = JQ_ENQ_ERR;
363*4882a593Smuzhiyun goto out;
364*4882a593Smuzhiyun }
365*4882a593Smuzhiyun
366*4882a593Smuzhiyun timeval = get_ticks();
367*4882a593Smuzhiyun timeout = usec2ticks(CONFIG_SEC_DEQ_TIMEOUT);
368*4882a593Smuzhiyun while (op.done != 1) {
369*4882a593Smuzhiyun ret = jr_dequeue(sec_idx);
370*4882a593Smuzhiyun if (ret) {
371*4882a593Smuzhiyun debug("Error in SEC deq\n");
372*4882a593Smuzhiyun ret = JQ_DEQ_ERR;
373*4882a593Smuzhiyun goto out;
374*4882a593Smuzhiyun }
375*4882a593Smuzhiyun
376*4882a593Smuzhiyun if ((get_ticks() - timeval) > timeout) {
377*4882a593Smuzhiyun debug("SEC Dequeue timed out\n");
378*4882a593Smuzhiyun ret = JQ_DEQ_TO_ERR;
379*4882a593Smuzhiyun goto out;
380*4882a593Smuzhiyun }
381*4882a593Smuzhiyun }
382*4882a593Smuzhiyun
383*4882a593Smuzhiyun if (op.status) {
384*4882a593Smuzhiyun debug("Error %x\n", op.status);
385*4882a593Smuzhiyun ret = op.status;
386*4882a593Smuzhiyun }
387*4882a593Smuzhiyun out:
388*4882a593Smuzhiyun return ret;
389*4882a593Smuzhiyun }
390*4882a593Smuzhiyun
run_descriptor_jr(uint32_t * desc)391*4882a593Smuzhiyun int run_descriptor_jr(uint32_t *desc)
392*4882a593Smuzhiyun {
393*4882a593Smuzhiyun return run_descriptor_jr_idx(desc, 0);
394*4882a593Smuzhiyun }
395*4882a593Smuzhiyun
jr_reset_sec(uint8_t sec_idx)396*4882a593Smuzhiyun static inline int jr_reset_sec(uint8_t sec_idx)
397*4882a593Smuzhiyun {
398*4882a593Smuzhiyun if (jr_hw_reset(sec_idx) < 0)
399*4882a593Smuzhiyun return -1;
400*4882a593Smuzhiyun
401*4882a593Smuzhiyun /* Clean up the jobring structure maintained by software */
402*4882a593Smuzhiyun jr_sw_cleanup(sec_idx);
403*4882a593Smuzhiyun
404*4882a593Smuzhiyun return 0;
405*4882a593Smuzhiyun }
406*4882a593Smuzhiyun
jr_reset(void)407*4882a593Smuzhiyun int jr_reset(void)
408*4882a593Smuzhiyun {
409*4882a593Smuzhiyun return jr_reset_sec(0);
410*4882a593Smuzhiyun }
411*4882a593Smuzhiyun
sec_reset_idx(uint8_t sec_idx)412*4882a593Smuzhiyun static inline int sec_reset_idx(uint8_t sec_idx)
413*4882a593Smuzhiyun {
414*4882a593Smuzhiyun ccsr_sec_t *sec = (void *)SEC_ADDR(sec_idx);
415*4882a593Smuzhiyun uint32_t mcfgr = sec_in32(&sec->mcfgr);
416*4882a593Smuzhiyun uint32_t timeout = 100000;
417*4882a593Smuzhiyun
418*4882a593Smuzhiyun mcfgr |= MCFGR_SWRST;
419*4882a593Smuzhiyun sec_out32(&sec->mcfgr, mcfgr);
420*4882a593Smuzhiyun
421*4882a593Smuzhiyun mcfgr |= MCFGR_DMA_RST;
422*4882a593Smuzhiyun sec_out32(&sec->mcfgr, mcfgr);
423*4882a593Smuzhiyun do {
424*4882a593Smuzhiyun mcfgr = sec_in32(&sec->mcfgr);
425*4882a593Smuzhiyun } while ((mcfgr & MCFGR_DMA_RST) == MCFGR_DMA_RST && --timeout);
426*4882a593Smuzhiyun
427*4882a593Smuzhiyun if (timeout == 0)
428*4882a593Smuzhiyun return -1;
429*4882a593Smuzhiyun
430*4882a593Smuzhiyun timeout = 100000;
431*4882a593Smuzhiyun do {
432*4882a593Smuzhiyun mcfgr = sec_in32(&sec->mcfgr);
433*4882a593Smuzhiyun } while ((mcfgr & MCFGR_SWRST) == MCFGR_SWRST && --timeout);
434*4882a593Smuzhiyun
435*4882a593Smuzhiyun if (timeout == 0)
436*4882a593Smuzhiyun return -1;
437*4882a593Smuzhiyun
438*4882a593Smuzhiyun return 0;
439*4882a593Smuzhiyun }
sec_reset(void)440*4882a593Smuzhiyun int sec_reset(void)
441*4882a593Smuzhiyun {
442*4882a593Smuzhiyun return sec_reset_idx(0);
443*4882a593Smuzhiyun }
444*4882a593Smuzhiyun #ifndef CONFIG_SPL_BUILD
instantiate_rng(uint8_t sec_idx)445*4882a593Smuzhiyun static int instantiate_rng(uint8_t sec_idx)
446*4882a593Smuzhiyun {
447*4882a593Smuzhiyun struct result op;
448*4882a593Smuzhiyun u32 *desc;
449*4882a593Smuzhiyun u32 rdsta_val;
450*4882a593Smuzhiyun int ret = 0;
451*4882a593Smuzhiyun ccsr_sec_t __iomem *sec = (ccsr_sec_t __iomem *)SEC_ADDR(sec_idx);
452*4882a593Smuzhiyun struct rng4tst __iomem *rng =
453*4882a593Smuzhiyun (struct rng4tst __iomem *)&sec->rng;
454*4882a593Smuzhiyun
455*4882a593Smuzhiyun memset(&op, 0, sizeof(struct result));
456*4882a593Smuzhiyun
457*4882a593Smuzhiyun desc = memalign(ARCH_DMA_MINALIGN, sizeof(uint32_t) * 6);
458*4882a593Smuzhiyun if (!desc) {
459*4882a593Smuzhiyun printf("cannot allocate RNG init descriptor memory\n");
460*4882a593Smuzhiyun return -1;
461*4882a593Smuzhiyun }
462*4882a593Smuzhiyun
463*4882a593Smuzhiyun inline_cnstr_jobdesc_rng_instantiation(desc);
464*4882a593Smuzhiyun int size = roundup(sizeof(uint32_t) * 6, ARCH_DMA_MINALIGN);
465*4882a593Smuzhiyun flush_dcache_range((unsigned long)desc,
466*4882a593Smuzhiyun (unsigned long)desc + size);
467*4882a593Smuzhiyun
468*4882a593Smuzhiyun ret = run_descriptor_jr_idx(desc, sec_idx);
469*4882a593Smuzhiyun
470*4882a593Smuzhiyun if (ret)
471*4882a593Smuzhiyun printf("RNG: Instantiation failed with error %x\n", ret);
472*4882a593Smuzhiyun
473*4882a593Smuzhiyun rdsta_val = sec_in32(&rng->rdsta);
474*4882a593Smuzhiyun if (op.status || !(rdsta_val & RNG_STATE0_HANDLE_INSTANTIATED))
475*4882a593Smuzhiyun return -1;
476*4882a593Smuzhiyun
477*4882a593Smuzhiyun return ret;
478*4882a593Smuzhiyun }
479*4882a593Smuzhiyun
get_rng_vid(uint8_t sec_idx)480*4882a593Smuzhiyun static u8 get_rng_vid(uint8_t sec_idx)
481*4882a593Smuzhiyun {
482*4882a593Smuzhiyun ccsr_sec_t *sec = (void *)SEC_ADDR(sec_idx);
483*4882a593Smuzhiyun u32 cha_vid = sec_in32(&sec->chavid_ls);
484*4882a593Smuzhiyun
485*4882a593Smuzhiyun return (cha_vid & SEC_CHAVID_RNG_LS_MASK) >> SEC_CHAVID_LS_RNG_SHIFT;
486*4882a593Smuzhiyun }
487*4882a593Smuzhiyun
488*4882a593Smuzhiyun /*
489*4882a593Smuzhiyun * By default, the TRNG runs for 200 clocks per sample;
490*4882a593Smuzhiyun * 1200 clocks per sample generates better entropy.
491*4882a593Smuzhiyun */
kick_trng(int ent_delay,uint8_t sec_idx)492*4882a593Smuzhiyun static void kick_trng(int ent_delay, uint8_t sec_idx)
493*4882a593Smuzhiyun {
494*4882a593Smuzhiyun ccsr_sec_t __iomem *sec = (ccsr_sec_t __iomem *)SEC_ADDR(sec_idx);
495*4882a593Smuzhiyun struct rng4tst __iomem *rng =
496*4882a593Smuzhiyun (struct rng4tst __iomem *)&sec->rng;
497*4882a593Smuzhiyun u32 val;
498*4882a593Smuzhiyun
499*4882a593Smuzhiyun /* put RNG4 into program mode */
500*4882a593Smuzhiyun sec_setbits32(&rng->rtmctl, RTMCTL_PRGM);
501*4882a593Smuzhiyun /* rtsdctl bits 0-15 contain "Entropy Delay, which defines the
502*4882a593Smuzhiyun * length (in system clocks) of each Entropy sample taken
503*4882a593Smuzhiyun * */
504*4882a593Smuzhiyun val = sec_in32(&rng->rtsdctl);
505*4882a593Smuzhiyun val = (val & ~RTSDCTL_ENT_DLY_MASK) |
506*4882a593Smuzhiyun (ent_delay << RTSDCTL_ENT_DLY_SHIFT);
507*4882a593Smuzhiyun sec_out32(&rng->rtsdctl, val);
508*4882a593Smuzhiyun /* min. freq. count, equal to 1/4 of the entropy sample length */
509*4882a593Smuzhiyun sec_out32(&rng->rtfreqmin, ent_delay >> 2);
510*4882a593Smuzhiyun /* disable maximum frequency count */
511*4882a593Smuzhiyun sec_out32(&rng->rtfreqmax, RTFRQMAX_DISABLE);
512*4882a593Smuzhiyun /*
513*4882a593Smuzhiyun * select raw sampling in both entropy shifter
514*4882a593Smuzhiyun * and statistical checker
515*4882a593Smuzhiyun */
516*4882a593Smuzhiyun sec_setbits32(&rng->rtmctl, RTMCTL_SAMP_MODE_RAW_ES_SC);
517*4882a593Smuzhiyun /* put RNG4 into run mode */
518*4882a593Smuzhiyun sec_clrbits32(&rng->rtmctl, RTMCTL_PRGM);
519*4882a593Smuzhiyun }
520*4882a593Smuzhiyun
rng_init(uint8_t sec_idx)521*4882a593Smuzhiyun static int rng_init(uint8_t sec_idx)
522*4882a593Smuzhiyun {
523*4882a593Smuzhiyun int ret, ent_delay = RTSDCTL_ENT_DLY_MIN;
524*4882a593Smuzhiyun ccsr_sec_t __iomem *sec = (ccsr_sec_t __iomem *)SEC_ADDR(sec_idx);
525*4882a593Smuzhiyun struct rng4tst __iomem *rng =
526*4882a593Smuzhiyun (struct rng4tst __iomem *)&sec->rng;
527*4882a593Smuzhiyun
528*4882a593Smuzhiyun u32 rdsta = sec_in32(&rng->rdsta);
529*4882a593Smuzhiyun
530*4882a593Smuzhiyun /* Check if RNG state 0 handler is already instantiated */
531*4882a593Smuzhiyun if (rdsta & RNG_STATE0_HANDLE_INSTANTIATED)
532*4882a593Smuzhiyun return 0;
533*4882a593Smuzhiyun
534*4882a593Smuzhiyun do {
535*4882a593Smuzhiyun /*
536*4882a593Smuzhiyun * If either of the SH's were instantiated by somebody else
537*4882a593Smuzhiyun * then it is assumed that the entropy
538*4882a593Smuzhiyun * parameters are properly set and thus the function
539*4882a593Smuzhiyun * setting these (kick_trng(...)) is skipped.
540*4882a593Smuzhiyun * Also, if a handle was instantiated, do not change
541*4882a593Smuzhiyun * the TRNG parameters.
542*4882a593Smuzhiyun */
543*4882a593Smuzhiyun kick_trng(ent_delay, sec_idx);
544*4882a593Smuzhiyun ent_delay += 400;
545*4882a593Smuzhiyun /*
546*4882a593Smuzhiyun * if instantiate_rng(...) fails, the loop will rerun
547*4882a593Smuzhiyun * and the kick_trng(...) function will modfiy the
548*4882a593Smuzhiyun * upper and lower limits of the entropy sampling
549*4882a593Smuzhiyun * interval, leading to a sucessful initialization of
550*4882a593Smuzhiyun * the RNG.
551*4882a593Smuzhiyun */
552*4882a593Smuzhiyun ret = instantiate_rng(sec_idx);
553*4882a593Smuzhiyun } while ((ret == -1) && (ent_delay < RTSDCTL_ENT_DLY_MAX));
554*4882a593Smuzhiyun if (ret) {
555*4882a593Smuzhiyun printf("RNG: Failed to instantiate RNG\n");
556*4882a593Smuzhiyun return ret;
557*4882a593Smuzhiyun }
558*4882a593Smuzhiyun
559*4882a593Smuzhiyun /* Enable RDB bit so that RNG works faster */
560*4882a593Smuzhiyun sec_setbits32(&sec->scfgr, SEC_SCFGR_RDBENABLE);
561*4882a593Smuzhiyun
562*4882a593Smuzhiyun return ret;
563*4882a593Smuzhiyun }
564*4882a593Smuzhiyun #endif
sec_init_idx(uint8_t sec_idx)565*4882a593Smuzhiyun int sec_init_idx(uint8_t sec_idx)
566*4882a593Smuzhiyun {
567*4882a593Smuzhiyun ccsr_sec_t *sec = (void *)SEC_ADDR(sec_idx);
568*4882a593Smuzhiyun uint32_t mcr = sec_in32(&sec->mcfgr);
569*4882a593Smuzhiyun int ret = 0;
570*4882a593Smuzhiyun
571*4882a593Smuzhiyun #ifdef CONFIG_FSL_CORENET
572*4882a593Smuzhiyun uint32_t liodnr;
573*4882a593Smuzhiyun uint32_t liodn_ns;
574*4882a593Smuzhiyun uint32_t liodn_s;
575*4882a593Smuzhiyun #endif
576*4882a593Smuzhiyun
577*4882a593Smuzhiyun if (!(sec_idx < CONFIG_SYS_FSL_MAX_NUM_OF_SEC)) {
578*4882a593Smuzhiyun printf("SEC initialization failed\n");
579*4882a593Smuzhiyun return -1;
580*4882a593Smuzhiyun }
581*4882a593Smuzhiyun
582*4882a593Smuzhiyun /*
583*4882a593Smuzhiyun * Modifying CAAM Read/Write Attributes
584*4882a593Smuzhiyun * For LS2080A
585*4882a593Smuzhiyun * For AXI Write - Cacheable, Write Back, Write allocate
586*4882a593Smuzhiyun * For AXI Read - Cacheable, Read allocate
587*4882a593Smuzhiyun * Only For LS2080a, to solve CAAM coherency issues
588*4882a593Smuzhiyun */
589*4882a593Smuzhiyun #ifdef CONFIG_ARCH_LS2080A
590*4882a593Smuzhiyun mcr = (mcr & ~MCFGR_AWCACHE_MASK) | (0xb << MCFGR_AWCACHE_SHIFT);
591*4882a593Smuzhiyun mcr = (mcr & ~MCFGR_ARCACHE_MASK) | (0x6 << MCFGR_ARCACHE_SHIFT);
592*4882a593Smuzhiyun #else
593*4882a593Smuzhiyun mcr = (mcr & ~MCFGR_AWCACHE_MASK) | (0x2 << MCFGR_AWCACHE_SHIFT);
594*4882a593Smuzhiyun #endif
595*4882a593Smuzhiyun
596*4882a593Smuzhiyun #ifdef CONFIG_PHYS_64BIT
597*4882a593Smuzhiyun mcr |= (1 << MCFGR_PS_SHIFT);
598*4882a593Smuzhiyun #endif
599*4882a593Smuzhiyun sec_out32(&sec->mcfgr, mcr);
600*4882a593Smuzhiyun
601*4882a593Smuzhiyun #ifdef CONFIG_FSL_CORENET
602*4882a593Smuzhiyun #ifdef CONFIG_SPL_BUILD
603*4882a593Smuzhiyun /*
604*4882a593Smuzhiyun * For SPL Build, Set the Liodns in SEC JR0 for
605*4882a593Smuzhiyun * creating PAMU entries corresponding to these.
606*4882a593Smuzhiyun * For normal build, these are set in set_liodns().
607*4882a593Smuzhiyun */
608*4882a593Smuzhiyun liodn_ns = CONFIG_SPL_JR0_LIODN_NS & JRNSLIODN_MASK;
609*4882a593Smuzhiyun liodn_s = CONFIG_SPL_JR0_LIODN_S & JRSLIODN_MASK;
610*4882a593Smuzhiyun
611*4882a593Smuzhiyun liodnr = sec_in32(&sec->jrliodnr[0].ls) &
612*4882a593Smuzhiyun ~(JRNSLIODN_MASK | JRSLIODN_MASK);
613*4882a593Smuzhiyun liodnr = liodnr |
614*4882a593Smuzhiyun (liodn_ns << JRNSLIODN_SHIFT) |
615*4882a593Smuzhiyun (liodn_s << JRSLIODN_SHIFT);
616*4882a593Smuzhiyun sec_out32(&sec->jrliodnr[0].ls, liodnr);
617*4882a593Smuzhiyun #else
618*4882a593Smuzhiyun liodnr = sec_in32(&sec->jrliodnr[0].ls);
619*4882a593Smuzhiyun liodn_ns = (liodnr & JRNSLIODN_MASK) >> JRNSLIODN_SHIFT;
620*4882a593Smuzhiyun liodn_s = (liodnr & JRSLIODN_MASK) >> JRSLIODN_SHIFT;
621*4882a593Smuzhiyun #endif
622*4882a593Smuzhiyun #endif
623*4882a593Smuzhiyun
624*4882a593Smuzhiyun ret = jr_init(sec_idx);
625*4882a593Smuzhiyun if (ret < 0) {
626*4882a593Smuzhiyun printf("SEC initialization failed\n");
627*4882a593Smuzhiyun return -1;
628*4882a593Smuzhiyun }
629*4882a593Smuzhiyun
630*4882a593Smuzhiyun #ifdef CONFIG_FSL_CORENET
631*4882a593Smuzhiyun ret = sec_config_pamu_table(liodn_ns, liodn_s);
632*4882a593Smuzhiyun if (ret < 0)
633*4882a593Smuzhiyun return -1;
634*4882a593Smuzhiyun
635*4882a593Smuzhiyun pamu_enable();
636*4882a593Smuzhiyun #endif
637*4882a593Smuzhiyun #ifndef CONFIG_SPL_BUILD
638*4882a593Smuzhiyun if (get_rng_vid(sec_idx) >= 4) {
639*4882a593Smuzhiyun if (rng_init(sec_idx) < 0) {
640*4882a593Smuzhiyun printf("SEC%u: RNG instantiation failed\n", sec_idx);
641*4882a593Smuzhiyun return -1;
642*4882a593Smuzhiyun }
643*4882a593Smuzhiyun printf("SEC%u: RNG instantiated\n", sec_idx);
644*4882a593Smuzhiyun }
645*4882a593Smuzhiyun #endif
646*4882a593Smuzhiyun return ret;
647*4882a593Smuzhiyun }
648*4882a593Smuzhiyun
sec_init(void)649*4882a593Smuzhiyun int sec_init(void)
650*4882a593Smuzhiyun {
651*4882a593Smuzhiyun return sec_init_idx(0);
652*4882a593Smuzhiyun }
653