1 // SPDX-License-Identifier: GPL-2.0+
3 * Copyright 2008-2014 Freescale Semiconductor, Inc.
6 * Based on CAAM driver in drivers/crypto/caam in Linux
11 #include <linux/kernel.h>
17 #include "desc_constr.h"
19 #include <asm/cache.h>
20 #ifdef CONFIG_FSL_CORENET
21 #include <asm/cache.h>
22 #include <asm/fsl_pamu.h>
25 #include <linux/delay.h>
27 #define CIRC_CNT(head, tail, size) (((head) - (tail)) & (size - 1))
28 #define CIRC_SPACE(head, tail, size) CIRC_CNT((tail), (head) + 1, (size))
30 uint32_t sec_offset[CONFIG_SYS_FSL_MAX_NUM_OF_SEC] = {
32 #if defined(CONFIG_ARCH_C29X)
33 CONFIG_SYS_FSL_SEC_IDX_OFFSET,
34 2 * CONFIG_SYS_FSL_SEC_IDX_OFFSET
38 #define SEC_ADDR(idx) \
39 (ulong)((CONFIG_SYS_FSL_SEC_ADDR + sec_offset[idx]))
41 #define SEC_JR0_ADDR(idx) \
42 (ulong)(SEC_ADDR(idx) + \
43 (CONFIG_SYS_FSL_JR0_OFFSET - CONFIG_SYS_FSL_SEC_OFFSET))
45 struct jobring jr0[CONFIG_SYS_FSL_MAX_NUM_OF_SEC];
47 static inline void start_jr0(uint8_t sec_idx)
49 ccsr_sec_t *sec = (void *)SEC_ADDR(sec_idx);
50 u32 ctpr_ms = sec_in32(&sec->ctpr_ms);
51 u32 scfgr = sec_in32(&sec->scfgr);
53 if (ctpr_ms & SEC_CTPR_MS_VIRT_EN_INCL) {
54 /* VIRT_EN_INCL = 1 & VIRT_EN_POR = 1 or
55 * VIRT_EN_INCL = 1 & VIRT_EN_POR = 0 & SEC_SCFGR_VIRT_EN = 1
57 if ((ctpr_ms & SEC_CTPR_MS_VIRT_EN_POR) ||
58 (scfgr & SEC_SCFGR_VIRT_EN))
59 sec_out32(&sec->jrstartr, CONFIG_JRSTARTR_JR0);
61 /* VIRT_EN_INCL = 0 && VIRT_EN_POR_VALUE = 1 */
62 if (ctpr_ms & SEC_CTPR_MS_VIRT_EN_POR)
63 sec_out32(&sec->jrstartr, CONFIG_JRSTARTR_JR0);
67 static inline void jr_reset_liodn(uint8_t sec_idx)
69 ccsr_sec_t *sec = (void *)SEC_ADDR(sec_idx);
70 sec_out32(&sec->jrliodnr[0].ls, 0);
73 static inline void jr_disable_irq(uint8_t sec_idx)
75 struct jr_regs *regs = (struct jr_regs *)SEC_JR0_ADDR(sec_idx);
76 uint32_t jrcfg = sec_in32(®s->jrcfg1);
78 jrcfg = jrcfg | JR_INTMASK;
80 sec_out32(®s->jrcfg1, jrcfg);
83 static void jr_initregs(uint8_t sec_idx)
85 struct jr_regs *regs = (struct jr_regs *)SEC_JR0_ADDR(sec_idx);
86 struct jobring *jr = &jr0[sec_idx];
87 phys_addr_t ip_base = virt_to_phys((void *)jr->input_ring);
88 phys_addr_t op_base = virt_to_phys((void *)jr->output_ring);
90 #ifdef CONFIG_PHYS_64BIT
91 sec_out32(®s->irba_h, ip_base >> 32);
93 sec_out32(®s->irba_h, 0x0);
95 sec_out32(®s->irba_l, (uint32_t)ip_base);
96 #ifdef CONFIG_PHYS_64BIT
97 sec_out32(®s->orba_h, op_base >> 32);
99 sec_out32(®s->orba_h, 0x0);
101 sec_out32(®s->orba_l, (uint32_t)op_base);
102 sec_out32(®s->ors, JR_SIZE);
103 sec_out32(®s->irs, JR_SIZE);
106 jr_disable_irq(sec_idx);
109 static int jr_init(uint8_t sec_idx)
111 struct jobring *jr = &jr0[sec_idx];
113 memset(jr, 0, sizeof(struct jobring));
115 jr->jq_id = DEFAULT_JR_ID;
116 jr->irq = DEFAULT_IRQ;
118 #ifdef CONFIG_FSL_CORENET
119 jr->liodn = DEFAULT_JR_LIODN;
122 jr->input_ring = (dma_addr_t *)memalign(ARCH_DMA_MINALIGN,
123 JR_SIZE * sizeof(dma_addr_t));
127 jr->op_size = roundup(JR_SIZE * sizeof(struct op_ring),
130 (struct op_ring *)memalign(ARCH_DMA_MINALIGN, jr->op_size);
131 if (!jr->output_ring)
134 memset(jr->input_ring, 0, JR_SIZE * sizeof(dma_addr_t));
135 memset(jr->output_ring, 0, jr->op_size);
139 jr_initregs(sec_idx);
144 static int jr_sw_cleanup(uint8_t sec_idx)
146 struct jobring *jr = &jr0[sec_idx];
152 memset(jr->info, 0, sizeof(jr->info));
153 memset(jr->input_ring, 0, jr->size * sizeof(dma_addr_t));
154 memset(jr->output_ring, 0, jr->size * sizeof(struct op_ring));
159 static int jr_hw_reset(uint8_t sec_idx)
161 struct jr_regs *regs = (struct jr_regs *)SEC_JR0_ADDR(sec_idx);
162 uint32_t timeout = 100000;
163 uint32_t jrint, jrcr;
165 sec_out32(®s->jrcr, JRCR_RESET);
167 jrint = sec_in32(®s->jrint);
168 } while (((jrint & JRINT_ERR_HALT_MASK) ==
169 JRINT_ERR_HALT_INPROGRESS) && --timeout);
171 jrint = sec_in32(®s->jrint);
172 if (((jrint & JRINT_ERR_HALT_MASK) !=
173 JRINT_ERR_HALT_INPROGRESS) && timeout == 0)
177 sec_out32(®s->jrcr, JRCR_RESET);
179 jrcr = sec_in32(®s->jrcr);
180 } while ((jrcr & JRCR_RESET) && --timeout);
188 /* -1 --- error, can't enqueue -- no space available */
189 static int jr_enqueue(uint32_t *desc_addr,
190 void (*callback)(uint32_t status, void *arg),
191 void *arg, uint8_t sec_idx)
193 struct jr_regs *regs = (struct jr_regs *)SEC_JR0_ADDR(sec_idx);
194 struct jobring *jr = &jr0[sec_idx];
197 int length = desc_len(desc_addr);
199 #ifdef CONFIG_PHYS_64BIT
200 uint32_t *addr_hi, *addr_lo;
203 /* The descriptor must be submitted to SEC block as per endianness
205 * So, if the endianness of Core and SEC block is different, each word
206 * of the descriptor will be byte-swapped.
208 for (i = 0; i < length; i++) {
209 desc_word = desc_addr[i];
210 sec_out32((uint32_t *)&desc_addr[i], desc_word);
213 phys_addr_t desc_phys_addr = virt_to_phys(desc_addr);
215 jr->info[head].desc_phys_addr = desc_phys_addr;
216 jr->info[head].callback = (void *)callback;
217 jr->info[head].arg = arg;
218 jr->info[head].op_done = 0;
220 unsigned long start = (unsigned long)&jr->info[head] &
221 ~(ARCH_DMA_MINALIGN - 1);
222 unsigned long end = ALIGN((unsigned long)&jr->info[head] +
223 sizeof(struct jr_info), ARCH_DMA_MINALIGN);
224 flush_dcache_range(start, end);
226 #ifdef CONFIG_PHYS_64BIT
227 /* Write the 64 bit Descriptor address on Input Ring.
228 * The 32 bit hign and low part of the address will
229 * depend on endianness of SEC block.
231 #ifdef CONFIG_SYS_FSL_SEC_LE
232 addr_lo = (uint32_t *)(&jr->input_ring[head]);
233 addr_hi = (uint32_t *)(&jr->input_ring[head]) + 1;
234 #elif defined(CONFIG_SYS_FSL_SEC_BE)
235 addr_hi = (uint32_t *)(&jr->input_ring[head]);
236 addr_lo = (uint32_t *)(&jr->input_ring[head]) + 1;
237 #endif /* ifdef CONFIG_SYS_FSL_SEC_LE */
239 sec_out32(addr_hi, (uint32_t)(desc_phys_addr >> 32));
240 sec_out32(addr_lo, (uint32_t)(desc_phys_addr));
243 /* Write the 32 bit Descriptor address on Input Ring. */
244 sec_out32(&jr->input_ring[head], desc_phys_addr);
245 #endif /* ifdef CONFIG_PHYS_64BIT */
247 start = (unsigned long)&jr->input_ring[head] & ~(ARCH_DMA_MINALIGN - 1);
248 end = ALIGN((unsigned long)&jr->input_ring[head] +
249 sizeof(dma_addr_t), ARCH_DMA_MINALIGN);
250 flush_dcache_range(start, end);
252 jr->head = (head + 1) & (jr->size - 1);
254 /* Invalidate output ring */
255 start = (unsigned long)jr->output_ring &
256 ~(ARCH_DMA_MINALIGN - 1);
257 end = ALIGN((unsigned long)jr->output_ring + jr->op_size,
259 invalidate_dcache_range(start, end);
261 sec_out32(®s->irja, 1);
266 static int jr_dequeue(int sec_idx)
268 struct jr_regs *regs = (struct jr_regs *)SEC_JR0_ADDR(sec_idx);
269 struct jobring *jr = &jr0[sec_idx];
273 void (*callback)(uint32_t status, void *arg);
275 #ifdef CONFIG_PHYS_64BIT
276 uint32_t *addr_hi, *addr_lo;
281 while (sec_in32(®s->orsf) && CIRC_CNT(jr->head, jr->tail,
287 #ifdef CONFIG_PHYS_64BIT
288 /* Read the 64 bit Descriptor address from Output Ring.
289 * The 32 bit hign and low part of the address will
290 * depend on endianness of SEC block.
292 #ifdef CONFIG_SYS_FSL_SEC_LE
293 addr_lo = (uint32_t *)(&jr->output_ring[jr->tail].desc);
294 addr_hi = (uint32_t *)(&jr->output_ring[jr->tail].desc) + 1;
295 #elif defined(CONFIG_SYS_FSL_SEC_BE)
296 addr_hi = (uint32_t *)(&jr->output_ring[jr->tail].desc);
297 addr_lo = (uint32_t *)(&jr->output_ring[jr->tail].desc) + 1;
298 #endif /* ifdef CONFIG_SYS_FSL_SEC_LE */
300 op_desc = ((u64)sec_in32(addr_hi) << 32) |
301 ((u64)sec_in32(addr_lo));
304 /* Read the 32 bit Descriptor address from Output Ring. */
305 addr = (uint32_t *)&jr->output_ring[jr->tail].desc;
306 op_desc = sec_in32(addr);
307 #endif /* ifdef CONFIG_PHYS_64BIT */
309 uint32_t status = sec_in32(&jr->output_ring[jr->tail].status);
311 for (i = 0; CIRC_CNT(head, tail + i, jr->size) >= 1; i++) {
312 idx = (tail + i) & (jr->size - 1);
313 if (op_desc == jr->info[idx].desc_phys_addr) {
319 /* Error condition if match not found */
323 jr->info[idx].op_done = 1;
324 callback = (void *)jr->info[idx].callback;
325 arg = jr->info[idx].arg;
327 /* When the job on tail idx gets done, increment
328 * tail till the point where job completed out of oredr has
329 * been taken into account
333 tail = (tail + 1) & (jr->size - 1);
334 } while (jr->info[tail].op_done);
337 jr->read_idx = (jr->read_idx + 1) & (jr->size - 1);
339 sec_out32(®s->orjr, 1);
340 jr->info[idx].op_done = 0;
342 callback(status, arg);
348 static void desc_done(uint32_t status, void *arg)
350 struct result *x = arg;
352 #ifndef CONFIG_SPL_BUILD
353 caam_jr_strstatus(status);
358 static inline int run_descriptor_jr_idx(uint32_t *desc, uint8_t sec_idx)
360 unsigned long long timeval = 0;
361 unsigned long long timeout = CONFIG_USEC_DEQ_TIMEOUT;
365 memset(&op, 0, sizeof(op));
367 ret = jr_enqueue(desc, desc_done, &op, sec_idx);
369 debug("Error in SEC enq\n");
374 while (op.done != 1) {
378 ret = jr_dequeue(sec_idx);
380 debug("Error in SEC deq\n");
385 if (timeval > timeout) {
386 debug("SEC Dequeue timed out\n");
393 debug("Error %x\n", op.status);
400 int run_descriptor_jr(uint32_t *desc)
402 return run_descriptor_jr_idx(desc, 0);
405 static inline int jr_reset_sec(uint8_t sec_idx)
407 if (jr_hw_reset(sec_idx) < 0)
410 /* Clean up the jobring structure maintained by software */
411 jr_sw_cleanup(sec_idx);
418 return jr_reset_sec(0);
421 static inline int sec_reset_idx(uint8_t sec_idx)
423 ccsr_sec_t *sec = (void *)SEC_ADDR(sec_idx);
424 uint32_t mcfgr = sec_in32(&sec->mcfgr);
425 uint32_t timeout = 100000;
427 mcfgr |= MCFGR_SWRST;
428 sec_out32(&sec->mcfgr, mcfgr);
430 mcfgr |= MCFGR_DMA_RST;
431 sec_out32(&sec->mcfgr, mcfgr);
433 mcfgr = sec_in32(&sec->mcfgr);
434 } while ((mcfgr & MCFGR_DMA_RST) == MCFGR_DMA_RST && --timeout);
441 mcfgr = sec_in32(&sec->mcfgr);
442 } while ((mcfgr & MCFGR_SWRST) == MCFGR_SWRST && --timeout);
451 return sec_reset_idx(0);
453 #ifndef CONFIG_SPL_BUILD
454 static int deinstantiate_rng(u8 sec_idx, int state_handle_mask)
458 int desc_size = ALIGN(sizeof(u32) * 2, ARCH_DMA_MINALIGN);
460 desc = memalign(ARCH_DMA_MINALIGN, desc_size);
462 debug("cannot allocate RNG init descriptor memory\n");
466 for (sh_idx = 0; sh_idx < RNG4_MAX_HANDLES; sh_idx++) {
468 * If the corresponding bit is set, then it means the state
469 * handle was initialized by us, and thus it needs to be
470 * deinitialized as well
473 if (state_handle_mask & RDSTA_IF(sh_idx)) {
475 * Create the descriptor for deinstantating this state
478 inline_cnstr_jobdesc_rng_deinstantiation(desc, sh_idx);
479 flush_dcache_range((unsigned long)desc,
480 (unsigned long)desc + desc_size);
482 ret = run_descriptor_jr_idx(desc, sec_idx);
484 printf("SEC%u: RNG4 SH%d deinstantiation failed with error 0x%x\n",
485 sec_idx, sh_idx, ret);
490 printf("SEC%u: Deinstantiated RNG4 SH%d\n",
499 static int instantiate_rng(u8 sec_idx, int gen_sk)
503 int ret = 0, sh_idx, size;
504 ccsr_sec_t __iomem *sec = (ccsr_sec_t __iomem *)SEC_ADDR(sec_idx);
505 struct rng4tst __iomem *rng =
506 (struct rng4tst __iomem *)&sec->rng;
508 desc = memalign(ARCH_DMA_MINALIGN, sizeof(uint32_t) * 6);
510 printf("cannot allocate RNG init descriptor memory\n");
514 for (sh_idx = 0; sh_idx < RNG4_MAX_HANDLES; sh_idx++) {
516 * If the corresponding bit is set, this state handle
517 * was initialized by somebody else, so it's left alone.
519 rdsta_val = sec_in32(&rng->rdsta);
520 if (rdsta_val & (RDSTA_IF(sh_idx))) {
521 if (rdsta_val & RDSTA_PR(sh_idx))
524 printf("SEC%u: RNG4 SH%d was instantiated w/o prediction resistance. Tearing it down\n",
527 ret = deinstantiate_rng(sec_idx, RDSTA_IF(sh_idx));
532 inline_cnstr_jobdesc_rng_instantiation(desc, sh_idx, gen_sk);
533 size = roundup(sizeof(uint32_t) * 6, ARCH_DMA_MINALIGN);
534 flush_dcache_range((unsigned long)desc,
535 (unsigned long)desc + size);
537 ret = run_descriptor_jr_idx(desc, sec_idx);
540 printf("SEC%u: RNG4 SH%d instantiation failed with error 0x%x\n",
541 sec_idx, sh_idx, ret);
543 rdsta_val = sec_in32(&rng->rdsta);
544 if (!(rdsta_val & RDSTA_IF(sh_idx))) {
549 memset(desc, 0, sizeof(uint32_t) * 6);
557 static u8 get_rng_vid(uint8_t sec_idx)
559 ccsr_sec_t *sec = (void *)SEC_ADDR(sec_idx);
562 if (caam_get_era() < 10) {
563 vid = (sec_in32(&sec->chavid_ls) & SEC_CHAVID_RNG_LS_MASK)
564 >> SEC_CHAVID_LS_RNG_SHIFT;
566 vid = (sec_in32(&sec->vreg.rng) & CHA_VER_VID_MASK)
567 >> CHA_VER_VID_SHIFT;
574 * By default, the TRNG runs for 200 clocks per sample;
575 * 1200 clocks per sample generates better entropy.
577 static void kick_trng(int ent_delay, uint8_t sec_idx)
579 ccsr_sec_t __iomem *sec = (ccsr_sec_t __iomem *)SEC_ADDR(sec_idx);
580 struct rng4tst __iomem *rng =
581 (struct rng4tst __iomem *)&sec->rng;
584 /* put RNG4 into program mode */
585 sec_setbits32(&rng->rtmctl, RTMCTL_PRGM);
586 /* rtsdctl bits 0-15 contain "Entropy Delay, which defines the
587 * length (in system clocks) of each Entropy sample taken
589 val = sec_in32(&rng->rtsdctl);
590 val = (val & ~RTSDCTL_ENT_DLY_MASK) |
591 (ent_delay << RTSDCTL_ENT_DLY_SHIFT);
592 sec_out32(&rng->rtsdctl, val);
593 /* min. freq. count, equal to 1/4 of the entropy sample length */
594 sec_out32(&rng->rtfreqmin, ent_delay >> 2);
595 /* disable maximum frequency count */
596 sec_out32(&rng->rtfreqmax, RTFRQMAX_DISABLE);
598 * select raw sampling in both entropy shifter
599 * and statistical checker
601 sec_setbits32(&rng->rtmctl, RTMCTL_SAMP_MODE_RAW_ES_SC);
602 /* put RNG4 into run mode */
603 sec_clrbits32(&rng->rtmctl, RTMCTL_PRGM);
606 static int rng_init(uint8_t sec_idx)
608 int ret, gen_sk, ent_delay = RTSDCTL_ENT_DLY_MIN;
609 ccsr_sec_t __iomem *sec = (ccsr_sec_t __iomem *)SEC_ADDR(sec_idx);
610 struct rng4tst __iomem *rng =
611 (struct rng4tst __iomem *)&sec->rng;
614 gen_sk = !(sec_in32(&rng->rdsta) & RDSTA_SKVN);
616 inst_handles = sec_in32(&rng->rdsta) & RDSTA_MASK;
619 * If either of the SH's were instantiated by somebody else
620 * then it is assumed that the entropy
621 * parameters are properly set and thus the function
622 * setting these (kick_trng(...)) is skipped.
623 * Also, if a handle was instantiated, do not change
624 * the TRNG parameters.
627 kick_trng(ent_delay, sec_idx);
631 * if instantiate_rng(...) fails, the loop will rerun
632 * and the kick_trng(...) function will modfiy the
633 * upper and lower limits of the entropy sampling
634 * interval, leading to a sucessful initialization of
637 ret = instantiate_rng(sec_idx, gen_sk);
638 } while ((ret == -1) && (ent_delay < RTSDCTL_ENT_DLY_MAX));
640 printf("SEC%u: Failed to instantiate RNG\n", sec_idx);
644 /* Enable RDB bit so that RNG works faster */
645 sec_setbits32(&sec->scfgr, SEC_SCFGR_RDBENABLE);
650 int sec_init_idx(uint8_t sec_idx)
652 ccsr_sec_t *sec = (void *)SEC_ADDR(sec_idx);
653 uint32_t mcr = sec_in32(&sec->mcfgr);
656 #ifdef CONFIG_FSL_CORENET
662 if (!(sec_idx < CONFIG_SYS_FSL_MAX_NUM_OF_SEC)) {
663 printf("SEC%u: initialization failed\n", sec_idx);
668 * Modifying CAAM Read/Write Attributes
670 * For AXI Write - Cacheable, Write Back, Write allocate
671 * For AXI Read - Cacheable, Read allocate
672 * Only For LS2080a, to solve CAAM coherency issues
674 #ifdef CONFIG_ARCH_LS2080A
675 mcr = (mcr & ~MCFGR_AWCACHE_MASK) | (0xb << MCFGR_AWCACHE_SHIFT);
676 mcr = (mcr & ~MCFGR_ARCACHE_MASK) | (0x6 << MCFGR_ARCACHE_SHIFT);
678 mcr = (mcr & ~MCFGR_AWCACHE_MASK) | (0x2 << MCFGR_AWCACHE_SHIFT);
681 #ifdef CONFIG_PHYS_64BIT
682 mcr |= (1 << MCFGR_PS_SHIFT);
684 sec_out32(&sec->mcfgr, mcr);
686 #ifdef CONFIG_FSL_CORENET
687 #ifdef CONFIG_SPL_BUILD
689 * For SPL Build, Set the Liodns in SEC JR0 for
690 * creating PAMU entries corresponding to these.
691 * For normal build, these are set in set_liodns().
693 liodn_ns = CONFIG_SPL_JR0_LIODN_NS & JRNSLIODN_MASK;
694 liodn_s = CONFIG_SPL_JR0_LIODN_S & JRSLIODN_MASK;
696 liodnr = sec_in32(&sec->jrliodnr[0].ls) &
697 ~(JRNSLIODN_MASK | JRSLIODN_MASK);
699 (liodn_ns << JRNSLIODN_SHIFT) |
700 (liodn_s << JRSLIODN_SHIFT);
701 sec_out32(&sec->jrliodnr[0].ls, liodnr);
703 liodnr = sec_in32(&sec->jrliodnr[0].ls);
704 liodn_ns = (liodnr & JRNSLIODN_MASK) >> JRNSLIODN_SHIFT;
705 liodn_s = (liodnr & JRSLIODN_MASK) >> JRSLIODN_SHIFT;
709 ret = jr_init(sec_idx);
711 printf("SEC%u: initialization failed\n", sec_idx);
715 #ifdef CONFIG_FSL_CORENET
716 ret = sec_config_pamu_table(liodn_ns, liodn_s);
722 #ifndef CONFIG_SPL_BUILD
723 if (get_rng_vid(sec_idx) >= 4) {
724 if (rng_init(sec_idx) < 0) {
725 printf("SEC%u: RNG instantiation failed\n", sec_idx);
729 if (IS_ENABLED(CONFIG_DM_RNG)) {
730 ret = device_bind_driver(NULL, "caam-rng", "caam-rng",
733 printf("Couldn't bind rng driver (%d)\n", ret);
736 printf("SEC%u: RNG instantiated\n", sec_idx);
744 return sec_init_idx(0);