1 // SPDX-License-Identifier: GPL-2.0-only
3 // Copyright (C) 2020 NVIDIA CORPORATION.
6 #include <linux/completion.h>
7 #include <linux/delay.h>
8 #include <linux/dmaengine.h>
9 #include <linux/dma-mapping.h>
10 #include <linux/dmapool.h>
11 #include <linux/err.h>
12 #include <linux/interrupt.h>
14 #include <linux/iopoll.h>
15 #include <linux/kernel.h>
16 #include <linux/kthread.h>
17 #include <linux/module.h>
18 #include <linux/platform_device.h>
19 #include <linux/pm_runtime.h>
21 #include <linux/of_device.h>
22 #include <linux/reset.h>
23 #include <linux/spi/spi.h>
24 #include <linux/acpi.h>
25 #include <linux/property.h>
27 #define QSPI_COMMAND1 0x000
28 #define QSPI_BIT_LENGTH(x) (((x) & 0x1f) << 0)
29 #define QSPI_PACKED BIT(5)
30 #define QSPI_INTERFACE_WIDTH_MASK (0x03 << 7)
31 #define QSPI_INTERFACE_WIDTH(x) (((x) & 0x03) << 7)
32 #define QSPI_INTERFACE_WIDTH_SINGLE QSPI_INTERFACE_WIDTH(0)
33 #define QSPI_INTERFACE_WIDTH_DUAL QSPI_INTERFACE_WIDTH(1)
34 #define QSPI_INTERFACE_WIDTH_QUAD QSPI_INTERFACE_WIDTH(2)
35 #define QSPI_SDR_DDR_SEL BIT(9)
36 #define QSPI_TX_EN BIT(11)
37 #define QSPI_RX_EN BIT(12)
38 #define QSPI_CS_SW_VAL BIT(20)
39 #define QSPI_CS_SW_HW BIT(21)
41 #define QSPI_CS_POL_INACTIVE(n) (1 << (22 + (n)))
42 #define QSPI_CS_POL_INACTIVE_MASK (0xF << 22)
43 #define QSPI_CS_SEL_0 (0 << 26)
44 #define QSPI_CS_SEL_1 (1 << 26)
45 #define QSPI_CS_SEL_2 (2 << 26)
46 #define QSPI_CS_SEL_3 (3 << 26)
47 #define QSPI_CS_SEL_MASK (3 << 26)
48 #define QSPI_CS_SEL(x) (((x) & 0x3) << 26)
50 #define QSPI_CONTROL_MODE_0 (0 << 28)
51 #define QSPI_CONTROL_MODE_3 (3 << 28)
52 #define QSPI_CONTROL_MODE_MASK (3 << 28)
53 #define QSPI_M_S BIT(30)
54 #define QSPI_PIO BIT(31)
56 #define QSPI_COMMAND2 0x004
57 #define QSPI_TX_TAP_DELAY(x) (((x) & 0x3f) << 10)
58 #define QSPI_RX_TAP_DELAY(x) (((x) & 0xff) << 0)
60 #define QSPI_CS_TIMING1 0x008
61 #define QSPI_SETUP_HOLD(setup, hold) (((setup) << 4) | (hold))
63 #define QSPI_CS_TIMING2 0x00c
64 #define CYCLES_BETWEEN_PACKETS_0(x) (((x) & 0x1f) << 0)
65 #define CS_ACTIVE_BETWEEN_PACKETS_0 BIT(5)
67 #define QSPI_TRANS_STATUS 0x010
68 #define QSPI_BLK_CNT(val) (((val) >> 0) & 0xffff)
69 #define QSPI_RDY BIT(30)
71 #define QSPI_FIFO_STATUS 0x014
72 #define QSPI_RX_FIFO_EMPTY BIT(0)
73 #define QSPI_RX_FIFO_FULL BIT(1)
74 #define QSPI_TX_FIFO_EMPTY BIT(2)
75 #define QSPI_TX_FIFO_FULL BIT(3)
76 #define QSPI_RX_FIFO_UNF BIT(4)
77 #define QSPI_RX_FIFO_OVF BIT(5)
78 #define QSPI_TX_FIFO_UNF BIT(6)
79 #define QSPI_TX_FIFO_OVF BIT(7)
80 #define QSPI_ERR BIT(8)
81 #define QSPI_TX_FIFO_FLUSH BIT(14)
82 #define QSPI_RX_FIFO_FLUSH BIT(15)
83 #define QSPI_TX_FIFO_EMPTY_COUNT(val) (((val) >> 16) & 0x7f)
84 #define QSPI_RX_FIFO_FULL_COUNT(val) (((val) >> 23) & 0x7f)
86 #define QSPI_FIFO_ERROR (QSPI_RX_FIFO_UNF | \
90 #define QSPI_FIFO_EMPTY (QSPI_RX_FIFO_EMPTY | \
93 #define QSPI_TX_DATA 0x018
94 #define QSPI_RX_DATA 0x01c
96 #define QSPI_DMA_CTL 0x020
97 #define QSPI_TX_TRIG(n) (((n) & 0x3) << 15)
98 #define QSPI_TX_TRIG_1 QSPI_TX_TRIG(0)
99 #define QSPI_TX_TRIG_4 QSPI_TX_TRIG(1)
100 #define QSPI_TX_TRIG_8 QSPI_TX_TRIG(2)
101 #define QSPI_TX_TRIG_16 QSPI_TX_TRIG(3)
103 #define QSPI_RX_TRIG(n) (((n) & 0x3) << 19)
104 #define QSPI_RX_TRIG_1 QSPI_RX_TRIG(0)
105 #define QSPI_RX_TRIG_4 QSPI_RX_TRIG(1)
106 #define QSPI_RX_TRIG_8 QSPI_RX_TRIG(2)
107 #define QSPI_RX_TRIG_16 QSPI_RX_TRIG(3)
109 #define QSPI_DMA_EN BIT(31)
111 #define QSPI_DMA_BLK 0x024
112 #define QSPI_DMA_BLK_SET(x) (((x) & 0xffff) << 0)
114 #define QSPI_TX_FIFO 0x108
115 #define QSPI_RX_FIFO 0x188
117 #define QSPI_FIFO_DEPTH 64
119 #define QSPI_INTR_MASK 0x18c
120 #define QSPI_INTR_RX_FIFO_UNF_MASK BIT(25)
121 #define QSPI_INTR_RX_FIFO_OVF_MASK BIT(26)
122 #define QSPI_INTR_TX_FIFO_UNF_MASK BIT(27)
123 #define QSPI_INTR_TX_FIFO_OVF_MASK BIT(28)
124 #define QSPI_INTR_RDY_MASK BIT(29)
125 #define QSPI_INTR_RX_TX_FIFO_ERR (QSPI_INTR_RX_FIFO_UNF_MASK | \
126 QSPI_INTR_RX_FIFO_OVF_MASK | \
127 QSPI_INTR_TX_FIFO_UNF_MASK | \
128 QSPI_INTR_TX_FIFO_OVF_MASK)
130 #define QSPI_MISC_REG 0x194
131 #define QSPI_NUM_DUMMY_CYCLE(x) (((x) & 0xff) << 0)
132 #define QSPI_DUMMY_CYCLES_MAX 0xff
134 #define QSPI_CMB_SEQ_CMD 0x19c
135 #define QSPI_COMMAND_VALUE_SET(X) (((x) & 0xFF) << 0)
137 #define QSPI_CMB_SEQ_CMD_CFG 0x1a0
138 #define QSPI_COMMAND_X1_X2_X4(x) (((x) & 0x3) << 13)
139 #define QSPI_COMMAND_X1_X2_X4_MASK (0x03 << 13)
140 #define QSPI_COMMAND_SDR_DDR BIT(12)
141 #define QSPI_COMMAND_SIZE_SET(x) (((x) & 0xFF) << 0)
143 #define QSPI_GLOBAL_CONFIG 0X1a4
144 #define QSPI_CMB_SEQ_EN BIT(0)
145 #define QSPI_TPM_WAIT_POLL_EN BIT(1)
147 #define QSPI_CMB_SEQ_ADDR 0x1a8
148 #define QSPI_ADDRESS_VALUE_SET(X) (((x) & 0xFFFF) << 0)
150 #define QSPI_CMB_SEQ_ADDR_CFG 0x1ac
151 #define QSPI_ADDRESS_X1_X2_X4(x) (((x) & 0x3) << 13)
152 #define QSPI_ADDRESS_X1_X2_X4_MASK (0x03 << 13)
153 #define QSPI_ADDRESS_SDR_DDR BIT(12)
154 #define QSPI_ADDRESS_SIZE_SET(x) (((x) & 0xFF) << 0)
156 #define DATA_DIR_TX BIT(0)
157 #define DATA_DIR_RX BIT(1)
159 #define QSPI_DMA_TIMEOUT (msecs_to_jiffies(1000))
160 #define DEFAULT_QSPI_DMA_BUF_LEN (64 * 1024)
161 #define CMD_TRANSFER 0
162 #define ADDR_TRANSFER 1
163 #define DATA_TRANSFER 2
165 struct tegra_qspi_soc_data {
167 bool cmb_xfer_capable;
169 unsigned int cs_count;
172 struct tegra_qspi_client_data {
173 int tx_clk_tap_delay;
174 int rx_clk_tap_delay;
179 struct spi_master *master;
180 /* lock to protect data accessed by irq */
189 unsigned int cur_pos;
190 unsigned int words_per_32bit;
191 unsigned int bytes_per_word;
192 unsigned int curr_dma_words;
193 unsigned int cur_direction;
195 unsigned int cur_rx_pos;
196 unsigned int cur_tx_pos;
198 unsigned int dma_buf_size;
199 unsigned int max_buf_size;
200 bool is_curr_dma_xfer;
202 struct completion rx_dma_complete;
203 struct completion tx_dma_complete;
213 u32 def_command1_reg;
214 u32 def_command2_reg;
219 struct completion xfer_completion;
220 struct spi_transfer *curr_xfer;
222 struct dma_chan *rx_dma_chan;
224 dma_addr_t rx_dma_phys;
225 struct dma_async_tx_descriptor *rx_dma_desc;
227 struct dma_chan *tx_dma_chan;
229 dma_addr_t tx_dma_phys;
230 struct dma_async_tx_descriptor *tx_dma_desc;
231 const struct tegra_qspi_soc_data *soc_data;
234 static inline u32 tegra_qspi_readl(struct tegra_qspi *tqspi, unsigned long offset)
236 return readl(tqspi->base + offset);
239 static inline void tegra_qspi_writel(struct tegra_qspi *tqspi, u32 value, unsigned long offset)
241 writel(value, tqspi->base + offset);
243 /* read back register to make sure that register writes completed */
244 if (offset != QSPI_TX_FIFO)
245 readl(tqspi->base + QSPI_COMMAND1);
248 static void tegra_qspi_mask_clear_irq(struct tegra_qspi *tqspi)
252 /* write 1 to clear status register */
253 value = tegra_qspi_readl(tqspi, QSPI_TRANS_STATUS);
254 tegra_qspi_writel(tqspi, value, QSPI_TRANS_STATUS);
256 value = tegra_qspi_readl(tqspi, QSPI_INTR_MASK);
257 if (!(value & QSPI_INTR_RDY_MASK)) {
258 value |= (QSPI_INTR_RDY_MASK | QSPI_INTR_RX_TX_FIFO_ERR);
259 tegra_qspi_writel(tqspi, value, QSPI_INTR_MASK);
262 /* clear fifo status error if any */
263 value = tegra_qspi_readl(tqspi, QSPI_FIFO_STATUS);
264 if (value & QSPI_ERR)
265 tegra_qspi_writel(tqspi, QSPI_ERR | QSPI_FIFO_ERROR, QSPI_FIFO_STATUS);
269 tegra_qspi_calculate_curr_xfer_param(struct tegra_qspi *tqspi, struct spi_transfer *t)
271 unsigned int max_word, max_len, total_fifo_words;
272 unsigned int remain_len = t->len - tqspi->cur_pos;
273 unsigned int bits_per_word = t->bits_per_word;
275 tqspi->bytes_per_word = DIV_ROUND_UP(bits_per_word, 8);
278 * Tegra QSPI controller supports packed or unpacked mode transfers.
279 * Packed mode is used for data transfers using 8, 16, or 32 bits per
280 * word with a minimum transfer of 1 word and for all other transfers
281 * unpacked mode will be used.
284 if ((bits_per_word == 8 || bits_per_word == 16 ||
285 bits_per_word == 32) && t->len > 3) {
286 tqspi->is_packed = true;
287 tqspi->words_per_32bit = 32 / bits_per_word;
289 tqspi->is_packed = false;
290 tqspi->words_per_32bit = 1;
293 if (tqspi->is_packed) {
294 max_len = min(remain_len, tqspi->max_buf_size);
295 tqspi->curr_dma_words = max_len / tqspi->bytes_per_word;
296 total_fifo_words = (max_len + 3) / 4;
298 max_word = (remain_len - 1) / tqspi->bytes_per_word + 1;
299 max_word = min(max_word, tqspi->max_buf_size / 4);
300 tqspi->curr_dma_words = max_word;
301 total_fifo_words = max_word;
304 return total_fifo_words;
308 tegra_qspi_fill_tx_fifo_from_client_txbuf(struct tegra_qspi *tqspi, struct spi_transfer *t)
310 unsigned int written_words, fifo_words_left, count;
311 unsigned int len, tx_empty_count, max_n_32bit, i;
312 u8 *tx_buf = (u8 *)t->tx_buf + tqspi->cur_tx_pos;
315 fifo_status = tegra_qspi_readl(tqspi, QSPI_FIFO_STATUS);
316 tx_empty_count = QSPI_TX_FIFO_EMPTY_COUNT(fifo_status);
318 if (tqspi->is_packed) {
319 fifo_words_left = tx_empty_count * tqspi->words_per_32bit;
320 written_words = min(fifo_words_left, tqspi->curr_dma_words);
321 len = written_words * tqspi->bytes_per_word;
322 max_n_32bit = DIV_ROUND_UP(len, 4);
323 for (count = 0; count < max_n_32bit; count++) {
326 for (i = 0; (i < 4) && len; i++, len--)
327 x |= (u32)(*tx_buf++) << (i * 8);
328 tegra_qspi_writel(tqspi, x, QSPI_TX_FIFO);
331 tqspi->cur_tx_pos += written_words * tqspi->bytes_per_word;
333 unsigned int write_bytes;
334 u8 bytes_per_word = tqspi->bytes_per_word;
336 max_n_32bit = min(tqspi->curr_dma_words, tx_empty_count);
337 written_words = max_n_32bit;
338 len = written_words * tqspi->bytes_per_word;
339 if (len > t->len - tqspi->cur_pos)
340 len = t->len - tqspi->cur_pos;
342 for (count = 0; count < max_n_32bit; count++) {
345 for (i = 0; len && (i < bytes_per_word); i++, len--)
346 x |= (u32)(*tx_buf++) << (i * 8);
347 tegra_qspi_writel(tqspi, x, QSPI_TX_FIFO);
350 tqspi->cur_tx_pos += write_bytes;
353 return written_words;
357 tegra_qspi_read_rx_fifo_to_client_rxbuf(struct tegra_qspi *tqspi, struct spi_transfer *t)
359 u8 *rx_buf = (u8 *)t->rx_buf + tqspi->cur_rx_pos;
360 unsigned int len, rx_full_count, count, i;
361 unsigned int read_words = 0;
364 fifo_status = tegra_qspi_readl(tqspi, QSPI_FIFO_STATUS);
365 rx_full_count = QSPI_RX_FIFO_FULL_COUNT(fifo_status);
366 if (tqspi->is_packed) {
367 len = tqspi->curr_dma_words * tqspi->bytes_per_word;
368 for (count = 0; count < rx_full_count; count++) {
369 x = tegra_qspi_readl(tqspi, QSPI_RX_FIFO);
371 for (i = 0; len && (i < 4); i++, len--)
372 *rx_buf++ = (x >> i * 8) & 0xff;
375 read_words += tqspi->curr_dma_words;
376 tqspi->cur_rx_pos += tqspi->curr_dma_words * tqspi->bytes_per_word;
378 u32 rx_mask = ((u32)1 << t->bits_per_word) - 1;
379 u8 bytes_per_word = tqspi->bytes_per_word;
380 unsigned int read_bytes;
382 len = rx_full_count * bytes_per_word;
383 if (len > t->len - tqspi->cur_pos)
384 len = t->len - tqspi->cur_pos;
386 for (count = 0; count < rx_full_count; count++) {
387 x = tegra_qspi_readl(tqspi, QSPI_RX_FIFO) & rx_mask;
389 for (i = 0; len && (i < bytes_per_word); i++, len--)
390 *rx_buf++ = (x >> (i * 8)) & 0xff;
393 read_words += rx_full_count;
394 tqspi->cur_rx_pos += read_bytes;
401 tegra_qspi_copy_client_txbuf_to_qspi_txbuf(struct tegra_qspi *tqspi, struct spi_transfer *t)
403 dma_sync_single_for_cpu(tqspi->dev, tqspi->tx_dma_phys,
404 tqspi->dma_buf_size, DMA_TO_DEVICE);
407 * In packed mode, each word in FIFO may contain multiple packets
408 * based on bits per word. So all bytes in each FIFO word are valid.
410 * In unpacked mode, each word in FIFO contains single packet and
411 * based on bits per word any remaining bits in FIFO word will be
412 * ignored by the hardware and are invalid bits.
414 if (tqspi->is_packed) {
415 tqspi->cur_tx_pos += tqspi->curr_dma_words * tqspi->bytes_per_word;
417 u8 *tx_buf = (u8 *)t->tx_buf + tqspi->cur_tx_pos;
418 unsigned int i, count, consume, write_bytes;
421 * Fill tx_dma_buf to contain single packet in each word based
422 * on bits per word from SPI core tx_buf.
424 consume = tqspi->curr_dma_words * tqspi->bytes_per_word;
425 if (consume > t->len - tqspi->cur_pos)
426 consume = t->len - tqspi->cur_pos;
427 write_bytes = consume;
428 for (count = 0; count < tqspi->curr_dma_words; count++) {
431 for (i = 0; consume && (i < tqspi->bytes_per_word); i++, consume--)
432 x |= (u32)(*tx_buf++) << (i * 8);
433 tqspi->tx_dma_buf[count] = x;
436 tqspi->cur_tx_pos += write_bytes;
439 dma_sync_single_for_device(tqspi->dev, tqspi->tx_dma_phys,
440 tqspi->dma_buf_size, DMA_TO_DEVICE);
444 tegra_qspi_copy_qspi_rxbuf_to_client_rxbuf(struct tegra_qspi *tqspi, struct spi_transfer *t)
446 dma_sync_single_for_cpu(tqspi->dev, tqspi->rx_dma_phys,
447 tqspi->dma_buf_size, DMA_FROM_DEVICE);
449 if (tqspi->is_packed) {
450 tqspi->cur_rx_pos += tqspi->curr_dma_words * tqspi->bytes_per_word;
452 unsigned char *rx_buf = t->rx_buf + tqspi->cur_rx_pos;
453 u32 rx_mask = ((u32)1 << t->bits_per_word) - 1;
454 unsigned int i, count, consume, read_bytes;
457 * Each FIFO word contains single data packet.
458 * Skip invalid bits in each FIFO word based on bits per word
459 * and align bytes while filling in SPI core rx_buf.
461 consume = tqspi->curr_dma_words * tqspi->bytes_per_word;
462 if (consume > t->len - tqspi->cur_pos)
463 consume = t->len - tqspi->cur_pos;
464 read_bytes = consume;
465 for (count = 0; count < tqspi->curr_dma_words; count++) {
466 u32 x = tqspi->rx_dma_buf[count] & rx_mask;
468 for (i = 0; consume && (i < tqspi->bytes_per_word); i++, consume--)
469 *rx_buf++ = (x >> (i * 8)) & 0xff;
472 tqspi->cur_rx_pos += read_bytes;
475 dma_sync_single_for_device(tqspi->dev, tqspi->rx_dma_phys,
476 tqspi->dma_buf_size, DMA_FROM_DEVICE);
479 static void tegra_qspi_dma_complete(void *args)
481 struct completion *dma_complete = args;
483 complete(dma_complete);
486 static int tegra_qspi_start_tx_dma(struct tegra_qspi *tqspi, struct spi_transfer *t, int len)
488 dma_addr_t tx_dma_phys;
490 reinit_completion(&tqspi->tx_dma_complete);
492 if (tqspi->is_packed)
493 tx_dma_phys = t->tx_dma;
495 tx_dma_phys = tqspi->tx_dma_phys;
497 tqspi->tx_dma_desc = dmaengine_prep_slave_single(tqspi->tx_dma_chan, tx_dma_phys,
499 DMA_PREP_INTERRUPT | DMA_CTRL_ACK);
501 if (!tqspi->tx_dma_desc) {
502 dev_err(tqspi->dev, "Unable to get TX descriptor\n");
506 tqspi->tx_dma_desc->callback = tegra_qspi_dma_complete;
507 tqspi->tx_dma_desc->callback_param = &tqspi->tx_dma_complete;
508 dmaengine_submit(tqspi->tx_dma_desc);
509 dma_async_issue_pending(tqspi->tx_dma_chan);
514 static int tegra_qspi_start_rx_dma(struct tegra_qspi *tqspi, struct spi_transfer *t, int len)
516 dma_addr_t rx_dma_phys;
518 reinit_completion(&tqspi->rx_dma_complete);
520 if (tqspi->is_packed)
521 rx_dma_phys = t->rx_dma;
523 rx_dma_phys = tqspi->rx_dma_phys;
525 tqspi->rx_dma_desc = dmaengine_prep_slave_single(tqspi->rx_dma_chan, rx_dma_phys,
527 DMA_PREP_INTERRUPT | DMA_CTRL_ACK);
529 if (!tqspi->rx_dma_desc) {
530 dev_err(tqspi->dev, "Unable to get RX descriptor\n");
534 tqspi->rx_dma_desc->callback = tegra_qspi_dma_complete;
535 tqspi->rx_dma_desc->callback_param = &tqspi->rx_dma_complete;
536 dmaengine_submit(tqspi->rx_dma_desc);
537 dma_async_issue_pending(tqspi->rx_dma_chan);
542 static int tegra_qspi_flush_fifos(struct tegra_qspi *tqspi, bool atomic)
544 void __iomem *addr = tqspi->base + QSPI_FIFO_STATUS;
547 val = tegra_qspi_readl(tqspi, QSPI_FIFO_STATUS);
548 if ((val & QSPI_FIFO_EMPTY) == QSPI_FIFO_EMPTY)
551 val |= QSPI_RX_FIFO_FLUSH | QSPI_TX_FIFO_FLUSH;
552 tegra_qspi_writel(tqspi, val, QSPI_FIFO_STATUS);
555 return readl_relaxed_poll_timeout(addr, val,
556 (val & QSPI_FIFO_EMPTY) == QSPI_FIFO_EMPTY,
559 return readl_relaxed_poll_timeout_atomic(addr, val,
560 (val & QSPI_FIFO_EMPTY) == QSPI_FIFO_EMPTY,
564 static void tegra_qspi_unmask_irq(struct tegra_qspi *tqspi)
568 intr_mask = tegra_qspi_readl(tqspi, QSPI_INTR_MASK);
569 intr_mask &= ~(QSPI_INTR_RDY_MASK | QSPI_INTR_RX_TX_FIFO_ERR);
570 tegra_qspi_writel(tqspi, intr_mask, QSPI_INTR_MASK);
573 static int tegra_qspi_dma_map_xfer(struct tegra_qspi *tqspi, struct spi_transfer *t)
575 u8 *tx_buf = (u8 *)t->tx_buf + tqspi->cur_tx_pos;
576 u8 *rx_buf = (u8 *)t->rx_buf + tqspi->cur_rx_pos;
579 len = DIV_ROUND_UP(tqspi->curr_dma_words * tqspi->bytes_per_word, 4) * 4;
582 t->tx_dma = dma_map_single(tqspi->dev, (void *)tx_buf, len, DMA_TO_DEVICE);
583 if (dma_mapping_error(tqspi->dev, t->tx_dma))
588 t->rx_dma = dma_map_single(tqspi->dev, (void *)rx_buf, len, DMA_FROM_DEVICE);
589 if (dma_mapping_error(tqspi->dev, t->rx_dma)) {
590 dma_unmap_single(tqspi->dev, t->tx_dma, len, DMA_TO_DEVICE);
598 static void tegra_qspi_dma_unmap_xfer(struct tegra_qspi *tqspi, struct spi_transfer *t)
602 len = DIV_ROUND_UP(tqspi->curr_dma_words * tqspi->bytes_per_word, 4) * 4;
604 dma_unmap_single(tqspi->dev, t->tx_dma, len, DMA_TO_DEVICE);
605 dma_unmap_single(tqspi->dev, t->rx_dma, len, DMA_FROM_DEVICE);
608 static int tegra_qspi_start_dma_based_transfer(struct tegra_qspi *tqspi, struct spi_transfer *t)
610 struct dma_slave_config dma_sconfig = { 0 };
616 if (tqspi->is_packed) {
617 ret = tegra_qspi_dma_map_xfer(tqspi, t);
622 val = QSPI_DMA_BLK_SET(tqspi->curr_dma_words - 1);
623 tegra_qspi_writel(tqspi, val, QSPI_DMA_BLK);
625 tegra_qspi_unmask_irq(tqspi);
627 if (tqspi->is_packed)
628 len = DIV_ROUND_UP(tqspi->curr_dma_words * tqspi->bytes_per_word, 4) * 4;
630 len = tqspi->curr_dma_words * 4;
632 /* set attention level based on length of transfer */
635 val |= QSPI_TX_TRIG_1 | QSPI_RX_TRIG_1;
637 } else if (((len) >> 4) & 0x1) {
638 val |= QSPI_TX_TRIG_4 | QSPI_RX_TRIG_4;
641 val |= QSPI_TX_TRIG_8 | QSPI_RX_TRIG_8;
645 tegra_qspi_writel(tqspi, val, QSPI_DMA_CTL);
646 tqspi->dma_control_reg = val;
648 dma_sconfig.device_fc = true;
649 if (tqspi->cur_direction & DATA_DIR_TX) {
650 dma_sconfig.dst_addr = tqspi->phys + QSPI_TX_FIFO;
651 dma_sconfig.dst_addr_width = DMA_SLAVE_BUSWIDTH_4_BYTES;
652 dma_sconfig.dst_maxburst = dma_burst;
653 ret = dmaengine_slave_config(tqspi->tx_dma_chan, &dma_sconfig);
655 dev_err(tqspi->dev, "failed DMA slave config: %d\n", ret);
659 tegra_qspi_copy_client_txbuf_to_qspi_txbuf(tqspi, t);
660 ret = tegra_qspi_start_tx_dma(tqspi, t, len);
662 dev_err(tqspi->dev, "failed to starting TX DMA: %d\n", ret);
667 if (tqspi->cur_direction & DATA_DIR_RX) {
668 dma_sconfig.src_addr = tqspi->phys + QSPI_RX_FIFO;
669 dma_sconfig.src_addr_width = DMA_SLAVE_BUSWIDTH_4_BYTES;
670 dma_sconfig.src_maxburst = dma_burst;
671 ret = dmaengine_slave_config(tqspi->rx_dma_chan, &dma_sconfig);
673 dev_err(tqspi->dev, "failed DMA slave config: %d\n", ret);
677 dma_sync_single_for_device(tqspi->dev, tqspi->rx_dma_phys,
681 ret = tegra_qspi_start_rx_dma(tqspi, t, len);
683 dev_err(tqspi->dev, "failed to start RX DMA: %d\n", ret);
684 if (tqspi->cur_direction & DATA_DIR_TX)
685 dmaengine_terminate_all(tqspi->tx_dma_chan);
690 tegra_qspi_writel(tqspi, tqspi->command1_reg, QSPI_COMMAND1);
692 tqspi->is_curr_dma_xfer = true;
693 tqspi->dma_control_reg = val;
695 tegra_qspi_writel(tqspi, val, QSPI_DMA_CTL);
700 static int tegra_qspi_start_cpu_based_transfer(struct tegra_qspi *qspi, struct spi_transfer *t)
703 unsigned int cur_words;
705 if (qspi->cur_direction & DATA_DIR_TX)
706 cur_words = tegra_qspi_fill_tx_fifo_from_client_txbuf(qspi, t);
708 cur_words = qspi->curr_dma_words;
710 val = QSPI_DMA_BLK_SET(cur_words - 1);
711 tegra_qspi_writel(qspi, val, QSPI_DMA_BLK);
713 tegra_qspi_unmask_irq(qspi);
715 qspi->is_curr_dma_xfer = false;
716 val = qspi->command1_reg;
718 tegra_qspi_writel(qspi, val, QSPI_COMMAND1);
723 static void tegra_qspi_deinit_dma(struct tegra_qspi *tqspi)
725 if (!tqspi->soc_data->has_dma)
728 if (tqspi->tx_dma_buf) {
729 dma_free_coherent(tqspi->dev, tqspi->dma_buf_size,
730 tqspi->tx_dma_buf, tqspi->tx_dma_phys);
731 tqspi->tx_dma_buf = NULL;
734 if (tqspi->tx_dma_chan) {
735 dma_release_channel(tqspi->tx_dma_chan);
736 tqspi->tx_dma_chan = NULL;
739 if (tqspi->rx_dma_buf) {
740 dma_free_coherent(tqspi->dev, tqspi->dma_buf_size,
741 tqspi->rx_dma_buf, tqspi->rx_dma_phys);
742 tqspi->rx_dma_buf = NULL;
745 if (tqspi->rx_dma_chan) {
746 dma_release_channel(tqspi->rx_dma_chan);
747 tqspi->rx_dma_chan = NULL;
751 static int tegra_qspi_init_dma(struct tegra_qspi *tqspi)
753 struct dma_chan *dma_chan;
758 if (!tqspi->soc_data->has_dma)
761 dma_chan = dma_request_chan(tqspi->dev, "rx");
762 if (IS_ERR(dma_chan)) {
763 err = PTR_ERR(dma_chan);
767 tqspi->rx_dma_chan = dma_chan;
769 dma_buf = dma_alloc_coherent(tqspi->dev, tqspi->dma_buf_size, &dma_phys, GFP_KERNEL);
775 tqspi->rx_dma_buf = dma_buf;
776 tqspi->rx_dma_phys = dma_phys;
778 dma_chan = dma_request_chan(tqspi->dev, "tx");
779 if (IS_ERR(dma_chan)) {
780 err = PTR_ERR(dma_chan);
784 tqspi->tx_dma_chan = dma_chan;
786 dma_buf = dma_alloc_coherent(tqspi->dev, tqspi->dma_buf_size, &dma_phys, GFP_KERNEL);
792 tqspi->tx_dma_buf = dma_buf;
793 tqspi->tx_dma_phys = dma_phys;
794 tqspi->use_dma = true;
799 tegra_qspi_deinit_dma(tqspi);
801 if (err != -EPROBE_DEFER) {
802 dev_err(tqspi->dev, "cannot use DMA: %d\n", err);
803 dev_err(tqspi->dev, "falling back to PIO\n");
810 static u32 tegra_qspi_setup_transfer_one(struct spi_device *spi, struct spi_transfer *t,
811 bool is_first_of_msg)
813 struct tegra_qspi *tqspi = spi_master_get_devdata(spi->master);
814 struct tegra_qspi_client_data *cdata = spi->controller_data;
815 u32 command1, command2, speed = t->speed_hz;
816 u8 bits_per_word = t->bits_per_word;
817 u32 tx_tap = 0, rx_tap = 0;
820 if (!has_acpi_companion(tqspi->dev) && speed != tqspi->cur_speed) {
821 clk_set_rate(tqspi->clk, speed);
822 tqspi->cur_speed = speed;
826 tqspi->cur_rx_pos = 0;
827 tqspi->cur_tx_pos = 0;
828 tqspi->curr_xfer = t;
830 if (is_first_of_msg) {
831 tegra_qspi_mask_clear_irq(tqspi);
833 command1 = tqspi->def_command1_reg;
834 command1 |= QSPI_CS_SEL(spi_get_chipselect(spi, 0));
835 command1 |= QSPI_BIT_LENGTH(bits_per_word - 1);
837 command1 &= ~QSPI_CONTROL_MODE_MASK;
838 req_mode = spi->mode & 0x3;
839 if (req_mode == SPI_MODE_3)
840 command1 |= QSPI_CONTROL_MODE_3;
842 command1 |= QSPI_CONTROL_MODE_0;
844 if (spi->mode & SPI_CS_HIGH)
845 command1 |= QSPI_CS_SW_VAL;
847 command1 &= ~QSPI_CS_SW_VAL;
848 tegra_qspi_writel(tqspi, command1, QSPI_COMMAND1);
850 if (cdata && cdata->tx_clk_tap_delay)
851 tx_tap = cdata->tx_clk_tap_delay;
853 if (cdata && cdata->rx_clk_tap_delay)
854 rx_tap = cdata->rx_clk_tap_delay;
856 command2 = QSPI_TX_TAP_DELAY(tx_tap) | QSPI_RX_TAP_DELAY(rx_tap);
857 if (command2 != tqspi->def_command2_reg)
858 tegra_qspi_writel(tqspi, command2, QSPI_COMMAND2);
861 command1 = tqspi->command1_reg;
862 command1 &= ~QSPI_BIT_LENGTH(~0);
863 command1 |= QSPI_BIT_LENGTH(bits_per_word - 1);
866 command1 &= ~QSPI_SDR_DDR_SEL;
871 static int tegra_qspi_start_transfer_one(struct spi_device *spi,
872 struct spi_transfer *t, u32 command1)
874 struct tegra_qspi *tqspi = spi_master_get_devdata(spi->master);
875 unsigned int total_fifo_words;
879 total_fifo_words = tegra_qspi_calculate_curr_xfer_param(tqspi, t);
881 command1 &= ~QSPI_PACKED;
882 if (tqspi->is_packed)
883 command1 |= QSPI_PACKED;
884 tegra_qspi_writel(tqspi, command1, QSPI_COMMAND1);
886 tqspi->cur_direction = 0;
888 command1 &= ~(QSPI_TX_EN | QSPI_RX_EN);
890 command1 |= QSPI_RX_EN;
891 tqspi->cur_direction |= DATA_DIR_RX;
892 bus_width = t->rx_nbits;
896 command1 |= QSPI_TX_EN;
897 tqspi->cur_direction |= DATA_DIR_TX;
898 bus_width = t->tx_nbits;
901 command1 &= ~QSPI_INTERFACE_WIDTH_MASK;
903 if (bus_width == SPI_NBITS_QUAD)
904 command1 |= QSPI_INTERFACE_WIDTH_QUAD;
905 else if (bus_width == SPI_NBITS_DUAL)
906 command1 |= QSPI_INTERFACE_WIDTH_DUAL;
908 command1 |= QSPI_INTERFACE_WIDTH_SINGLE;
910 tqspi->command1_reg = command1;
912 tegra_qspi_writel(tqspi, QSPI_NUM_DUMMY_CYCLE(tqspi->dummy_cycles), QSPI_MISC_REG);
914 ret = tegra_qspi_flush_fifos(tqspi, false);
918 if (tqspi->use_dma && total_fifo_words > QSPI_FIFO_DEPTH)
919 ret = tegra_qspi_start_dma_based_transfer(tqspi, t);
921 ret = tegra_qspi_start_cpu_based_transfer(tqspi, t);
926 static struct tegra_qspi_client_data *tegra_qspi_parse_cdata_dt(struct spi_device *spi)
928 struct tegra_qspi_client_data *cdata;
929 struct tegra_qspi *tqspi = spi_master_get_devdata(spi->master);
931 cdata = devm_kzalloc(tqspi->dev, sizeof(*cdata), GFP_KERNEL);
935 device_property_read_u32(&spi->dev, "nvidia,tx-clk-tap-delay",
936 &cdata->tx_clk_tap_delay);
937 device_property_read_u32(&spi->dev, "nvidia,rx-clk-tap-delay",
938 &cdata->rx_clk_tap_delay);
943 static int tegra_qspi_setup(struct spi_device *spi)
945 struct tegra_qspi *tqspi = spi_master_get_devdata(spi->master);
946 struct tegra_qspi_client_data *cdata = spi->controller_data;
951 ret = pm_runtime_resume_and_get(tqspi->dev);
953 dev_err(tqspi->dev, "failed to get runtime PM: %d\n", ret);
958 cdata = tegra_qspi_parse_cdata_dt(spi);
959 spi->controller_data = cdata;
961 spin_lock_irqsave(&tqspi->lock, flags);
963 /* keep default cs state to inactive */
964 val = tqspi->def_command1_reg;
965 val |= QSPI_CS_SEL(spi_get_chipselect(spi, 0));
966 if (spi->mode & SPI_CS_HIGH)
967 val &= ~QSPI_CS_POL_INACTIVE(spi_get_chipselect(spi, 0));
969 val |= QSPI_CS_POL_INACTIVE(spi_get_chipselect(spi, 0));
971 tqspi->def_command1_reg = val;
972 tegra_qspi_writel(tqspi, tqspi->def_command1_reg, QSPI_COMMAND1);
974 spin_unlock_irqrestore(&tqspi->lock, flags);
976 pm_runtime_put(tqspi->dev);
981 static void tegra_qspi_dump_regs(struct tegra_qspi *tqspi)
983 dev_dbg(tqspi->dev, "============ QSPI REGISTER DUMP ============\n");
984 dev_dbg(tqspi->dev, "Command1: 0x%08x | Command2: 0x%08x\n",
985 tegra_qspi_readl(tqspi, QSPI_COMMAND1),
986 tegra_qspi_readl(tqspi, QSPI_COMMAND2));
987 dev_dbg(tqspi->dev, "DMA_CTL: 0x%08x | DMA_BLK: 0x%08x\n",
988 tegra_qspi_readl(tqspi, QSPI_DMA_CTL),
989 tegra_qspi_readl(tqspi, QSPI_DMA_BLK));
990 dev_dbg(tqspi->dev, "INTR_MASK: 0x%08x | MISC: 0x%08x\n",
991 tegra_qspi_readl(tqspi, QSPI_INTR_MASK),
992 tegra_qspi_readl(tqspi, QSPI_MISC_REG));
993 dev_dbg(tqspi->dev, "TRANS_STAT: 0x%08x | FIFO_STATUS: 0x%08x\n",
994 tegra_qspi_readl(tqspi, QSPI_TRANS_STATUS),
995 tegra_qspi_readl(tqspi, QSPI_FIFO_STATUS));
998 static void tegra_qspi_handle_error(struct tegra_qspi *tqspi)
1000 dev_err(tqspi->dev, "error in transfer, fifo status 0x%08x\n", tqspi->status_reg);
1001 tegra_qspi_dump_regs(tqspi);
1002 tegra_qspi_flush_fifos(tqspi, true);
1003 if (device_reset(tqspi->dev) < 0)
1004 dev_warn_once(tqspi->dev, "device reset failed\n");
1007 static void tegra_qspi_transfer_end(struct spi_device *spi)
1009 struct tegra_qspi *tqspi = spi_master_get_devdata(spi->master);
1010 int cs_val = (spi->mode & SPI_CS_HIGH) ? 0 : 1;
1013 tqspi->command1_reg |= QSPI_CS_SW_VAL;
1015 tqspi->command1_reg &= ~QSPI_CS_SW_VAL;
1016 tegra_qspi_writel(tqspi, tqspi->command1_reg, QSPI_COMMAND1);
1017 tegra_qspi_writel(tqspi, tqspi->def_command1_reg, QSPI_COMMAND1);
1020 static u32 tegra_qspi_cmd_config(bool is_ddr, u8 bus_width, u8 len)
1024 /* Extract Command configuration and value */
1026 cmd_config |= QSPI_COMMAND_SDR_DDR;
1028 cmd_config &= ~QSPI_COMMAND_SDR_DDR;
1030 cmd_config |= QSPI_COMMAND_X1_X2_X4(bus_width);
1031 cmd_config |= QSPI_COMMAND_SIZE_SET((len * 8) - 1);
1036 static u32 tegra_qspi_addr_config(bool is_ddr, u8 bus_width, u8 len)
1038 u32 addr_config = 0;
1040 /* Extract Address configuration and value */
1041 is_ddr = 0; //Only SDR mode supported
1042 bus_width = 0; //X1 mode
1045 addr_config |= QSPI_ADDRESS_SDR_DDR;
1047 addr_config &= ~QSPI_ADDRESS_SDR_DDR;
1049 addr_config |= QSPI_ADDRESS_X1_X2_X4(bus_width);
1050 addr_config |= QSPI_ADDRESS_SIZE_SET((len * 8) - 1);
1055 static int tegra_qspi_combined_seq_xfer(struct tegra_qspi *tqspi,
1056 struct spi_message *msg)
1058 bool is_first_msg = true;
1059 struct spi_transfer *xfer;
1060 struct spi_device *spi = msg->spi;
1061 u8 transfer_phase = 0;
1062 u32 cmd1 = 0, dma_ctl = 0;
1064 u32 address_value = 0;
1065 u32 cmd_config = 0, addr_config = 0;
1066 u8 cmd_value = 0, val = 0;
1068 /* Enable Combined sequence mode */
1069 val = tegra_qspi_readl(tqspi, QSPI_GLOBAL_CONFIG);
1070 if (spi->mode & SPI_TPM_HW_FLOW) {
1071 if (tqspi->soc_data->supports_tpm)
1072 val |= QSPI_TPM_WAIT_POLL_EN;
1076 val |= QSPI_CMB_SEQ_EN;
1077 tegra_qspi_writel(tqspi, val, QSPI_GLOBAL_CONFIG);
1078 /* Process individual transfer list */
1079 list_for_each_entry(xfer, &msg->transfers, transfer_list) {
1080 switch (transfer_phase) {
1083 cmd_config = tegra_qspi_cmd_config(false, 0,
1085 cmd_value = *((const u8 *)(xfer->tx_buf));
1089 addr_config = tegra_qspi_addr_config(false, 0,
1091 address_value = *((const u32 *)(xfer->tx_buf));
1094 /* Program Command, Address value in register */
1095 tegra_qspi_writel(tqspi, cmd_value, QSPI_CMB_SEQ_CMD);
1096 tegra_qspi_writel(tqspi, address_value,
1098 /* Program Command and Address config in register */
1099 tegra_qspi_writel(tqspi, cmd_config,
1100 QSPI_CMB_SEQ_CMD_CFG);
1101 tegra_qspi_writel(tqspi, addr_config,
1102 QSPI_CMB_SEQ_ADDR_CFG);
1104 reinit_completion(&tqspi->xfer_completion);
1105 cmd1 = tegra_qspi_setup_transfer_one(spi, xfer,
1107 ret = tegra_qspi_start_transfer_one(spi, xfer,
1111 dev_err(tqspi->dev, "Failed to start transfer-one: %d\n",
1116 is_first_msg = false;
1117 ret = wait_for_completion_timeout
1118 (&tqspi->xfer_completion,
1121 if (WARN_ON(ret == 0)) {
1122 dev_err(tqspi->dev, "QSPI Transfer failed with timeout: %d\n",
1124 if (tqspi->is_curr_dma_xfer &&
1125 (tqspi->cur_direction & DATA_DIR_TX))
1126 dmaengine_terminate_all
1127 (tqspi->tx_dma_chan);
1129 if (tqspi->is_curr_dma_xfer &&
1130 (tqspi->cur_direction & DATA_DIR_RX))
1131 dmaengine_terminate_all
1132 (tqspi->rx_dma_chan);
1134 /* Abort transfer by resetting pio/dma bit */
1135 if (!tqspi->is_curr_dma_xfer) {
1136 cmd1 = tegra_qspi_readl
1144 dma_ctl = tegra_qspi_readl
1147 dma_ctl &= ~QSPI_DMA_EN;
1148 tegra_qspi_writel(tqspi, dma_ctl,
1152 /* Reset controller if timeout happens */
1153 if (device_reset(tqspi->dev) < 0)
1154 dev_warn_once(tqspi->dev,
1155 "device reset failed\n");
1160 if (tqspi->tx_status || tqspi->rx_status) {
1161 dev_err(tqspi->dev, "QSPI Transfer failed\n");
1162 tqspi->tx_status = 0;
1163 tqspi->rx_status = 0;
1167 if (!xfer->cs_change) {
1168 tegra_qspi_transfer_end(spi);
1169 spi_transfer_delay_exec(xfer);
1176 msg->actual_length += xfer->len;
1184 tegra_qspi_transfer_end(spi);
1185 spi_transfer_delay_exec(xfer);
1191 static int tegra_qspi_non_combined_seq_xfer(struct tegra_qspi *tqspi,
1192 struct spi_message *msg)
1194 struct spi_device *spi = msg->spi;
1195 struct spi_transfer *transfer;
1196 bool is_first_msg = true;
1197 int ret = 0, val = 0;
1200 msg->actual_length = 0;
1201 tqspi->tx_status = 0;
1202 tqspi->rx_status = 0;
1204 /* Disable Combined sequence mode */
1205 val = tegra_qspi_readl(tqspi, QSPI_GLOBAL_CONFIG);
1206 val &= ~QSPI_CMB_SEQ_EN;
1207 if (tqspi->soc_data->supports_tpm)
1208 val &= ~QSPI_TPM_WAIT_POLL_EN;
1209 tegra_qspi_writel(tqspi, val, QSPI_GLOBAL_CONFIG);
1210 list_for_each_entry(transfer, &msg->transfers, transfer_list) {
1211 struct spi_transfer *xfer = transfer;
1215 tqspi->dummy_cycles = 0;
1217 * Tegra QSPI hardware supports dummy bytes transfer after actual transfer
1218 * bytes based on programmed dummy clock cycles in the QSPI_MISC register.
1219 * So, check if the next transfer is dummy data transfer and program dummy
1220 * clock cycles along with the current transfer and skip next transfer.
1222 if (!list_is_last(&xfer->transfer_list, &msg->transfers)) {
1223 struct spi_transfer *next_xfer;
1225 next_xfer = list_next_entry(xfer, transfer_list);
1226 if (next_xfer->dummy_data) {
1227 u32 dummy_cycles = next_xfer->len * 8 / next_xfer->tx_nbits;
1229 if (dummy_cycles <= QSPI_DUMMY_CYCLES_MAX) {
1230 tqspi->dummy_cycles = dummy_cycles;
1231 dummy_bytes = next_xfer->len;
1232 transfer = next_xfer;
1237 reinit_completion(&tqspi->xfer_completion);
1239 cmd1 = tegra_qspi_setup_transfer_one(spi, xfer, is_first_msg);
1241 ret = tegra_qspi_start_transfer_one(spi, xfer, cmd1);
1243 dev_err(tqspi->dev, "failed to start transfer: %d\n", ret);
1247 ret = wait_for_completion_timeout(&tqspi->xfer_completion,
1249 if (WARN_ON(ret == 0)) {
1250 dev_err(tqspi->dev, "transfer timeout\n");
1251 if (tqspi->is_curr_dma_xfer && (tqspi->cur_direction & DATA_DIR_TX))
1252 dmaengine_terminate_all(tqspi->tx_dma_chan);
1253 if (tqspi->is_curr_dma_xfer && (tqspi->cur_direction & DATA_DIR_RX))
1254 dmaengine_terminate_all(tqspi->rx_dma_chan);
1255 tegra_qspi_handle_error(tqspi);
1260 if (tqspi->tx_status || tqspi->rx_status) {
1261 tegra_qspi_handle_error(tqspi);
1266 msg->actual_length += xfer->len + dummy_bytes;
1270 tegra_qspi_transfer_end(spi);
1271 spi_transfer_delay_exec(xfer);
1275 if (list_is_last(&xfer->transfer_list, &msg->transfers)) {
1276 /* de-activate CS after last transfer only when cs_change is not set */
1277 if (!xfer->cs_change) {
1278 tegra_qspi_transfer_end(spi);
1279 spi_transfer_delay_exec(xfer);
1281 } else if (xfer->cs_change) {
1282 /* de-activated CS between the transfers only when cs_change is set */
1283 tegra_qspi_transfer_end(spi);
1284 spi_transfer_delay_exec(xfer);
1295 static bool tegra_qspi_validate_cmb_seq(struct tegra_qspi *tqspi,
1296 struct spi_message *msg)
1298 int transfer_count = 0;
1299 struct spi_transfer *xfer;
1301 list_for_each_entry(xfer, &msg->transfers, transfer_list) {
1304 if (!tqspi->soc_data->cmb_xfer_capable || transfer_count != 3)
1306 xfer = list_first_entry(&msg->transfers, typeof(*xfer),
1310 xfer = list_next_entry(xfer, transfer_list);
1311 if (xfer->len > 4 || xfer->len < 3)
1313 xfer = list_next_entry(xfer, transfer_list);
1314 if (!tqspi->soc_data->has_dma && xfer->len > (QSPI_FIFO_DEPTH << 2))
1320 static int tegra_qspi_transfer_one_message(struct spi_master *master,
1321 struct spi_message *msg)
1323 struct tegra_qspi *tqspi = spi_master_get_devdata(master);
1326 if (tegra_qspi_validate_cmb_seq(tqspi, msg))
1327 ret = tegra_qspi_combined_seq_xfer(tqspi, msg);
1329 ret = tegra_qspi_non_combined_seq_xfer(tqspi, msg);
1331 spi_finalize_current_message(master);
1336 static irqreturn_t handle_cpu_based_xfer(struct tegra_qspi *tqspi)
1338 struct spi_transfer *t = tqspi->curr_xfer;
1339 unsigned long flags;
1341 spin_lock_irqsave(&tqspi->lock, flags);
1343 if (tqspi->tx_status || tqspi->rx_status) {
1344 tegra_qspi_handle_error(tqspi);
1345 complete(&tqspi->xfer_completion);
1349 if (tqspi->cur_direction & DATA_DIR_RX)
1350 tegra_qspi_read_rx_fifo_to_client_rxbuf(tqspi, t);
1352 if (tqspi->cur_direction & DATA_DIR_TX)
1353 tqspi->cur_pos = tqspi->cur_tx_pos;
1355 tqspi->cur_pos = tqspi->cur_rx_pos;
1357 if (tqspi->cur_pos == t->len) {
1358 complete(&tqspi->xfer_completion);
1362 tegra_qspi_calculate_curr_xfer_param(tqspi, t);
1363 tegra_qspi_start_cpu_based_transfer(tqspi, t);
1365 spin_unlock_irqrestore(&tqspi->lock, flags);
1369 static irqreturn_t handle_dma_based_xfer(struct tegra_qspi *tqspi)
1371 struct spi_transfer *t = tqspi->curr_xfer;
1372 unsigned int total_fifo_words;
1373 unsigned long flags;
1377 if (tqspi->cur_direction & DATA_DIR_TX) {
1378 if (tqspi->tx_status) {
1379 dmaengine_terminate_all(tqspi->tx_dma_chan);
1382 wait_status = wait_for_completion_interruptible_timeout(
1383 &tqspi->tx_dma_complete, QSPI_DMA_TIMEOUT);
1384 if (wait_status <= 0) {
1385 dmaengine_terminate_all(tqspi->tx_dma_chan);
1386 dev_err(tqspi->dev, "failed TX DMA transfer\n");
1392 if (tqspi->cur_direction & DATA_DIR_RX) {
1393 if (tqspi->rx_status) {
1394 dmaengine_terminate_all(tqspi->rx_dma_chan);
1397 wait_status = wait_for_completion_interruptible_timeout(
1398 &tqspi->rx_dma_complete, QSPI_DMA_TIMEOUT);
1399 if (wait_status <= 0) {
1400 dmaengine_terminate_all(tqspi->rx_dma_chan);
1401 dev_err(tqspi->dev, "failed RX DMA transfer\n");
1407 spin_lock_irqsave(&tqspi->lock, flags);
1410 tegra_qspi_dma_unmap_xfer(tqspi, t);
1411 tegra_qspi_handle_error(tqspi);
1412 complete(&tqspi->xfer_completion);
1416 if (tqspi->cur_direction & DATA_DIR_RX)
1417 tegra_qspi_copy_qspi_rxbuf_to_client_rxbuf(tqspi, t);
1419 if (tqspi->cur_direction & DATA_DIR_TX)
1420 tqspi->cur_pos = tqspi->cur_tx_pos;
1422 tqspi->cur_pos = tqspi->cur_rx_pos;
1424 if (tqspi->cur_pos == t->len) {
1425 tegra_qspi_dma_unmap_xfer(tqspi, t);
1426 complete(&tqspi->xfer_completion);
1430 tegra_qspi_dma_unmap_xfer(tqspi, t);
1432 /* continue transfer in current message */
1433 total_fifo_words = tegra_qspi_calculate_curr_xfer_param(tqspi, t);
1434 if (total_fifo_words > QSPI_FIFO_DEPTH)
1435 err = tegra_qspi_start_dma_based_transfer(tqspi, t);
1437 err = tegra_qspi_start_cpu_based_transfer(tqspi, t);
1440 spin_unlock_irqrestore(&tqspi->lock, flags);
1444 static irqreturn_t tegra_qspi_isr_thread(int irq, void *context_data)
1446 struct tegra_qspi *tqspi = context_data;
1448 tqspi->status_reg = tegra_qspi_readl(tqspi, QSPI_FIFO_STATUS);
1450 if (tqspi->cur_direction & DATA_DIR_TX)
1451 tqspi->tx_status = tqspi->status_reg & (QSPI_TX_FIFO_UNF | QSPI_TX_FIFO_OVF);
1453 if (tqspi->cur_direction & DATA_DIR_RX)
1454 tqspi->rx_status = tqspi->status_reg & (QSPI_RX_FIFO_OVF | QSPI_RX_FIFO_UNF);
1456 tegra_qspi_mask_clear_irq(tqspi);
1458 if (!tqspi->is_curr_dma_xfer)
1459 return handle_cpu_based_xfer(tqspi);
1461 return handle_dma_based_xfer(tqspi);
1464 static struct tegra_qspi_soc_data tegra210_qspi_soc_data = {
1466 .cmb_xfer_capable = false,
1467 .supports_tpm = false,
1471 static struct tegra_qspi_soc_data tegra186_qspi_soc_data = {
1473 .cmb_xfer_capable = true,
1474 .supports_tpm = false,
1478 static struct tegra_qspi_soc_data tegra234_qspi_soc_data = {
1480 .cmb_xfer_capable = true,
1481 .supports_tpm = true,
1485 static struct tegra_qspi_soc_data tegra241_qspi_soc_data = {
1487 .cmb_xfer_capable = true,
1488 .supports_tpm = true,
1492 static const struct of_device_id tegra_qspi_of_match[] = {
1494 .compatible = "nvidia,tegra210-qspi",
1495 .data = &tegra210_qspi_soc_data,
1497 .compatible = "nvidia,tegra186-qspi",
1498 .data = &tegra186_qspi_soc_data,
1500 .compatible = "nvidia,tegra194-qspi",
1501 .data = &tegra186_qspi_soc_data,
1503 .compatible = "nvidia,tegra234-qspi",
1504 .data = &tegra234_qspi_soc_data,
1506 .compatible = "nvidia,tegra241-qspi",
1507 .data = &tegra241_qspi_soc_data,
1512 MODULE_DEVICE_TABLE(of, tegra_qspi_of_match);
1515 static const struct acpi_device_id tegra_qspi_acpi_match[] = {
1518 .driver_data = (kernel_ulong_t)&tegra210_qspi_soc_data,
1521 .driver_data = (kernel_ulong_t)&tegra186_qspi_soc_data,
1524 .driver_data = (kernel_ulong_t)&tegra234_qspi_soc_data,
1527 .driver_data = (kernel_ulong_t)&tegra241_qspi_soc_data,
1532 MODULE_DEVICE_TABLE(acpi, tegra_qspi_acpi_match);
1535 static int tegra_qspi_probe(struct platform_device *pdev)
1537 struct spi_master *master;
1538 struct tegra_qspi *tqspi;
1543 master = devm_spi_alloc_master(&pdev->dev, sizeof(*tqspi));
1547 platform_set_drvdata(pdev, master);
1548 tqspi = spi_master_get_devdata(master);
1550 master->mode_bits = SPI_MODE_0 | SPI_MODE_3 | SPI_CS_HIGH |
1551 SPI_TX_DUAL | SPI_RX_DUAL | SPI_TX_QUAD | SPI_RX_QUAD;
1552 master->bits_per_word_mask = SPI_BPW_MASK(32) | SPI_BPW_MASK(16) | SPI_BPW_MASK(8);
1553 master->flags = SPI_CONTROLLER_HALF_DUPLEX;
1554 master->setup = tegra_qspi_setup;
1555 master->transfer_one_message = tegra_qspi_transfer_one_message;
1556 master->num_chipselect = 1;
1557 master->auto_runtime_pm = true;
1559 bus_num = of_alias_get_id(pdev->dev.of_node, "spi");
1561 master->bus_num = bus_num;
1563 tqspi->master = master;
1564 tqspi->dev = &pdev->dev;
1565 spin_lock_init(&tqspi->lock);
1567 tqspi->soc_data = device_get_match_data(&pdev->dev);
1568 master->num_chipselect = tqspi->soc_data->cs_count;
1569 tqspi->base = devm_platform_get_and_ioremap_resource(pdev, 0, &r);
1570 if (IS_ERR(tqspi->base))
1571 return PTR_ERR(tqspi->base);
1573 tqspi->phys = r->start;
1574 qspi_irq = platform_get_irq(pdev, 0);
1577 tqspi->irq = qspi_irq;
1579 if (!has_acpi_companion(tqspi->dev)) {
1580 tqspi->clk = devm_clk_get(&pdev->dev, "qspi");
1581 if (IS_ERR(tqspi->clk)) {
1582 ret = PTR_ERR(tqspi->clk);
1583 dev_err(&pdev->dev, "failed to get clock: %d\n", ret);
1589 tqspi->max_buf_size = QSPI_FIFO_DEPTH << 2;
1590 tqspi->dma_buf_size = DEFAULT_QSPI_DMA_BUF_LEN;
1592 ret = tegra_qspi_init_dma(tqspi);
1597 tqspi->max_buf_size = tqspi->dma_buf_size;
1599 init_completion(&tqspi->tx_dma_complete);
1600 init_completion(&tqspi->rx_dma_complete);
1601 init_completion(&tqspi->xfer_completion);
1603 pm_runtime_enable(&pdev->dev);
1604 ret = pm_runtime_resume_and_get(&pdev->dev);
1606 dev_err(&pdev->dev, "failed to get runtime PM: %d\n", ret);
1607 goto exit_pm_disable;
1610 if (device_reset(tqspi->dev) < 0)
1611 dev_warn_once(tqspi->dev, "device reset failed\n");
1613 tqspi->def_command1_reg = QSPI_M_S | QSPI_CS_SW_HW | QSPI_CS_SW_VAL;
1614 tegra_qspi_writel(tqspi, tqspi->def_command1_reg, QSPI_COMMAND1);
1615 tqspi->spi_cs_timing1 = tegra_qspi_readl(tqspi, QSPI_CS_TIMING1);
1616 tqspi->spi_cs_timing2 = tegra_qspi_readl(tqspi, QSPI_CS_TIMING2);
1617 tqspi->def_command2_reg = tegra_qspi_readl(tqspi, QSPI_COMMAND2);
1619 pm_runtime_put(&pdev->dev);
1621 ret = request_threaded_irq(tqspi->irq, NULL,
1622 tegra_qspi_isr_thread, IRQF_ONESHOT,
1623 dev_name(&pdev->dev), tqspi);
1625 dev_err(&pdev->dev, "failed to request IRQ#%u: %d\n", tqspi->irq, ret);
1626 goto exit_pm_disable;
1629 master->dev.of_node = pdev->dev.of_node;
1630 ret = spi_register_master(master);
1632 dev_err(&pdev->dev, "failed to register master: %d\n", ret);
1639 free_irq(qspi_irq, tqspi);
1641 pm_runtime_force_suspend(&pdev->dev);
1642 tegra_qspi_deinit_dma(tqspi);
1646 static void tegra_qspi_remove(struct platform_device *pdev)
1648 struct spi_master *master = platform_get_drvdata(pdev);
1649 struct tegra_qspi *tqspi = spi_master_get_devdata(master);
1651 spi_unregister_master(master);
1652 free_irq(tqspi->irq, tqspi);
1653 pm_runtime_force_suspend(&pdev->dev);
1654 tegra_qspi_deinit_dma(tqspi);
1657 static int __maybe_unused tegra_qspi_suspend(struct device *dev)
1659 struct spi_master *master = dev_get_drvdata(dev);
1661 return spi_master_suspend(master);
1664 static int __maybe_unused tegra_qspi_resume(struct device *dev)
1666 struct spi_master *master = dev_get_drvdata(dev);
1667 struct tegra_qspi *tqspi = spi_master_get_devdata(master);
1670 ret = pm_runtime_resume_and_get(dev);
1672 dev_err(dev, "failed to get runtime PM: %d\n", ret);
1676 tegra_qspi_writel(tqspi, tqspi->command1_reg, QSPI_COMMAND1);
1677 tegra_qspi_writel(tqspi, tqspi->def_command2_reg, QSPI_COMMAND2);
1678 pm_runtime_put(dev);
1680 return spi_master_resume(master);
1683 static int __maybe_unused tegra_qspi_runtime_suspend(struct device *dev)
1685 struct spi_master *master = dev_get_drvdata(dev);
1686 struct tegra_qspi *tqspi = spi_master_get_devdata(master);
1688 /* Runtime pm disabled with ACPI */
1689 if (has_acpi_companion(tqspi->dev))
1691 /* flush all write which are in PPSB queue by reading back */
1692 tegra_qspi_readl(tqspi, QSPI_COMMAND1);
1694 clk_disable_unprepare(tqspi->clk);
1699 static int __maybe_unused tegra_qspi_runtime_resume(struct device *dev)
1701 struct spi_master *master = dev_get_drvdata(dev);
1702 struct tegra_qspi *tqspi = spi_master_get_devdata(master);
1705 /* Runtime pm disabled with ACPI */
1706 if (has_acpi_companion(tqspi->dev))
1708 ret = clk_prepare_enable(tqspi->clk);
1710 dev_err(tqspi->dev, "failed to enable clock: %d\n", ret);
1715 static const struct dev_pm_ops tegra_qspi_pm_ops = {
1716 SET_RUNTIME_PM_OPS(tegra_qspi_runtime_suspend, tegra_qspi_runtime_resume, NULL)
1717 SET_SYSTEM_SLEEP_PM_OPS(tegra_qspi_suspend, tegra_qspi_resume)
1720 static struct platform_driver tegra_qspi_driver = {
1722 .name = "tegra-qspi",
1723 .pm = &tegra_qspi_pm_ops,
1724 .of_match_table = tegra_qspi_of_match,
1725 .acpi_match_table = ACPI_PTR(tegra_qspi_acpi_match),
1727 .probe = tegra_qspi_probe,
1728 .remove_new = tegra_qspi_remove,
1730 module_platform_driver(tegra_qspi_driver);
1732 MODULE_ALIAS("platform:qspi-tegra");
1733 MODULE_DESCRIPTION("NVIDIA Tegra QSPI Controller Driver");
1734 MODULE_AUTHOR("Sowjanya Komatineni <skomatineni@nvidia.com>");
1735 MODULE_LICENSE("GPL v2");