1 // SPDX-License-Identifier: GPL-2.0-only
3 // Copyright (C) 2020 NVIDIA CORPORATION.
6 #include <linux/completion.h>
7 #include <linux/delay.h>
8 #include <linux/dmaengine.h>
9 #include <linux/dma-mapping.h>
10 #include <linux/dmapool.h>
11 #include <linux/err.h>
12 #include <linux/interrupt.h>
14 #include <linux/iopoll.h>
15 #include <linux/kernel.h>
16 #include <linux/kthread.h>
17 #include <linux/module.h>
18 #include <linux/platform_device.h>
19 #include <linux/pm_runtime.h>
21 #include <linux/of_device.h>
22 #include <linux/reset.h>
23 #include <linux/spi/spi.h>
24 #include <linux/acpi.h>
25 #include <linux/property.h>
27 #define QSPI_COMMAND1 0x000
28 #define QSPI_BIT_LENGTH(x) (((x) & 0x1f) << 0)
29 #define QSPI_PACKED BIT(5)
30 #define QSPI_INTERFACE_WIDTH_MASK (0x03 << 7)
31 #define QSPI_INTERFACE_WIDTH(x) (((x) & 0x03) << 7)
32 #define QSPI_INTERFACE_WIDTH_SINGLE QSPI_INTERFACE_WIDTH(0)
33 #define QSPI_INTERFACE_WIDTH_DUAL QSPI_INTERFACE_WIDTH(1)
34 #define QSPI_INTERFACE_WIDTH_QUAD QSPI_INTERFACE_WIDTH(2)
35 #define QSPI_SDR_DDR_SEL BIT(9)
36 #define QSPI_TX_EN BIT(11)
37 #define QSPI_RX_EN BIT(12)
38 #define QSPI_CS_SW_VAL BIT(20)
39 #define QSPI_CS_SW_HW BIT(21)
41 #define QSPI_CS_POL_INACTIVE(n) (1 << (22 + (n)))
42 #define QSPI_CS_POL_INACTIVE_MASK (0xF << 22)
43 #define QSPI_CS_SEL_0 (0 << 26)
44 #define QSPI_CS_SEL_1 (1 << 26)
45 #define QSPI_CS_SEL_2 (2 << 26)
46 #define QSPI_CS_SEL_3 (3 << 26)
47 #define QSPI_CS_SEL_MASK (3 << 26)
48 #define QSPI_CS_SEL(x) (((x) & 0x3) << 26)
50 #define QSPI_CONTROL_MODE_0 (0 << 28)
51 #define QSPI_CONTROL_MODE_3 (3 << 28)
52 #define QSPI_CONTROL_MODE_MASK (3 << 28)
53 #define QSPI_M_S BIT(30)
54 #define QSPI_PIO BIT(31)
56 #define QSPI_COMMAND2 0x004
57 #define QSPI_TX_TAP_DELAY(x) (((x) & 0x3f) << 10)
58 #define QSPI_RX_TAP_DELAY(x) (((x) & 0xff) << 0)
60 #define QSPI_CS_TIMING1 0x008
61 #define QSPI_SETUP_HOLD(setup, hold) (((setup) << 4) | (hold))
63 #define QSPI_CS_TIMING2 0x00c
64 #define CYCLES_BETWEEN_PACKETS_0(x) (((x) & 0x1f) << 0)
65 #define CS_ACTIVE_BETWEEN_PACKETS_0 BIT(5)
67 #define QSPI_TRANS_STATUS 0x010
68 #define QSPI_BLK_CNT(val) (((val) >> 0) & 0xffff)
69 #define QSPI_RDY BIT(30)
71 #define QSPI_FIFO_STATUS 0x014
72 #define QSPI_RX_FIFO_EMPTY BIT(0)
73 #define QSPI_RX_FIFO_FULL BIT(1)
74 #define QSPI_TX_FIFO_EMPTY BIT(2)
75 #define QSPI_TX_FIFO_FULL BIT(3)
76 #define QSPI_RX_FIFO_UNF BIT(4)
77 #define QSPI_RX_FIFO_OVF BIT(5)
78 #define QSPI_TX_FIFO_UNF BIT(6)
79 #define QSPI_TX_FIFO_OVF BIT(7)
80 #define QSPI_ERR BIT(8)
81 #define QSPI_TX_FIFO_FLUSH BIT(14)
82 #define QSPI_RX_FIFO_FLUSH BIT(15)
83 #define QSPI_TX_FIFO_EMPTY_COUNT(val) (((val) >> 16) & 0x7f)
84 #define QSPI_RX_FIFO_FULL_COUNT(val) (((val) >> 23) & 0x7f)
86 #define QSPI_FIFO_ERROR (QSPI_RX_FIFO_UNF | \
90 #define QSPI_FIFO_EMPTY (QSPI_RX_FIFO_EMPTY | \
93 #define QSPI_TX_DATA 0x018
94 #define QSPI_RX_DATA 0x01c
96 #define QSPI_DMA_CTL 0x020
97 #define QSPI_TX_TRIG(n) (((n) & 0x3) << 15)
98 #define QSPI_TX_TRIG_1 QSPI_TX_TRIG(0)
99 #define QSPI_TX_TRIG_4 QSPI_TX_TRIG(1)
100 #define QSPI_TX_TRIG_8 QSPI_TX_TRIG(2)
101 #define QSPI_TX_TRIG_16 QSPI_TX_TRIG(3)
103 #define QSPI_RX_TRIG(n) (((n) & 0x3) << 19)
104 #define QSPI_RX_TRIG_1 QSPI_RX_TRIG(0)
105 #define QSPI_RX_TRIG_4 QSPI_RX_TRIG(1)
106 #define QSPI_RX_TRIG_8 QSPI_RX_TRIG(2)
107 #define QSPI_RX_TRIG_16 QSPI_RX_TRIG(3)
109 #define QSPI_DMA_EN BIT(31)
111 #define QSPI_DMA_BLK 0x024
112 #define QSPI_DMA_BLK_SET(x) (((x) & 0xffff) << 0)
114 #define QSPI_TX_FIFO 0x108
115 #define QSPI_RX_FIFO 0x188
117 #define QSPI_FIFO_DEPTH 64
119 #define QSPI_INTR_MASK 0x18c
120 #define QSPI_INTR_RX_FIFO_UNF_MASK BIT(25)
121 #define QSPI_INTR_RX_FIFO_OVF_MASK BIT(26)
122 #define QSPI_INTR_TX_FIFO_UNF_MASK BIT(27)
123 #define QSPI_INTR_TX_FIFO_OVF_MASK BIT(28)
124 #define QSPI_INTR_RDY_MASK BIT(29)
125 #define QSPI_INTR_RX_TX_FIFO_ERR (QSPI_INTR_RX_FIFO_UNF_MASK | \
126 QSPI_INTR_RX_FIFO_OVF_MASK | \
127 QSPI_INTR_TX_FIFO_UNF_MASK | \
128 QSPI_INTR_TX_FIFO_OVF_MASK)
130 #define QSPI_MISC_REG 0x194
131 #define QSPI_NUM_DUMMY_CYCLE(x) (((x) & 0xff) << 0)
132 #define QSPI_DUMMY_CYCLES_MAX 0xff
134 #define QSPI_CMB_SEQ_CMD 0x19c
/* Mask @x to the 8-bit value field (bits 7:0) of QSPI_CMB_SEQ_CMD. */
#define QSPI_COMMAND_VALUE_SET(x) (((x) & 0xFF) << 0)
137 #define QSPI_CMB_SEQ_CMD_CFG 0x1a0
138 #define QSPI_COMMAND_X1_X2_X4(x) (((x) & 0x3) << 13)
139 #define QSPI_COMMAND_X1_X2_X4_MASK (0x03 << 13)
140 #define QSPI_COMMAND_SDR_DDR BIT(12)
141 #define QSPI_COMMAND_SIZE_SET(x) (((x) & 0xFF) << 0)
/* Register offset; bit 0 (QSPI_CMB_SEQ_EN) switches combined-sequence mode. */
#define QSPI_GLOBAL_CONFIG 0x1a4
144 #define QSPI_CMB_SEQ_EN BIT(0)
146 #define QSPI_CMB_SEQ_ADDR 0x1a8
/*
 * Mask @x to the low 16 bits for QSPI_CMB_SEQ_ADDR.
 * NOTE(review): the mask is 16 bits wide although address phases of 3-4
 * bytes are used elsewhere in this driver - confirm the intended width.
 */
#define QSPI_ADDRESS_VALUE_SET(x) (((x) & 0xFFFF) << 0)
149 #define QSPI_CMB_SEQ_ADDR_CFG 0x1ac
150 #define QSPI_ADDRESS_X1_X2_X4(x) (((x) & 0x3) << 13)
151 #define QSPI_ADDRESS_X1_X2_X4_MASK (0x03 << 13)
152 #define QSPI_ADDRESS_SDR_DDR BIT(12)
153 #define QSPI_ADDRESS_SIZE_SET(x) (((x) & 0xFF) << 0)
155 #define DATA_DIR_TX BIT(0)
156 #define DATA_DIR_RX BIT(1)
158 #define QSPI_DMA_TIMEOUT (msecs_to_jiffies(1000))
159 #define DEFAULT_QSPI_DMA_BUF_LEN (64 * 1024)
160 #define CMD_TRANSFER 0
161 #define ADDR_TRANSFER 1
162 #define DATA_TRANSFER 2
/*
 * Per-SoC capability description, reached through tqspi->soc_data.
 * NOTE(review): a has_dma member is read elsewhere in this file but its
 * declaration is not visible in this listing.
 */
164 struct tegra_qspi_soc_data {
/* true when the controller may use combined command/address/data sequences */
166 bool cmb_xfer_capable;
/* presumably the number of chip selects on this SoC - not used in the visible code */
167 unsigned int cs_count;
/*
 * Per-client tuning data stored in spi->controller_data.
 * Both values are read from firmware properties in tegra_qspi_parse_cdata_dt()
 * and programmed into QSPI_COMMAND2 by tegra_qspi_setup_transfer_one().
 */
170 struct tegra_qspi_client_data {
/* value for the QSPI_TX_TAP_DELAY() field */
171 int tx_clk_tap_delay;
/* value for the QSPI_RX_TAP_DELAY() field */
172 int rx_clk_tap_delay;
/*
 * Members of the driver state structure (struct tegra_qspi).
 * NOTE(review): the opening line of the struct and several members used
 * elsewhere in this file (e.g. dev, base, lock, clk, is_packed, use_dma,
 * tx_dma_buf, rx_dma_buf, command1_reg) are not visible in this listing.
 */
177 struct spi_master *master;
178 /* lock to protect data accessed by irq */
/* cur_pos: byte offset into the current transfer, subtracted from t->len */
187 unsigned int cur_pos;
/* FIFO packing parameters computed by tegra_qspi_calculate_curr_xfer_param() */
188 unsigned int words_per_32bit;
189 unsigned int bytes_per_word;
190 unsigned int curr_dma_words;
/* bitmask of DATA_DIR_TX / DATA_DIR_RX for the transfer in flight */
191 unsigned int cur_direction;
/* byte offsets into the current transfer's rx_buf / tx_buf */
193 unsigned int cur_rx_pos;
194 unsigned int cur_tx_pos;
/* dma_buf_size: size of each coherent DMA buffer; max_buf_size caps one chunk */
196 unsigned int dma_buf_size;
197 unsigned int max_buf_size;
/* true while the chunk in flight was started by the DMA path */
198 bool is_curr_dma_xfer;
/* completed by tegra_qspi_dma_complete() from the DMA descriptor callback */
200 struct completion rx_dma_complete;
201 struct completion tx_dma_complete;
/* default QSPI_COMMAND1 / QSPI_COMMAND2 values */
211 u32 def_command1_reg;
212 u32 def_command2_reg;
/* waited on by the message loops for each transfer */
217 struct completion xfer_completion;
218 struct spi_transfer *curr_xfer;
/* RX DMA channel, bus address of the RX buffer, and current descriptor */
220 struct dma_chan *rx_dma_chan;
222 dma_addr_t rx_dma_phys;
223 struct dma_async_tx_descriptor *rx_dma_desc;
/* TX DMA channel, bus address of the TX buffer, and current descriptor */
225 struct dma_chan *tx_dma_chan;
227 dma_addr_t tx_dma_phys;
228 struct dma_async_tx_descriptor *tx_dma_desc;
229 const struct tegra_qspi_soc_data *soc_data;
/* Read the 32-bit controller register located @offset bytes from tqspi->base. */
232 static inline u32 tegra_qspi_readl(struct tegra_qspi *tqspi, unsigned long offset)
234 return readl(tqspi->base + offset);
/*
 * Write @value to the controller register at @offset from tqspi->base.
 * Every write except one to QSPI_TX_FIFO is followed by a read of
 * QSPI_COMMAND1 whose result is discarded.
 */
237 static inline void tegra_qspi_writel(struct tegra_qspi *tqspi, u32 value, unsigned long offset)
239 writel(value, tqspi->base + offset);
241 /* read back register to make sure that register writes completed */
242 if (offset != QSPI_TX_FIFO)
243 readl(tqspi->base + QSPI_COMMAND1);
/*
 * Clear pending status and mask the controller interrupts:
 *  - write the current QSPI_TRANS_STATUS value back to the register,
 *  - if QSPI_INTR_RDY_MASK is not yet set in QSPI_INTR_MASK, set it together
 *    with the four FIFO error mask bits,
 *  - if QSPI_FIFO_STATUS reports QSPI_ERR, write the error bits back to it.
 * NOTE(review): the declaration of `value` is not visible in this listing.
 */
246 static void tegra_qspi_mask_clear_irq(struct tegra_qspi *tqspi)
250 /* write 1 to clear status register */
251 value = tegra_qspi_readl(tqspi, QSPI_TRANS_STATUS);
252 tegra_qspi_writel(tqspi, value, QSPI_TRANS_STATUS);
254 value = tegra_qspi_readl(tqspi, QSPI_INTR_MASK);
255 if (!(value & QSPI_INTR_RDY_MASK)) {
256 value |= (QSPI_INTR_RDY_MASK | QSPI_INTR_RX_TX_FIFO_ERR);
257 tegra_qspi_writel(tqspi, value, QSPI_INTR_MASK);
260 /* clear fifo status error if any */
261 value = tegra_qspi_readl(tqspi, QSPI_FIFO_STATUS);
262 if (value & QSPI_ERR)
263 tegra_qspi_writel(tqspi, QSPI_ERR | QSPI_FIFO_ERROR, QSPI_FIFO_STATUS);
/*
 * Compute the packing parameters for the next chunk of transfer @t, starting
 * at byte offset tqspi->cur_pos.
 *
 * Updates tqspi->bytes_per_word, is_packed, words_per_32bit and
 * curr_dma_words, and returns the number of 32-bit FIFO words the chunk
 * occupies.
 *
 * NOTE(review): the existing comment below speaks of "a minimum transfer of
 * 1 word", while the visible condition selects packed mode only when
 * t->len > 3 - confirm which is intended.
 */
267 tegra_qspi_calculate_curr_xfer_param(struct tegra_qspi *tqspi, struct spi_transfer *t)
269 unsigned int max_word, max_len, total_fifo_words;
270 unsigned int remain_len = t->len - tqspi->cur_pos;
271 unsigned int bits_per_word = t->bits_per_word;
273 tqspi->bytes_per_word = DIV_ROUND_UP(bits_per_word, 8);
276 * Tegra QSPI controller supports packed or unpacked mode transfers.
277 * Packed mode is used for data transfers using 8, 16, or 32 bits per
278 * word with a minimum transfer of 1 word and for all other transfers
279 * unpacked mode will be used.
282 if ((bits_per_word == 8 || bits_per_word == 16 ||
283 bits_per_word == 32) && t->len > 3) {
284 tqspi->is_packed = true;
285 tqspi->words_per_32bit = 32 / bits_per_word;
287 tqspi->is_packed = false;
288 tqspi->words_per_32bit = 1;
/* packed: chunk is limited in bytes and rounded up to whole 32-bit FIFO words */
291 if (tqspi->is_packed) {
292 max_len = min(remain_len, tqspi->max_buf_size);
293 tqspi->curr_dma_words = max_len / tqspi->bytes_per_word;
294 total_fifo_words = (max_len + 3) / 4;
/* unpacked: one data word per FIFO word, so at most max_buf_size / 4 words */
296 max_word = (remain_len - 1) / tqspi->bytes_per_word + 1;
297 max_word = min(max_word, tqspi->max_buf_size / 4);
298 tqspi->curr_dma_words = max_word;
299 total_fifo_words = max_word;
302 return total_fifo_words;
/*
 * PIO path: copy bytes from t->tx_buf (starting at tqspi->cur_tx_pos) into
 * the TX FIFO and advance tqspi->cur_tx_pos.
 *
 * The amount written is bounded by the free-entry count read from
 * QSPI_FIFO_STATUS and by tqspi->curr_dma_words. Bytes are assembled into
 * each 32-bit FIFO word lowest byte first (byte i goes to bits i*8).
 * Returns the number of data words written.
 *
 * NOTE(review): the declarations of fifo_status and x, and the assignment
 * of write_bytes, are not visible in this listing.
 */
306 tegra_qspi_fill_tx_fifo_from_client_txbuf(struct tegra_qspi *tqspi, struct spi_transfer *t)
308 unsigned int written_words, fifo_words_left, count;
309 unsigned int len, tx_empty_count, max_n_32bit, i;
310 u8 *tx_buf = (u8 *)t->tx_buf + tqspi->cur_tx_pos;
313 fifo_status = tegra_qspi_readl(tqspi, QSPI_FIFO_STATUS);
314 tx_empty_count = QSPI_TX_FIFO_EMPTY_COUNT(fifo_status);
/* packed: up to four bytes per FIFO word */
316 if (tqspi->is_packed) {
317 fifo_words_left = tx_empty_count * tqspi->words_per_32bit;
318 written_words = min(fifo_words_left, tqspi->curr_dma_words);
319 len = written_words * tqspi->bytes_per_word;
320 max_n_32bit = DIV_ROUND_UP(len, 4);
321 for (count = 0; count < max_n_32bit; count++) {
324 for (i = 0; (i < 4) && len; i++, len--)
325 x |= (u32)(*tx_buf++) << (i * 8);
326 tegra_qspi_writel(tqspi, x, QSPI_TX_FIFO);
329 tqspi->cur_tx_pos += written_words * tqspi->bytes_per_word;
/* unpacked: one data word (bytes_per_word bytes) per FIFO word */
331 unsigned int write_bytes;
332 u8 bytes_per_word = tqspi->bytes_per_word;
334 max_n_32bit = min(tqspi->curr_dma_words, tx_empty_count);
335 written_words = max_n_32bit;
336 len = written_words * tqspi->bytes_per_word;
/* never read past the end of the client buffer */
337 if (len > t->len - tqspi->cur_pos)
338 len = t->len - tqspi->cur_pos;
340 for (count = 0; count < max_n_32bit; count++) {
343 for (i = 0; len && (i < bytes_per_word); i++, len--)
344 x |= (u32)(*tx_buf++) << (i * 8);
345 tegra_qspi_writel(tqspi, x, QSPI_TX_FIFO);
348 tqspi->cur_tx_pos += write_bytes;
351 return written_words;
/*
 * PIO path: drain the RX FIFO into t->rx_buf (starting at tqspi->cur_rx_pos)
 * and advance tqspi->cur_rx_pos.
 *
 * The number of FIFO words read is the full count reported by
 * QSPI_FIFO_STATUS. Each 32-bit FIFO word is split into bytes lowest byte
 * first.
 *
 * NOTE(review): in the packed branch cur_rx_pos and read_words advance by
 * curr_dma_words regardless of rx_full_count - confirm that is intended.
 * The declarations of fifo_status and x, the assignment of read_bytes and
 * the return statement are not visible in this listing.
 */
355 tegra_qspi_read_rx_fifo_to_client_rxbuf(struct tegra_qspi *tqspi, struct spi_transfer *t)
357 u8 *rx_buf = (u8 *)t->rx_buf + tqspi->cur_rx_pos;
358 unsigned int len, rx_full_count, count, i;
359 unsigned int read_words = 0;
362 fifo_status = tegra_qspi_readl(tqspi, QSPI_FIFO_STATUS);
363 rx_full_count = QSPI_RX_FIFO_FULL_COUNT(fifo_status);
364 if (tqspi->is_packed) {
365 len = tqspi->curr_dma_words * tqspi->bytes_per_word;
366 for (count = 0; count < rx_full_count; count++) {
367 x = tegra_qspi_readl(tqspi, QSPI_RX_FIFO);
369 for (i = 0; len && (i < 4); i++, len--)
370 *rx_buf++ = (x >> i * 8) & 0xff;
373 read_words += tqspi->curr_dma_words;
374 tqspi->cur_rx_pos += tqspi->curr_dma_words * tqspi->bytes_per_word;
/* unpacked: keep only the low bits_per_word bits of each FIFO word */
376 u32 rx_mask = ((u32)1 << t->bits_per_word) - 1;
377 u8 bytes_per_word = tqspi->bytes_per_word;
378 unsigned int read_bytes;
380 len = rx_full_count * bytes_per_word;
/* never write past the end of the client buffer */
381 if (len > t->len - tqspi->cur_pos)
382 len = t->len - tqspi->cur_pos;
384 for (count = 0; count < rx_full_count; count++) {
385 x = tegra_qspi_readl(tqspi, QSPI_RX_FIFO) & rx_mask;
387 for (i = 0; len && (i < bytes_per_word); i++, len--)
388 *rx_buf++ = (x >> (i * 8)) & 0xff;
391 read_words += rx_full_count;
392 tqspi->cur_rx_pos += read_bytes;
/*
 * DMA path: prepare TX data for the current chunk and advance
 * tqspi->cur_tx_pos.
 *
 * In packed mode only the position is advanced here; no bytes are copied.
 * In unpacked mode each data word from t->tx_buf is expanded into one 32-bit
 * entry of tqspi->tx_dma_buf, lowest byte first. The TX DMA buffer is synced
 * for the CPU before and for the device after the copy.
 */
399 tegra_qspi_copy_client_txbuf_to_qspi_txbuf(struct tegra_qspi *tqspi, struct spi_transfer *t)
401 dma_sync_single_for_cpu(tqspi->dev, tqspi->tx_dma_phys,
402 tqspi->dma_buf_size, DMA_TO_DEVICE);
405 * In packed mode, each word in FIFO may contain multiple packets
406 * based on bits per word. So all bytes in each FIFO word are valid.
408 * In unpacked mode, each word in FIFO contains single packet and
409 * based on bits per word any remaining bits in FIFO word will be
410 * ignored by the hardware and are invalid bits.
412 if (tqspi->is_packed) {
413 tqspi->cur_tx_pos += tqspi->curr_dma_words * tqspi->bytes_per_word;
415 u8 *tx_buf = (u8 *)t->tx_buf + tqspi->cur_tx_pos;
416 unsigned int i, count, consume, write_bytes;
419 * Fill tx_dma_buf to contain single packet in each word based
420 * on bits per word from SPI core tx_buf.
422 consume = tqspi->curr_dma_words * tqspi->bytes_per_word;
/* clamp to the bytes remaining in the client buffer */
423 if (consume > t->len - tqspi->cur_pos)
424 consume = t->len - tqspi->cur_pos;
425 write_bytes = consume;
426 for (count = 0; count < tqspi->curr_dma_words; count++) {
429 for (i = 0; consume && (i < tqspi->bytes_per_word); i++, consume--)
430 x |= (u32)(*tx_buf++) << (i * 8);
431 tqspi->tx_dma_buf[count] = x;
434 tqspi->cur_tx_pos += write_bytes;
437 dma_sync_single_for_device(tqspi->dev, tqspi->tx_dma_phys,
438 tqspi->dma_buf_size, DMA_TO_DEVICE);
/*
 * DMA path: hand received data for the current chunk to the client and
 * advance tqspi->cur_rx_pos.
 *
 * In packed mode only the position is advanced here; no bytes are copied.
 * In unpacked mode each 32-bit entry of tqspi->rx_dma_buf is masked to
 * bits_per_word bits and unpacked into t->rx_buf, lowest byte first. The RX
 * DMA buffer is synced for the CPU before and for the device after the copy.
 */
442 tegra_qspi_copy_qspi_rxbuf_to_client_rxbuf(struct tegra_qspi *tqspi, struct spi_transfer *t)
444 dma_sync_single_for_cpu(tqspi->dev, tqspi->rx_dma_phys,
445 tqspi->dma_buf_size, DMA_FROM_DEVICE);
447 if (tqspi->is_packed) {
448 tqspi->cur_rx_pos += tqspi->curr_dma_words * tqspi->bytes_per_word;
450 unsigned char *rx_buf = t->rx_buf + tqspi->cur_rx_pos;
451 u32 rx_mask = ((u32)1 << t->bits_per_word) - 1;
452 unsigned int i, count, consume, read_bytes;
455 * Each FIFO word contains single data packet.
456 * Skip invalid bits in each FIFO word based on bits per word
457 * and align bytes while filling in SPI core rx_buf.
459 consume = tqspi->curr_dma_words * tqspi->bytes_per_word;
/* clamp to the bytes remaining in the client buffer */
460 if (consume > t->len - tqspi->cur_pos)
461 consume = t->len - tqspi->cur_pos;
462 read_bytes = consume;
463 for (count = 0; count < tqspi->curr_dma_words; count++) {
464 u32 x = tqspi->rx_dma_buf[count] & rx_mask;
466 for (i = 0; consume && (i < tqspi->bytes_per_word); i++, consume--)
467 *rx_buf++ = (x >> (i * 8)) & 0xff;
470 tqspi->cur_rx_pos += read_bytes;
473 dma_sync_single_for_device(tqspi->dev, tqspi->rx_dma_phys,
474 tqspi->dma_buf_size, DMA_FROM_DEVICE);
/*
 * DMA descriptor callback: @args is the struct completion installed as
 * callback_param by the start_tx/rx_dma helpers; signal it.
 */
477 static void tegra_qspi_dma_complete(void *args)
479 struct completion *dma_complete = args;
481 complete(dma_complete);
/*
 * Prepare and submit a TX slave-DMA descriptor for the current chunk.
 *
 * The source address is t->tx_dma in packed mode and the driver's own TX
 * buffer (tqspi->tx_dma_phys) otherwise. Completion is reported through
 * tqspi->tx_dma_complete.
 *
 * NOTE(review): some arguments of dmaengine_prep_slave_single() and the
 * return statements are not visible in this listing; @len is presumably the
 * transfer length passed to it.
 */
484 static int tegra_qspi_start_tx_dma(struct tegra_qspi *tqspi, struct spi_transfer *t, int len)
486 dma_addr_t tx_dma_phys;
488 reinit_completion(&tqspi->tx_dma_complete);
490 if (tqspi->is_packed)
491 tx_dma_phys = t->tx_dma;
493 tx_dma_phys = tqspi->tx_dma_phys;
495 tqspi->tx_dma_desc = dmaengine_prep_slave_single(tqspi->tx_dma_chan, tx_dma_phys,
497 DMA_PREP_INTERRUPT | DMA_CTRL_ACK);
499 if (!tqspi->tx_dma_desc) {
500 dev_err(tqspi->dev, "Unable to get TX descriptor\n");
504 tqspi->tx_dma_desc->callback = tegra_qspi_dma_complete;
505 tqspi->tx_dma_desc->callback_param = &tqspi->tx_dma_complete;
506 dmaengine_submit(tqspi->tx_dma_desc);
507 dma_async_issue_pending(tqspi->tx_dma_chan);
/*
 * Prepare and submit an RX slave-DMA descriptor for the current chunk.
 *
 * The destination address is t->rx_dma in packed mode and the driver's own
 * RX buffer (tqspi->rx_dma_phys) otherwise. Completion is reported through
 * tqspi->rx_dma_complete.
 *
 * NOTE(review): some arguments of dmaengine_prep_slave_single() and the
 * return statements are not visible in this listing; @len is presumably the
 * transfer length passed to it.
 */
512 static int tegra_qspi_start_rx_dma(struct tegra_qspi *tqspi, struct spi_transfer *t, int len)
514 dma_addr_t rx_dma_phys;
516 reinit_completion(&tqspi->rx_dma_complete);
518 if (tqspi->is_packed)
519 rx_dma_phys = t->rx_dma;
521 rx_dma_phys = tqspi->rx_dma_phys;
523 tqspi->rx_dma_desc = dmaengine_prep_slave_single(tqspi->rx_dma_chan, rx_dma_phys,
525 DMA_PREP_INTERRUPT | DMA_CTRL_ACK);
527 if (!tqspi->rx_dma_desc) {
528 dev_err(tqspi->dev, "Unable to get RX descriptor\n");
532 tqspi->rx_dma_desc->callback = tegra_qspi_dma_complete;
533 tqspi->rx_dma_desc->callback_param = &tqspi->rx_dma_complete;
534 dmaengine_submit(tqspi->rx_dma_desc);
535 dma_async_issue_pending(tqspi->rx_dma_chan);
/*
 * Flush the RX and TX FIFOs.
 *
 * If QSPI_FIFO_STATUS does not already report both FIFOs empty, set both
 * flush bits and poll the register until it does. The return value is that
 * of the polling helper.
 *
 * NOTE(review): the statement that picks between the sleeping and the
 * _atomic poll variant is not visible; presumably it tests @atomic. The
 * early-exit return value and the poll delay/timeout arguments are not
 * visible either.
 */
540 static int tegra_qspi_flush_fifos(struct tegra_qspi *tqspi, bool atomic)
542 void __iomem *addr = tqspi->base + QSPI_FIFO_STATUS;
545 val = tegra_qspi_readl(tqspi, QSPI_FIFO_STATUS);
546 if ((val & QSPI_FIFO_EMPTY) == QSPI_FIFO_EMPTY)
549 val |= QSPI_RX_FIFO_FLUSH | QSPI_TX_FIFO_FLUSH;
550 tegra_qspi_writel(tqspi, val, QSPI_FIFO_STATUS);
553 return readl_relaxed_poll_timeout(addr, val,
554 (val & QSPI_FIFO_EMPTY) == QSPI_FIFO_EMPTY,
557 return readl_relaxed_poll_timeout_atomic(addr, val,
558 (val & QSPI_FIFO_EMPTY) == QSPI_FIFO_EMPTY,
/*
 * Clear the RDY and FIFO-error bits in QSPI_INTR_MASK (the inverse of what
 * tegra_qspi_mask_clear_irq() sets), leaving all other bits unchanged.
 */
562 static void tegra_qspi_unmask_irq(struct tegra_qspi *tqspi)
566 intr_mask = tegra_qspi_readl(tqspi, QSPI_INTR_MASK);
567 intr_mask &= ~(QSPI_INTR_RDY_MASK | QSPI_INTR_RX_TX_FIFO_ERR);
568 tegra_qspi_writel(tqspi, intr_mask, QSPI_INTR_MASK);
/*
 * Map the client's buffers for streaming DMA, storing the bus addresses in
 * t->tx_dma and t->rx_dma. The mapped length is the current chunk size in
 * bytes rounded up to a multiple of 4. A failed RX mapping unmaps the TX
 * mapping again.
 *
 * NOTE(review): the conditions guarding each mapping (presumably whether
 * t->tx_buf / t->rx_buf is set) and the return values are not visible in
 * this listing.
 */
571 static int tegra_qspi_dma_map_xfer(struct tegra_qspi *tqspi, struct spi_transfer *t)
573 u8 *tx_buf = (u8 *)t->tx_buf + tqspi->cur_tx_pos;
574 u8 *rx_buf = (u8 *)t->rx_buf + tqspi->cur_rx_pos;
577 len = DIV_ROUND_UP(tqspi->curr_dma_words * tqspi->bytes_per_word, 4) * 4;
580 t->tx_dma = dma_map_single(tqspi->dev, (void *)tx_buf, len, DMA_TO_DEVICE);
581 if (dma_mapping_error(tqspi->dev, t->tx_dma))
586 t->rx_dma = dma_map_single(tqspi->dev, (void *)rx_buf, len, DMA_FROM_DEVICE);
587 if (dma_mapping_error(tqspi->dev, t->rx_dma)) {
588 dma_unmap_single(tqspi->dev, t->tx_dma, len, DMA_TO_DEVICE);
/*
 * Undo tegra_qspi_dma_map_xfer(): unmap t->tx_dma and t->rx_dma using the
 * same rounded-up length computation.
 * NOTE(review): any guards around the two unmap calls are not visible here.
 */
596 static void tegra_qspi_dma_unmap_xfer(struct tegra_qspi *tqspi, struct spi_transfer *t)
600 len = DIV_ROUND_UP(tqspi->curr_dma_words * tqspi->bytes_per_word, 4) * 4;
602 dma_unmap_single(tqspi->dev, t->tx_dma, len, DMA_TO_DEVICE);
603 dma_unmap_single(tqspi->dev, t->rx_dma, len, DMA_FROM_DEVICE);
/*
 * Start the current chunk of @t using slave DMA.
 *
 * Visible sequence: map the client buffers (packed mode only), program the
 * block count into QSPI_DMA_BLK, unmask interrupts, choose FIFO trigger
 * levels from the byte length, write QSPI_DMA_CTL, configure and start the
 * TX and/or RX DMA channel according to tqspi->cur_direction, write
 * command1_reg to QSPI_COMMAND1, then write QSPI_DMA_CTL again.
 *
 * NOTE(review): many lines are missing from this listing - the
 * declarations of val, len, ret and dma_burst, the conditions of the
 * trigger-level chain, all error returns, and presumably the step that sets
 * QSPI_DMA_EN before the final write.
 */
606 static int tegra_qspi_start_dma_based_transfer(struct tegra_qspi *tqspi, struct spi_transfer *t)
608 struct dma_slave_config dma_sconfig = { 0 };
614 if (tqspi->is_packed) {
615 ret = tegra_qspi_dma_map_xfer(tqspi, t);
/* the block-count field is programmed with (number of words - 1) */
620 val = QSPI_DMA_BLK_SET(tqspi->curr_dma_words - 1);
621 tegra_qspi_writel(tqspi, val, QSPI_DMA_BLK);
623 tegra_qspi_unmask_irq(tqspi);
/* len: bytes moved through the FIFO (unpacked mode uses 4 bytes per word) */
625 if (tqspi->is_packed)
626 len = DIV_ROUND_UP(tqspi->curr_dma_words * tqspi->bytes_per_word, 4) * 4;
628 len = tqspi->curr_dma_words * 4;
630 /* set attention level based on length of transfer */
633 val |= QSPI_TX_TRIG_1 | QSPI_RX_TRIG_1;
635 } else if (((len) >> 4) & 0x1) {
636 val |= QSPI_TX_TRIG_4 | QSPI_RX_TRIG_4;
639 val |= QSPI_TX_TRIG_8 | QSPI_RX_TRIG_8;
643 tegra_qspi_writel(tqspi, val, QSPI_DMA_CTL);
644 tqspi->dma_control_reg = val;
646 dma_sconfig.device_fc = true;
/* TX: the DMA destination is the controller's TX FIFO register */
647 if (tqspi->cur_direction & DATA_DIR_TX) {
648 dma_sconfig.dst_addr = tqspi->phys + QSPI_TX_FIFO;
649 dma_sconfig.dst_addr_width = DMA_SLAVE_BUSWIDTH_4_BYTES;
650 dma_sconfig.dst_maxburst = dma_burst;
651 ret = dmaengine_slave_config(tqspi->tx_dma_chan, &dma_sconfig);
653 dev_err(tqspi->dev, "failed DMA slave config: %d\n", ret);
657 tegra_qspi_copy_client_txbuf_to_qspi_txbuf(tqspi, t);
658 ret = tegra_qspi_start_tx_dma(tqspi, t, len);
660 dev_err(tqspi->dev, "failed to starting TX DMA: %d\n", ret);
/* RX: the DMA source is the controller's RX FIFO register */
665 if (tqspi->cur_direction & DATA_DIR_RX) {
666 dma_sconfig.src_addr = tqspi->phys + QSPI_RX_FIFO;
667 dma_sconfig.src_addr_width = DMA_SLAVE_BUSWIDTH_4_BYTES;
668 dma_sconfig.src_maxburst = dma_burst;
669 ret = dmaengine_slave_config(tqspi->rx_dma_chan, &dma_sconfig);
671 dev_err(tqspi->dev, "failed DMA slave config: %d\n", ret);
675 dma_sync_single_for_device(tqspi->dev, tqspi->rx_dma_phys,
679 ret = tegra_qspi_start_rx_dma(tqspi, t, len);
681 dev_err(tqspi->dev, "failed to start RX DMA: %d\n", ret);
682 if (tqspi->cur_direction & DATA_DIR_TX)
683 dmaengine_terminate_all(tqspi->tx_dma_chan);
688 tegra_qspi_writel(tqspi, tqspi->command1_reg, QSPI_COMMAND1);
690 tqspi->is_curr_dma_xfer = true;
691 tqspi->dma_control_reg = val;
693 tegra_qspi_writel(tqspi, val, QSPI_DMA_CTL);
/*
 * Start the current chunk of @t in PIO mode.
 *
 * For TX the FIFO is pre-filled and the number of words actually written
 * becomes the block count; otherwise curr_dma_words is used. The count is
 * programmed into QSPI_DMA_BLK as (words - 1), interrupts are unmasked and
 * QSPI_COMMAND1 is written.
 *
 * NOTE(review): the declaration of val, any modification of val before the
 * final write (presumably setting QSPI_PIO) and the return statement are
 * not visible in this listing.
 */
698 static int tegra_qspi_start_cpu_based_transfer(struct tegra_qspi *qspi, struct spi_transfer *t)
701 unsigned int cur_words;
703 if (qspi->cur_direction & DATA_DIR_TX)
704 cur_words = tegra_qspi_fill_tx_fifo_from_client_txbuf(qspi, t);
706 cur_words = qspi->curr_dma_words;
708 val = QSPI_DMA_BLK_SET(cur_words - 1);
709 tegra_qspi_writel(qspi, val, QSPI_DMA_BLK);
711 tegra_qspi_unmask_irq(qspi);
713 qspi->is_curr_dma_xfer = false;
714 val = qspi->command1_reg;
716 tegra_qspi_writel(qspi, val, QSPI_COMMAND1);
/*
 * Release the DMA resources acquired by tegra_qspi_init_dma().
 *
 * Each coherent buffer and each channel is released only if its pointer is
 * non-NULL, and the pointer is then cleared, so the function can run on a
 * partially initialised state.
 * NOTE(review): the statement under the has_dma check is not visible;
 * presumably an early return.
 */
721 static void tegra_qspi_deinit_dma(struct tegra_qspi *tqspi)
723 if (!tqspi->soc_data->has_dma)
726 if (tqspi->tx_dma_buf) {
727 dma_free_coherent(tqspi->dev, tqspi->dma_buf_size,
728 tqspi->tx_dma_buf, tqspi->tx_dma_phys);
729 tqspi->tx_dma_buf = NULL;
732 if (tqspi->tx_dma_chan) {
733 dma_release_channel(tqspi->tx_dma_chan);
734 tqspi->tx_dma_chan = NULL;
737 if (tqspi->rx_dma_buf) {
738 dma_free_coherent(tqspi->dev, tqspi->dma_buf_size,
739 tqspi->rx_dma_buf, tqspi->rx_dma_phys);
740 tqspi->rx_dma_buf = NULL;
743 if (tqspi->rx_dma_chan) {
744 dma_release_channel(tqspi->rx_dma_chan);
745 tqspi->rx_dma_chan = NULL;
/*
 * Acquire the "rx" and "tx" DMA channels and one coherent buffer of
 * tqspi->dma_buf_size bytes for each direction, then set tqspi->use_dma.
 *
 * On the error path everything is released through tegra_qspi_deinit_dma();
 * unless the error is -EPROBE_DEFER, messages announce the fall-back to PIO.
 *
 * NOTE(review): the declarations of dma_buf, dma_phys and err, the
 * allocation-failure checks, the error labels and all return statements are
 * not visible in this listing.
 */
749 static int tegra_qspi_init_dma(struct tegra_qspi *tqspi)
751 struct dma_chan *dma_chan;
756 if (!tqspi->soc_data->has_dma)
759 dma_chan = dma_request_chan(tqspi->dev, "rx");
760 if (IS_ERR(dma_chan)) {
761 err = PTR_ERR(dma_chan);
765 tqspi->rx_dma_chan = dma_chan;
767 dma_buf = dma_alloc_coherent(tqspi->dev, tqspi->dma_buf_size, &dma_phys, GFP_KERNEL);
773 tqspi->rx_dma_buf = dma_buf;
774 tqspi->rx_dma_phys = dma_phys;
776 dma_chan = dma_request_chan(tqspi->dev, "tx");
777 if (IS_ERR(dma_chan)) {
778 err = PTR_ERR(dma_chan);
782 tqspi->tx_dma_chan = dma_chan;
784 dma_buf = dma_alloc_coherent(tqspi->dev, tqspi->dma_buf_size, &dma_phys, GFP_KERNEL);
790 tqspi->tx_dma_buf = dma_buf;
791 tqspi->tx_dma_phys = dma_phys;
792 tqspi->use_dma = true;
797 tegra_qspi_deinit_dma(tqspi);
799 if (err != -EPROBE_DEFER) {
800 dev_err(tqspi->dev, "cannot use DMA: %d\n", err);
801 dev_err(tqspi->dev, "falling back to PIO\n");
/*
 * Prepare controller state for transfer @t and build its QSPI_COMMAND1 value.
 *
 * Updates the clock rate when the requested speed changed (non-ACPI systems
 * only), resets the per-transfer positions and records @t as curr_xfer.
 *
 * For the first transfer of a message (@is_first_of_msg) interrupts are
 * masked and cleared, command1 is derived from def_command1_reg with chip
 * select, word length, SPI mode (mode 3 or mode 0) and CS level applied and
 * written to QSPI_COMMAND1, and the client's tap delays are written to
 * QSPI_COMMAND2 if they differ from the default. For later transfers only
 * the word length in tqspi->command1_reg is updated.
 *
 * NOTE(review): the declaration of req_mode, the else keywords and the
 * return statement are not visible in this listing; callers use the return
 * value as the command1 value, so it presumably returns command1.
 */
808 static u32 tegra_qspi_setup_transfer_one(struct spi_device *spi, struct spi_transfer *t,
809 bool is_first_of_msg)
811 struct tegra_qspi *tqspi = spi_master_get_devdata(spi->master);
812 struct tegra_qspi_client_data *cdata = spi->controller_data;
813 u32 command1, command2, speed = t->speed_hz;
814 u8 bits_per_word = t->bits_per_word;
815 u32 tx_tap = 0, rx_tap = 0;
818 if (!has_acpi_companion(tqspi->dev) && speed != tqspi->cur_speed) {
819 clk_set_rate(tqspi->clk, speed);
820 tqspi->cur_speed = speed;
824 tqspi->cur_rx_pos = 0;
825 tqspi->cur_tx_pos = 0;
826 tqspi->curr_xfer = t;
828 if (is_first_of_msg) {
829 tegra_qspi_mask_clear_irq(tqspi);
831 command1 = tqspi->def_command1_reg;
832 command1 |= QSPI_CS_SEL(spi->chip_select);
833 command1 |= QSPI_BIT_LENGTH(bits_per_word - 1);
835 command1 &= ~QSPI_CONTROL_MODE_MASK;
836 req_mode = spi->mode & 0x3;
837 if (req_mode == SPI_MODE_3)
838 command1 |= QSPI_CONTROL_MODE_3;
840 command1 |= QSPI_CONTROL_MODE_0;
842 if (spi->mode & SPI_CS_HIGH)
843 command1 |= QSPI_CS_SW_VAL;
845 command1 &= ~QSPI_CS_SW_VAL;
846 tegra_qspi_writel(tqspi, command1, QSPI_COMMAND1);
/* a tap delay of 0 and a missing cdata both leave the tap at 0 */
848 if (cdata && cdata->tx_clk_tap_delay)
849 tx_tap = cdata->tx_clk_tap_delay;
851 if (cdata && cdata->rx_clk_tap_delay)
852 rx_tap = cdata->rx_clk_tap_delay;
854 command2 = QSPI_TX_TAP_DELAY(tx_tap) | QSPI_RX_TAP_DELAY(rx_tap);
855 if (command2 != tqspi->def_command2_reg)
856 tegra_qspi_writel(tqspi, command2, QSPI_COMMAND2);
859 command1 = tqspi->command1_reg;
860 command1 &= ~QSPI_BIT_LENGTH(~0);
861 command1 |= QSPI_BIT_LENGTH(bits_per_word - 1);
864 command1 &= ~QSPI_SDR_DDR_SEL;
/*
 * Program direction, packing and bus width for transfer @t and start it.
 *
 * @command1 is the value produced by tegra_qspi_setup_transfer_one(). The
 * packed bit, RX/TX enables and interface width (quad, dual, otherwise
 * single) are applied and the result is cached in tqspi->command1_reg.
 * Dummy cycles are written to QSPI_MISC_REG, the FIFOs are flushed, and the
 * chunk is started by DMA when use_dma is set and it needs more than
 * QSPI_FIFO_DEPTH FIFO words, otherwise by PIO.
 *
 * NOTE(review): the declarations of bus_width and ret, the conditions that
 * select RX and TX (presumably t->rx_buf / t->tx_buf), the flush error check
 * and the return statement are not visible in this listing.
 */
869 static int tegra_qspi_start_transfer_one(struct spi_device *spi,
870 struct spi_transfer *t, u32 command1)
872 struct tegra_qspi *tqspi = spi_master_get_devdata(spi->master);
873 unsigned int total_fifo_words;
877 total_fifo_words = tegra_qspi_calculate_curr_xfer_param(tqspi, t);
879 command1 &= ~QSPI_PACKED;
880 if (tqspi->is_packed)
881 command1 |= QSPI_PACKED;
882 tegra_qspi_writel(tqspi, command1, QSPI_COMMAND1);
884 tqspi->cur_direction = 0;
886 command1 &= ~(QSPI_TX_EN | QSPI_RX_EN);
888 command1 |= QSPI_RX_EN;
889 tqspi->cur_direction |= DATA_DIR_RX;
890 bus_width = t->rx_nbits;
894 command1 |= QSPI_TX_EN;
895 tqspi->cur_direction |= DATA_DIR_TX;
896 bus_width = t->tx_nbits;
899 command1 &= ~QSPI_INTERFACE_WIDTH_MASK;
901 if (bus_width == SPI_NBITS_QUAD)
902 command1 |= QSPI_INTERFACE_WIDTH_QUAD;
903 else if (bus_width == SPI_NBITS_DUAL)
904 command1 |= QSPI_INTERFACE_WIDTH_DUAL;
906 command1 |= QSPI_INTERFACE_WIDTH_SINGLE;
908 tqspi->command1_reg = command1;
910 tegra_qspi_writel(tqspi, QSPI_NUM_DUMMY_CYCLE(tqspi->dummy_cycles), QSPI_MISC_REG);
912 ret = tegra_qspi_flush_fifos(tqspi, false);
916 if (tqspi->use_dma && total_fifo_words > QSPI_FIFO_DEPTH)
917 ret = tegra_qspi_start_dma_based_transfer(tqspi, t);
919 ret = tegra_qspi_start_cpu_based_transfer(tqspi, t);
/*
 * Allocate (device-managed, zeroed) client data for @spi and fill the tap
 * delays from the "nvidia,tx-clk-tap-delay" and "nvidia,rx-clk-tap-delay"
 * properties. The return values of the property reads are ignored, so a
 * missing property leaves the zero-initialised field untouched.
 *
 * NOTE(review): the two fields are declared `int` in
 * struct tegra_qspi_client_data while a _u32 reader is given their
 * addresses - confirm the pointer types match. The allocation-failure check
 * and the return statement are not visible in this listing.
 */
924 static struct tegra_qspi_client_data *tegra_qspi_parse_cdata_dt(struct spi_device *spi)
926 struct tegra_qspi_client_data *cdata;
928 cdata = devm_kzalloc(&spi->dev, sizeof(*cdata), GFP_KERNEL);
932 device_property_read_u32(&spi->dev, "nvidia,tx-clk-tap-delay",
933 &cdata->tx_clk_tap_delay);
934 device_property_read_u32(&spi->dev, "nvidia,rx-clk-tap-delay",
935 &cdata->rx_clk_tap_delay);
/*
 * Per-device setup: resume the controller, parse client data, and program
 * the inactive chip-select polarity for spi->chip_select into
 * def_command1_reg and QSPI_COMMAND1 (under tqspi->lock), then drop the
 * runtime-PM reference.
 *
 * NOTE(review): the declarations of val, flags and ret, the condition
 * guarding the cdata parse (presumably !cdata) and the return statements
 * are not visible in this listing.
 */
940 static int tegra_qspi_setup(struct spi_device *spi)
942 struct tegra_qspi *tqspi = spi_master_get_devdata(spi->master);
943 struct tegra_qspi_client_data *cdata = spi->controller_data;
948 ret = pm_runtime_resume_and_get(tqspi->dev);
950 dev_err(tqspi->dev, "failed to get runtime PM: %d\n", ret);
955 cdata = tegra_qspi_parse_cdata_dt(spi);
956 spi->controller_data = cdata;
958 spin_lock_irqsave(&tqspi->lock, flags);
960 /* keep default cs state to inactive */
961 val = tqspi->def_command1_reg;
962 val |= QSPI_CS_SEL(spi->chip_select);
/* active-high CS: clear the inactive-polarity bit; otherwise set it */
963 if (spi->mode & SPI_CS_HIGH)
964 val &= ~QSPI_CS_POL_INACTIVE(spi->chip_select);
966 val |= QSPI_CS_POL_INACTIVE(spi->chip_select);
968 tqspi->def_command1_reg = val;
969 tegra_qspi_writel(tqspi, tqspi->def_command1_reg, QSPI_COMMAND1);
971 spin_unlock_irqrestore(&tqspi->lock, flags);
973 pm_runtime_put(tqspi->dev);
/*
 * Debug aid: read and print eight controller registers at dev_dbg level
 * (COMMAND1/2, DMA_CTL, DMA_BLK, INTR_MASK, MISC, TRANS_STATUS, FIFO_STATUS).
 */
978 static void tegra_qspi_dump_regs(struct tegra_qspi *tqspi)
980 dev_dbg(tqspi->dev, "============ QSPI REGISTER DUMP ============\n");
981 dev_dbg(tqspi->dev, "Command1: 0x%08x | Command2: 0x%08x\n",
982 tegra_qspi_readl(tqspi, QSPI_COMMAND1),
983 tegra_qspi_readl(tqspi, QSPI_COMMAND2));
984 dev_dbg(tqspi->dev, "DMA_CTL: 0x%08x | DMA_BLK: 0x%08x\n",
985 tegra_qspi_readl(tqspi, QSPI_DMA_CTL),
986 tegra_qspi_readl(tqspi, QSPI_DMA_BLK));
987 dev_dbg(tqspi->dev, "INTR_MASK: 0x%08x | MISC: 0x%08x\n",
988 tegra_qspi_readl(tqspi, QSPI_INTR_MASK),
989 tegra_qspi_readl(tqspi, QSPI_MISC_REG));
990 dev_dbg(tqspi->dev, "TRANS_STAT: 0x%08x | FIFO_STATUS: 0x%08x\n",
991 tegra_qspi_readl(tqspi, QSPI_TRANS_STATUS),
992 tegra_qspi_readl(tqspi, QSPI_FIFO_STATUS));
/*
 * Common error recovery: log tqspi->status_reg, dump the registers, flush
 * the FIFOs using the atomic poll variant and reset the device. A failed
 * reset is only warned about, once.
 *
 * NOTE(review): handle_cpu_based_xfer() calls this with tqspi->lock held
 * (spin_lock_irqsave) - confirm device_reset() is safe in that context.
 */
995 static void tegra_qspi_handle_error(struct tegra_qspi *tqspi)
997 dev_err(tqspi->dev, "error in transfer, fifo status 0x%08x\n", tqspi->status_reg);
998 tegra_qspi_dump_regs(tqspi);
999 tegra_qspi_flush_fifos(tqspi, true);
1000 if (device_reset(tqspi->dev) < 0)
1001 dev_warn_once(tqspi->dev, "device reset failed\n");
/*
 * Finish a transfer on @spi: update QSPI_CS_SW_VAL in tqspi->command1_reg,
 * write it to QSPI_COMMAND1, then restore def_command1_reg.
 *
 * cs_val is 0 for SPI_CS_HIGH devices and 1 otherwise.
 * NOTE(review): the condition choosing between setting and clearing
 * QSPI_CS_SW_VAL is not visible in this listing; presumably it tests cs_val.
 */
1004 static void tegra_qspi_transfer_end(struct spi_device *spi)
1006 struct tegra_qspi *tqspi = spi_master_get_devdata(spi->master);
1007 int cs_val = (spi->mode & SPI_CS_HIGH) ? 0 : 1;
1010 tqspi->command1_reg |= QSPI_CS_SW_VAL;
1012 tqspi->command1_reg &= ~QSPI_CS_SW_VAL;
1013 tegra_qspi_writel(tqspi, tqspi->command1_reg, QSPI_COMMAND1);
1014 tegra_qspi_writel(tqspi, tqspi->def_command1_reg, QSPI_COMMAND1);
/*
 * Build the QSPI_CMB_SEQ_CMD_CFG value for a command phase of @len bytes:
 * SDR/DDR select, bus-width field from @bus_width, and size field set to
 * (@len * 8) - 1, i.e. the length in bits minus one.
 *
 * NOTE(review): the declaration of cmd_config, the condition choosing
 * between setting and clearing QSPI_COMMAND_SDR_DDR (presumably @is_ddr) and
 * the return statement are not visible in this listing.
 */
1017 static u32 tegra_qspi_cmd_config(bool is_ddr, u8 bus_width, u8 len)
1021 /* Extract Command configuration and value */
1023 cmd_config |= QSPI_COMMAND_SDR_DDR;
1025 cmd_config &= ~QSPI_COMMAND_SDR_DDR;
1027 cmd_config |= QSPI_COMMAND_X1_X2_X4(bus_width);
1028 cmd_config |= QSPI_COMMAND_SIZE_SET((len * 8) - 1);
/*
 * Build the QSPI_CMB_SEQ_ADDR_CFG value for an address phase of @len bytes:
 * SDR/DDR select, bus-width field, and size field set to (@len * 8) - 1.
 *
 * NOTE(review): @is_ddr and @bus_width are overwritten with 0 before use,
 * so the caller's values for those two parameters have no effect.
 * The condition around the SDR/DDR lines and the return statement are not
 * visible in this listing.
 */
1033 static u32 tegra_qspi_addr_config(bool is_ddr, u8 bus_width, u8 len)
1035 u32 addr_config = 0;
1037 /* Extract Address configuration and value */
1038 is_ddr = 0; //Only SDR mode supported
1039 bus_width = 0; //X1 mode
1042 addr_config |= QSPI_ADDRESS_SDR_DDR;
1044 addr_config &= ~QSPI_ADDRESS_SDR_DDR;
1046 addr_config |= QSPI_ADDRESS_X1_X2_X4(bus_width);
1047 addr_config |= QSPI_ADDRESS_SIZE_SET((len * 8) - 1);
/*
 * Execute @msg using the controller's combined-sequence mode.
 *
 * Combined mode is enabled in QSPI_GLOBAL_CONFIG and the message's transfers
 * are walked in order. Command and address values and their configuration
 * words are captured from the transfers' tx_buf and written to the
 * QSPI_CMB_SEQ_* registers; the data transfer is then started through
 * tegra_qspi_setup_transfer_one() / tegra_qspi_start_transfer_one() and
 * waited for on tqspi->xfer_completion. On timeout any DMA in flight is
 * terminated, the transfer is aborted and the device is reset.
 *
 * NOTE(review): many lines are missing from this listing (the case labels
 * of the phase switch, several call arguments, the declaration of ret, the
 * error exits and the return statement), so the exact per-phase control flow
 * cannot be confirmed from here.
 *
 * NOTE(review): `val` is declared u8 but receives the 32-bit value read
 * from QSPI_GLOBAL_CONFIG and is written back, so bits 8-31 of that register
 * are written as zero - confirm this is intended.
 *
 * NOTE(review): the address is loaded through a `const u32 *` cast of
 * xfer->tx_buf, while tegra_qspi_validate_cmb_seq() accepts address
 * transfers of 3 bytes - confirm the buffer is always at least 4 bytes and
 * suitably aligned.
 */
1052 static int tegra_qspi_combined_seq_xfer(struct tegra_qspi *tqspi,
1053 struct spi_message *msg)
1055 bool is_first_msg = true;
1056 struct spi_transfer *xfer;
1057 struct spi_device *spi = msg->spi;
1058 u8 transfer_phase = 0;
1059 u32 cmd1 = 0, dma_ctl = 0;
1061 u32 address_value = 0;
1062 u32 cmd_config = 0, addr_config = 0;
1063 u8 cmd_value = 0, val = 0;
1065 /* Enable Combined sequence mode */
1066 val = tegra_qspi_readl(tqspi, QSPI_GLOBAL_CONFIG);
1067 val |= QSPI_CMB_SEQ_EN;
1068 tegra_qspi_writel(tqspi, val, QSPI_GLOBAL_CONFIG);
1069 /* Process individual transfer list */
1070 list_for_each_entry(xfer, &msg->transfers, transfer_list) {
1071 switch (transfer_phase) {
1074 cmd_config = tegra_qspi_cmd_config(false, 0,
1076 cmd_value = *((const u8 *)(xfer->tx_buf));
1080 addr_config = tegra_qspi_addr_config(false, 0,
1082 address_value = *((const u32 *)(xfer->tx_buf));
1085 /* Program Command, Address value in register */
1086 tegra_qspi_writel(tqspi, cmd_value, QSPI_CMB_SEQ_CMD);
1087 tegra_qspi_writel(tqspi, address_value,
1089 /* Program Command and Address config in register */
1090 tegra_qspi_writel(tqspi, cmd_config,
1091 QSPI_CMB_SEQ_CMD_CFG);
1092 tegra_qspi_writel(tqspi, addr_config,
1093 QSPI_CMB_SEQ_ADDR_CFG);
1095 reinit_completion(&tqspi->xfer_completion);
1096 cmd1 = tegra_qspi_setup_transfer_one(spi, xfer,
1098 ret = tegra_qspi_start_transfer_one(spi, xfer,
1102 dev_err(tqspi->dev, "Failed to start transfer-one: %d\n",
1107 is_first_msg = false;
1108 ret = wait_for_completion_timeout
1109 (&tqspi->xfer_completion,
1112 if (WARN_ON(ret == 0)) {
1113 dev_err(tqspi->dev, "QSPI Transfer failed with timeout: %d\n",
1115 if (tqspi->is_curr_dma_xfer &&
1116 (tqspi->cur_direction & DATA_DIR_TX))
1117 dmaengine_terminate_all
1118 (tqspi->tx_dma_chan);
1120 if (tqspi->is_curr_dma_xfer &&
1121 (tqspi->cur_direction & DATA_DIR_RX))
1122 dmaengine_terminate_all
1123 (tqspi->rx_dma_chan);
1125 /* Abort transfer by resetting pio/dma bit */
1126 if (!tqspi->is_curr_dma_xfer) {
1127 cmd1 = tegra_qspi_readl
1135 dma_ctl = tegra_qspi_readl
1138 dma_ctl &= ~QSPI_DMA_EN;
1139 tegra_qspi_writel(tqspi, dma_ctl,
1143 /* Reset controller if timeout happens */
1144 if (device_reset(tqspi->dev) < 0)
1145 dev_warn_once(tqspi->dev,
1146 "device reset failed\n");
1151 if (tqspi->tx_status || tqspi->rx_status) {
1152 dev_err(tqspi->dev, "QSPI Transfer failed\n");
1153 tqspi->tx_status = 0;
1154 tqspi->rx_status = 0;
1163 msg->actual_length += xfer->len;
1166 if (!xfer->cs_change) {
1167 tegra_qspi_transfer_end(spi);
1168 spi_transfer_delay_exec(xfer);
/*
 * Execute @msg one transfer at a time with combined-sequence mode disabled.
 *
 * For each transfer: if the following transfer is flagged dummy_data and its
 * length converts to at most QSPI_DUMMY_CYCLES_MAX clock cycles, the dummy
 * cycles are programmed with the current transfer and the dummy transfer is
 * skipped by advancing the list cursor. The transfer is then set up,
 * started and waited for on tqspi->xfer_completion. A timeout terminates any
 * DMA in flight and runs tegra_qspi_handle_error(); a non-zero tx_status or
 * rx_status also runs tegra_qspi_handle_error(). msg->actual_length
 * accumulates transfer and dummy bytes.
 *
 * NOTE(review): the declarations of cmd1 and dummy_bytes, the timeout
 * argument, the error exits, the guard around the first
 * tegra_qspi_transfer_end() call below and the return statement are not
 * visible in this listing.
 */
1178 static int tegra_qspi_non_combined_seq_xfer(struct tegra_qspi *tqspi,
1179 struct spi_message *msg)
1181 struct spi_device *spi = msg->spi;
1182 struct spi_transfer *transfer;
1183 bool is_first_msg = true;
1184 int ret = 0, val = 0;
1187 msg->actual_length = 0;
1188 tqspi->tx_status = 0;
1189 tqspi->rx_status = 0;
1191 /* Disable Combined sequence mode */
1192 val = tegra_qspi_readl(tqspi, QSPI_GLOBAL_CONFIG);
1193 val &= ~QSPI_CMB_SEQ_EN;
1194 tegra_qspi_writel(tqspi, val, QSPI_GLOBAL_CONFIG);
1195 list_for_each_entry(transfer, &msg->transfers, transfer_list) {
1196 struct spi_transfer *xfer = transfer;
1200 tqspi->dummy_cycles = 0;
1202 * Tegra QSPI hardware supports dummy bytes transfer after actual transfer
1203 * bytes based on programmed dummy clock cycles in the QSPI_MISC register.
1204 * So, check if the next transfer is dummy data transfer and program dummy
1205 * clock cycles along with the current transfer and skip next transfer.
1207 if (!list_is_last(&xfer->transfer_list, &msg->transfers)) {
1208 struct spi_transfer *next_xfer;
1210 next_xfer = list_next_entry(xfer, transfer_list);
1211 if (next_xfer->dummy_data) {
/* bytes -> clock cycles: 8 bits per byte divided by the lines used */
1212 u32 dummy_cycles = next_xfer->len * 8 / next_xfer->tx_nbits;
1214 if (dummy_cycles <= QSPI_DUMMY_CYCLES_MAX) {
1215 tqspi->dummy_cycles = dummy_cycles;
1216 dummy_bytes = next_xfer->len;
1217 transfer = next_xfer;
1222 reinit_completion(&tqspi->xfer_completion);
1224 cmd1 = tegra_qspi_setup_transfer_one(spi, xfer, is_first_msg);
1226 ret = tegra_qspi_start_transfer_one(spi, xfer, cmd1);
1228 dev_err(tqspi->dev, "failed to start transfer: %d\n", ret);
1232 ret = wait_for_completion_timeout(&tqspi->xfer_completion,
1234 if (WARN_ON(ret == 0)) {
1235 dev_err(tqspi->dev, "transfer timeout\n");
1236 if (tqspi->is_curr_dma_xfer && (tqspi->cur_direction & DATA_DIR_TX))
1237 dmaengine_terminate_all(tqspi->tx_dma_chan);
1238 if (tqspi->is_curr_dma_xfer && (tqspi->cur_direction & DATA_DIR_RX))
1239 dmaengine_terminate_all(tqspi->rx_dma_chan);
1240 tegra_qspi_handle_error(tqspi);
1245 if (tqspi->tx_status || tqspi->rx_status) {
1246 tegra_qspi_handle_error(tqspi);
1251 msg->actual_length += xfer->len + dummy_bytes;
1255 tegra_qspi_transfer_end(spi);
1256 spi_transfer_delay_exec(xfer);
1260 if (list_is_last(&xfer->transfer_list, &msg->transfers)) {
1261 /* de-activate CS after last transfer only when cs_change is not set */
1262 if (!xfer->cs_change) {
1263 tegra_qspi_transfer_end(spi);
1264 spi_transfer_delay_exec(xfer);
1266 } else if (xfer->cs_change) {
1267 /* de-activated CS between the transfers only when cs_change is set */
1268 tegra_qspi_transfer_end(spi);
1269 spi_transfer_delay_exec(xfer);
/*
 * tegra_qspi_validate_cmb_seq() - decide whether @msg may be sent using the
 * controller's combined sequence mode.
 * @tqspi: controller state; soc_data supplies cmb_xfer_capable and has_dma
 * @msg: message whose transfer list is inspected (not modified)
 *
 * The message qualifies only on a combined-sequence capable SoC, with exactly
 * three transfers, the second being 3 or 4 bytes long. The third (data)
 * transfer is rejected only when the SoC has no DMA and the data does not fit
 * in the FIFO (QSPI_FIFO_DEPTH << 2 bytes). The previous '||' form refused
 * combined mode on every non-DMA SoC regardless of length, and on DMA SoCs
 * whenever the data exceeded the FIFO.
 *
 * NOTE(review): the counter increment, the length check on the first transfer
 * and the return statements are not visible in this excerpt; each failed
 * check presumably returns false - confirm against the full file.
 */
1280 static bool tegra_qspi_validate_cmb_seq(struct tegra_qspi *tqspi,
1281 struct spi_message *msg)
1283 int transfer_count = 0;
1284 struct spi_transfer *xfer;
/* Walk the list once; transfer_count is compared against 3 afterwards. */
1286 list_for_each_entry(xfer, &msg->transfers, transfer_list) {
/* Needs a combined-sequence capable SoC and exactly three transfers. */
1289 if (!tqspi->soc_data->cmb_xfer_capable || transfer_count != 3)
/* First transfer of the message. */
1291 xfer = list_first_entry(&msg->transfers, typeof(*xfer),
/* Second transfer: must be 3 or 4 bytes long. */
1295 xfer = list_next_entry(xfer, transfer_list);
1296 if (xfer->len > 4 || xfer->len < 3)
/* Third transfer: without DMA the data has to fit in the FIFO. */
1298 xfer = list_next_entry(xfer, transfer_list);
1299 if (!tqspi->soc_data->has_dma && xfer->len > (QSPI_FIFO_DEPTH << 2))
/*
 * tegra_qspi_transfer_one_message() - transfer_one_message hook installed by
 * tegra_qspi_probe().
 * @master: SPI master whose devdata is the struct tegra_qspi
 * @msg: message to execute
 *
 * Picks the combined-sequence path when tegra_qspi_validate_cmb_seq() accepts
 * the message and the per-transfer path otherwise, then reports the message
 * as finished to the SPI core.
 * NOTE(review): the declaration of ret and the return statement are not
 * visible in this excerpt.
 */
1305 static int tegra_qspi_transfer_one_message(struct spi_master *master,
1306 struct spi_message *msg)
1308 struct tegra_qspi *tqspi = spi_master_get_devdata(master);
1311 if (tegra_qspi_validate_cmb_seq(tqspi, msg))
1312 ret = tegra_qspi_combined_seq_xfer(tqspi, msg);
1314 ret = tegra_qspi_non_combined_seq_xfer(tqspi, msg);
/* Hand the message back to the SPI core. */
1316 spi_finalize_current_message(master);
/*
 * handle_cpu_based_xfer() - interrupt-thread handling for a transfer that is
 * not using DMA (called from tegra_qspi_isr_thread()).
 * @tqspi: controller state; curr_xfer is the transfer in flight
 *
 * Runs under tqspi->lock. On a recorded FIFO error it performs error handling
 * and signals xfer_completion. Otherwise it drains received data, updates
 * cur_pos, and either signals completion (whole transfer done) or programs
 * the next chunk of the same transfer.
 * NOTE(review): the exit label and return statement are not visible in this
 * excerpt.
 */
1321 static irqreturn_t handle_cpu_based_xfer(struct tegra_qspi *tqspi)
1323 struct spi_transfer *t = tqspi->curr_xfer;
1324 unsigned long flags;
1326 spin_lock_irqsave(&tqspi->lock, flags);
/* Error flags were captured by the interrupt thread before calling in here. */
1328 if (tqspi->tx_status || tqspi->rx_status) {
1329 tegra_qspi_handle_error(tqspi);
1330 complete(&tqspi->xfer_completion);
/* Copy whatever arrived in the RX FIFO into the client's receive buffer. */
1334 if (tqspi->cur_direction & DATA_DIR_RX)
1335 tegra_qspi_read_rx_fifo_to_client_rxbuf(tqspi, t);
/* Progress is tracked by the TX position when transmitting, else by the RX position. */
1337 if (tqspi->cur_direction & DATA_DIR_TX)
1338 tqspi->cur_pos = tqspi->cur_tx_pos;
1340 tqspi->cur_pos = tqspi->cur_rx_pos;
/* All bytes of the transfer handled: wake the waiter. */
1342 if (tqspi->cur_pos == t->len) {
1343 complete(&tqspi->xfer_completion);
/* More data left in this transfer: set up and start the next chunk. */
1347 tegra_qspi_calculate_curr_xfer_param(tqspi, t);
1348 tegra_qspi_start_cpu_based_transfer(tqspi, t);
1350 spin_unlock_irqrestore(&tqspi->lock, flags);
/*
 * handle_dma_based_xfer() - interrupt-thread handling for a transfer that is
 * using DMA (called from tegra_qspi_isr_thread()).
 * @tqspi: controller state; curr_xfer is the transfer in flight
 *
 * For each active direction the DMA channel is terminated if a FIFO error was
 * recorded or if waiting for the DMA completion fails or times out. The
 * spinlock is taken only after those waits. The remainder mirrors the CPU
 * path: copy RX data, update cur_pos, then either signal xfer_completion or
 * start the next chunk, by DMA when it needs more than QSPI_FIFO_DEPTH words
 * and by CPU otherwise.
 * NOTE(review): the declarations of err and wait_status, the else branches
 * and the error bookkeeping are not visible in this excerpt.
 */
1354 static irqreturn_t handle_dma_based_xfer(struct tegra_qspi *tqspi)
1356 struct spi_transfer *t = tqspi->curr_xfer;
1357 unsigned int total_fifo_words;
1358 unsigned long flags;
/* TX direction: abort the TX DMA on a FIFO error, or on a failed/timed-out wait. */
1362 if (tqspi->cur_direction & DATA_DIR_TX) {
1363 if (tqspi->tx_status) {
1364 dmaengine_terminate_all(tqspi->tx_dma_chan);
1367 wait_status = wait_for_completion_interruptible_timeout(
1368 &tqspi->tx_dma_complete, QSPI_DMA_TIMEOUT);
1369 if (wait_status <= 0) {
1370 dmaengine_terminate_all(tqspi->tx_dma_chan);
1371 dev_err(tqspi->dev, "failed TX DMA transfer\n");
/* RX direction: same handling on the RX DMA channel. */
1377 if (tqspi->cur_direction & DATA_DIR_RX) {
1378 if (tqspi->rx_status) {
1379 dmaengine_terminate_all(tqspi->rx_dma_chan);
1382 wait_status = wait_for_completion_interruptible_timeout(
1383 &tqspi->rx_dma_complete, QSPI_DMA_TIMEOUT);
1384 if (wait_status <= 0) {
1385 dmaengine_terminate_all(tqspi->rx_dma_chan);
1386 dev_err(tqspi->dev, "failed RX DMA transfer\n");
/* Shared state is touched under the lock from here on. */
1392 spin_lock_irqsave(&tqspi->lock, flags);
/* NOTE(review): presumably the error path; its guarding condition is not visible here. */
1395 tegra_qspi_dma_unmap_xfer(tqspi, t);
1396 tegra_qspi_handle_error(tqspi);
1397 complete(&tqspi->xfer_completion);
/* Copy received data from the driver's RX buffer to the client's buffer. */
1401 if (tqspi->cur_direction & DATA_DIR_RX)
1402 tegra_qspi_copy_qspi_rxbuf_to_client_rxbuf(tqspi, t);
/* Progress is tracked by the TX position when transmitting, else by the RX position. */
1404 if (tqspi->cur_direction & DATA_DIR_TX)
1405 tqspi->cur_pos = tqspi->cur_tx_pos;
1407 tqspi->cur_pos = tqspi->cur_rx_pos;
/* Whole transfer done: release the DMA mapping and wake the waiter. */
1409 if (tqspi->cur_pos == t->len) {
1410 tegra_qspi_dma_unmap_xfer(tqspi, t);
1411 complete(&tqspi->xfer_completion);
/* More data pending: the mapping is released before the next chunk is started. */
1415 tegra_qspi_dma_unmap_xfer(tqspi, t);
1417 /* continue transfer in current message */
1418 total_fifo_words = tegra_qspi_calculate_curr_xfer_param(tqspi, t);
/* Chunks larger than the FIFO go through DMA; smaller ones are driven by the CPU. */
1419 if (total_fifo_words > QSPI_FIFO_DEPTH)
1420 err = tegra_qspi_start_dma_based_transfer(tqspi, t);
1422 err = tegra_qspi_start_cpu_based_transfer(tqspi, t);
1425 spin_unlock_irqrestore(&tqspi->lock, flags);
/*
 * tegra_qspi_isr_thread() - threaded interrupt handler registered in
 * tegra_qspi_probe().
 * @irq: interrupt number (not used in the visible code)
 * @context_data: the struct tegra_qspi passed at IRQ registration
 *
 * Snapshots QSPI_FIFO_STATUS, records overflow/underflow bits for the
 * directions of the current transfer, masks and clears the interrupt, and
 * dispatches to the CPU-based or DMA-based completion handler.
 */
1429 static irqreturn_t tegra_qspi_isr_thread(int irq, void *context_data)
1431 struct tegra_qspi *tqspi = context_data;
1433 tqspi->status_reg = tegra_qspi_readl(tqspi, QSPI_FIFO_STATUS);
/* Keep only the error bits that belong to an active direction. */
1435 if (tqspi->cur_direction & DATA_DIR_TX)
1436 tqspi->tx_status = tqspi->status_reg & (QSPI_TX_FIFO_UNF | QSPI_TX_FIFO_OVF);
1438 if (tqspi->cur_direction & DATA_DIR_RX)
1439 tqspi->rx_status = tqspi->status_reg & (QSPI_RX_FIFO_OVF | QSPI_RX_FIFO_UNF);
1441 tegra_qspi_mask_clear_irq(tqspi);
/* The handler's return value is passed straight back to the IRQ core. */
1443 if (!tqspi->is_curr_dma_xfer)
1444 return handle_cpu_based_xfer(tqspi);
1446 return handle_dma_based_xfer(tqspi);
/*
 * Per-SoC capability tables referenced from the OF and ACPI match tables.
 * Only the cmb_xfer_capable member is visible in this excerpt: combined
 * sequence mode is disabled for Tegra210 and enabled for the others.
 * NOTE(review): the remaining members of each initializer are not shown here.
 */
1449 static struct tegra_qspi_soc_data tegra210_qspi_soc_data = {
1451 .cmb_xfer_capable = false,
1455 static struct tegra_qspi_soc_data tegra186_qspi_soc_data = {
1457 .cmb_xfer_capable = true,
1461 static struct tegra_qspi_soc_data tegra234_qspi_soc_data = {
1463 .cmb_xfer_capable = true,
1467 static struct tegra_qspi_soc_data tegra241_qspi_soc_data = {
1469 .cmb_xfer_capable = true,
/*
 * Device-tree match table: maps each compatible string to its SoC data.
 * Tegra194 reuses the Tegra186 data.
 */
1473 static const struct of_device_id tegra_qspi_of_match[] = {
1475 .compatible = "nvidia,tegra210-qspi",
1476 .data = &tegra210_qspi_soc_data,
1478 .compatible = "nvidia,tegra186-qspi",
1479 .data = &tegra186_qspi_soc_data,
1481 .compatible = "nvidia,tegra194-qspi",
1482 .data = &tegra186_qspi_soc_data,
1484 .compatible = "nvidia,tegra234-qspi",
1485 .data = &tegra234_qspi_soc_data,
1487 .compatible = "nvidia,tegra241-qspi",
1488 .data = &tegra241_qspi_soc_data,
1493 MODULE_DEVICE_TABLE(of, tegra_qspi_of_match);
/*
 * ACPI match table: driver_data carries a pointer to the same SoC data
 * structures used by the device-tree table.
 * NOTE(review): the ACPI ID strings of the entries are not visible in this excerpt.
 */
1496 static const struct acpi_device_id tegra_qspi_acpi_match[] = {
1499 .driver_data = (kernel_ulong_t)&tegra210_qspi_soc_data,
1502 .driver_data = (kernel_ulong_t)&tegra186_qspi_soc_data,
1505 .driver_data = (kernel_ulong_t)&tegra234_qspi_soc_data,
1508 .driver_data = (kernel_ulong_t)&tegra241_qspi_soc_data,
1513 MODULE_DEVICE_TABLE(acpi, tegra_qspi_acpi_match);
/*
 * tegra_qspi_probe() - bind the driver to a QSPI platform device.
 * @pdev: platform device being probed
 *
 * Allocates the SPI master, fills in its capabilities and callbacks, maps the
 * register window, looks up the IRQ and (without an ACPI companion) the
 * "qspi" clock, initialises DMA and the completions, programs the default
 * COMMAND1 value while the device is runtime-resumed, requests the threaded
 * IRQ and registers the master.
 * NOTE(review): the declarations of r, ret, bus_num and qspi_irq, most error
 * checks, the cleanup labels and the return statements are not visible in
 * this excerpt.
 */
1516 static int tegra_qspi_probe(struct platform_device *pdev)
1518 struct spi_master *master;
1519 struct tegra_qspi *tqspi;
/* Device-managed allocation; the driver state lives in the master's devdata. */
1524 master = devm_spi_alloc_master(&pdev->dev, sizeof(*tqspi));
1528 platform_set_drvdata(pdev, master);
1529 tqspi = spi_master_get_devdata(master);
/* Advertise supported modes, bus widths and word sizes to the SPI core. */
1531 master->mode_bits = SPI_MODE_0 | SPI_MODE_3 | SPI_CS_HIGH |
1532 SPI_TX_DUAL | SPI_RX_DUAL | SPI_TX_QUAD | SPI_RX_QUAD;
1533 master->bits_per_word_mask = SPI_BPW_MASK(32) | SPI_BPW_MASK(16) | SPI_BPW_MASK(8);
1534 master->setup = tegra_qspi_setup;
1535 master->transfer_one_message = tegra_qspi_transfer_one_message;
/* This value is overwritten further down with soc_data->cs_count. */
1536 master->num_chipselect = 1;
1537 master->auto_runtime_pm = true;
/* Bus number comes from the "spi" alias of the device-tree node. */
1539 bus_num = of_alias_get_id(pdev->dev.of_node, "spi");
1541 master->bus_num = bus_num;
1543 tqspi->master = master;
1544 tqspi->dev = &pdev->dev;
1545 spin_lock_init(&tqspi->lock);
/*
 * NOTE(review): the match data is dereferenced on the next line with no NULL
 * check visible in this excerpt - confirm it cannot be NULL for any bind path.
 */
1547 tqspi->soc_data = device_get_match_data(&pdev->dev);
1548 master->num_chipselect = tqspi->soc_data->cs_count;
/* Map the first MEM resource; its start address is kept in tqspi->phys. */
1549 r = platform_get_resource(pdev, IORESOURCE_MEM, 0);
1550 tqspi->base = devm_ioremap_resource(&pdev->dev, r);
1551 if (IS_ERR(tqspi->base))
1552 return PTR_ERR(tqspi->base);
1554 tqspi->phys = r->start;
1555 qspi_irq = platform_get_irq(pdev, 0);
1558 tqspi->irq = qspi_irq;
/* The clock is looked up only when there is no ACPI companion. */
1560 if (!has_acpi_companion(tqspi->dev)) {
1561 tqspi->clk = devm_clk_get(&pdev->dev, "qspi");
1562 if (IS_ERR(tqspi->clk)) {
1563 ret = PTR_ERR(tqspi->clk);
1564 dev_err(&pdev->dev, "failed to get clock: %d\n", ret);
/* Start with a FIFO-sized buffer limit (QSPI_FIFO_DEPTH words of 4 bytes). */
1570 tqspi->max_buf_size = QSPI_FIFO_DEPTH << 2;
1571 tqspi->dma_buf_size = DEFAULT_QSPI_DMA_BUF_LEN;
1573 ret = tegra_qspi_init_dma(tqspi);
/* NOTE(review): the condition under which the limit is raised is not visible here. */
1578 tqspi->max_buf_size = tqspi->dma_buf_size;
1580 init_completion(&tqspi->tx_dma_complete);
1581 init_completion(&tqspi->rx_dma_complete);
1582 init_completion(&tqspi->xfer_completion);
/* Runtime-resume the device for the register accesses below. */
1584 pm_runtime_enable(&pdev->dev);
1585 ret = pm_runtime_resume_and_get(&pdev->dev);
1587 dev_err(&pdev->dev, "failed to get runtime PM: %d\n", ret);
1588 goto exit_pm_disable;
/* A failed reset is only warned about; probing continues. */
1591 if (device_reset(tqspi->dev) < 0)
1592 dev_warn_once(tqspi->dev, "device reset failed\n");
/* Program the default COMMAND1 value and cache the timing/COMMAND2 registers. */
1594 tqspi->def_command1_reg = QSPI_M_S | QSPI_CS_SW_HW | QSPI_CS_SW_VAL;
1595 tegra_qspi_writel(tqspi, tqspi->def_command1_reg, QSPI_COMMAND1);
1596 tqspi->spi_cs_timing1 = tegra_qspi_readl(tqspi, QSPI_CS_TIMING1);
1597 tqspi->spi_cs_timing2 = tegra_qspi_readl(tqspi, QSPI_CS_TIMING2);
1598 tqspi->def_command2_reg = tegra_qspi_readl(tqspi, QSPI_COMMAND2);
1600 pm_runtime_put(&pdev->dev);
/* Threaded-only handler (no primary handler), hence IRQF_ONESHOT. */
1602 ret = request_threaded_irq(tqspi->irq, NULL,
1603 tegra_qspi_isr_thread, IRQF_ONESHOT,
1604 dev_name(&pdev->dev), tqspi);
1606 dev_err(&pdev->dev, "failed to request IRQ#%u: %d\n", tqspi->irq, ret);
1607 goto exit_pm_disable;
1610 master->dev.of_node = pdev->dev.of_node;
1611 ret = spi_register_master(master);
1613 dev_err(&pdev->dev, "failed to register master: %d\n", ret);
/* Error unwinding: release the IRQ, force runtime suspend, tear down DMA. */
1620 free_irq(qspi_irq, tqspi);
1622 pm_runtime_force_suspend(&pdev->dev);
1623 tegra_qspi_deinit_dma(tqspi);
/*
 * tegra_qspi_remove() - unbind the driver from the platform device.
 * @pdev: platform device being removed
 *
 * Unregisters the SPI master first, then frees the IRQ, forces the device
 * into runtime suspend and releases the DMA resources.
 * NOTE(review): the return statement is not visible in this excerpt.
 */
1627 static int tegra_qspi_remove(struct platform_device *pdev)
1629 struct spi_master *master = platform_get_drvdata(pdev);
1630 struct tegra_qspi *tqspi = spi_master_get_devdata(master);
1632 spi_unregister_master(master);
1633 free_irq(tqspi->irq, tqspi);
1634 pm_runtime_force_suspend(&pdev->dev);
1635 tegra_qspi_deinit_dma(tqspi);
/*
 * tegra_qspi_suspend() - system-sleep suspend callback.
 * @dev: device whose drvdata is the SPI master
 *
 * Delegates to spi_master_suspend() and returns its result.
 */
1640 static int __maybe_unused tegra_qspi_suspend(struct device *dev)
1642 struct spi_master *master = dev_get_drvdata(dev);
1644 return spi_master_suspend(master);
/*
 * tegra_qspi_resume() - system-sleep resume callback.
 * @dev: device whose drvdata is the SPI master
 *
 * Runtime-resumes the device, rewrites COMMAND1 and COMMAND2 from the values
 * cached in the driver state, drops the runtime PM reference and resumes the
 * SPI master, returning the result of spi_master_resume().
 * NOTE(review): the declaration of ret and the failure return are not visible
 * in this excerpt.
 */
1647 static int __maybe_unused tegra_qspi_resume(struct device *dev)
1649 struct spi_master *master = dev_get_drvdata(dev);
1650 struct tegra_qspi *tqspi = spi_master_get_devdata(master);
1653 ret = pm_runtime_resume_and_get(dev);
1655 dev_err(dev, "failed to get runtime PM: %d\n", ret);
/* COMMAND1 is restored from command1_reg, COMMAND2 from the probe-time default. */
1659 tegra_qspi_writel(tqspi, tqspi->command1_reg, QSPI_COMMAND1);
1660 tegra_qspi_writel(tqspi, tqspi->def_command2_reg, QSPI_COMMAND2);
1661 pm_runtime_put(dev);
1663 return spi_master_resume(master);
/*
 * tegra_qspi_runtime_suspend() - runtime PM suspend callback.
 * @dev: device whose drvdata is the SPI master
 *
 * With an ACPI companion the clock handling is skipped; otherwise pending
 * register writes are flushed with a read-back and the clock is disabled.
 * NOTE(review): the return statements are not visible in this excerpt.
 */
1666 static int __maybe_unused tegra_qspi_runtime_suspend(struct device *dev)
1668 struct spi_master *master = dev_get_drvdata(dev);
1669 struct tegra_qspi *tqspi = spi_master_get_devdata(master);
1671 /* Runtime pm disabled with ACPI */
1672 if (has_acpi_companion(tqspi->dev))
1674 /* flush all write which are in PPSB queue by reading back */
1675 tegra_qspi_readl(tqspi, QSPI_COMMAND1);
1677 clk_disable_unprepare(tqspi->clk);
/*
 * tegra_qspi_runtime_resume() - runtime PM resume callback.
 * @dev: device whose drvdata is the SPI master
 *
 * With an ACPI companion the clock handling is skipped; otherwise the clock
 * is prepared and enabled, and a failure is logged.
 * NOTE(review): the declaration of ret and the return statements are not
 * visible in this excerpt.
 */
1682 static int __maybe_unused tegra_qspi_runtime_resume(struct device *dev)
1684 struct spi_master *master = dev_get_drvdata(dev);
1685 struct tegra_qspi *tqspi = spi_master_get_devdata(master);
1688 /* Runtime pm disabled with ACPI */
1689 if (has_acpi_companion(tqspi->dev))
1691 ret = clk_prepare_enable(tqspi->clk);
1693 dev_err(tqspi->dev, "failed to enable clock: %d\n", ret);
/*
 * Power-management operations: runtime suspend/resume (no idle callback) plus
 * the system-sleep suspend/resume pair.
 */
1698 static const struct dev_pm_ops tegra_qspi_pm_ops = {
1699 SET_RUNTIME_PM_OPS(tegra_qspi_runtime_suspend, tegra_qspi_runtime_resume, NULL)
1700 SET_SYSTEM_SLEEP_PM_OPS(tegra_qspi_suspend, tegra_qspi_resume)
/*
 * Platform driver definition: ties the name, PM operations, OF/ACPI match
 * tables and the probe/remove callbacks together.
 */
1703 static struct platform_driver tegra_qspi_driver = {
1705 .name = "tegra-qspi",
1706 .pm = &tegra_qspi_pm_ops,
1707 .of_match_table = tegra_qspi_of_match,
/* ACPI_PTR() wraps the table pointer for the ACPI match field. */
1708 .acpi_match_table = ACPI_PTR(tegra_qspi_acpi_match),
1710 .probe = tegra_qspi_probe,
1711 .remove = tegra_qspi_remove,
/* Register tegra_qspi_driver as the module's platform driver. */
1713 module_platform_driver(tegra_qspi_driver);
/* Module metadata: alias, description, author and license. */
1715 MODULE_ALIAS("platform:qspi-tegra");
1716 MODULE_DESCRIPTION("NVIDIA Tegra QSPI Controller Driver");
1717 MODULE_AUTHOR("Sowjanya Komatineni <skomatineni@nvidia.com>");
1718 MODULE_LICENSE("GPL v2");