Merge tag 'i2c-for-6.6-rc8' of git://git.kernel.org/pub/scm/linux/kernel/git/wsa...
[platform/kernel/linux-starfive.git] / drivers / spi / spi-qcom-qspi.c
1 // SPDX-License-Identifier: GPL-2.0
2 // Copyright (c) 2017-2018, The Linux foundation. All rights reserved.
3
4 #include <linux/clk.h>
5 #include <linux/dmapool.h>
6 #include <linux/dma-mapping.h>
7 #include <linux/interconnect.h>
8 #include <linux/interrupt.h>
9 #include <linux/io.h>
10 #include <linux/module.h>
11 #include <linux/of.h>
12 #include <linux/platform_device.h>
13 #include <linux/pinctrl/consumer.h>
14 #include <linux/pm_runtime.h>
15 #include <linux/pm_opp.h>
16 #include <linux/spi/spi.h>
17 #include <linux/spi/spi-mem.h>
18
19
20 #define QSPI_NUM_CS             2
21 #define QSPI_BYTES_PER_WORD     4
22
23 #define MSTR_CONFIG             0x0000
24 #define FULL_CYCLE_MODE         BIT(3)
25 #define FB_CLK_EN               BIT(4)
26 #define PIN_HOLDN               BIT(6)
27 #define PIN_WPN                 BIT(7)
28 #define DMA_ENABLE              BIT(8)
29 #define BIG_ENDIAN_MODE         BIT(9)
30 #define SPI_MODE_MSK            0xc00
31 #define SPI_MODE_SHFT           10
32 #define CHIP_SELECT_NUM         BIT(12)
33 #define SBL_EN                  BIT(13)
34 #define LPA_BASE_MSK            0x3c000
35 #define LPA_BASE_SHFT           14
36 #define TX_DATA_DELAY_MSK       0xc0000
37 #define TX_DATA_DELAY_SHFT      18
38 #define TX_CLK_DELAY_MSK        0x300000
39 #define TX_CLK_DELAY_SHFT       20
40 #define TX_CS_N_DELAY_MSK       0xc00000
41 #define TX_CS_N_DELAY_SHFT      22
42 #define TX_DATA_OE_DELAY_MSK    0x3000000
43 #define TX_DATA_OE_DELAY_SHFT   24
44
45 #define AHB_MASTER_CFG                          0x0004
46 #define HMEM_TYPE_START_MID_TRANS_MSK           0x7
47 #define HMEM_TYPE_START_MID_TRANS_SHFT          0
48 #define HMEM_TYPE_LAST_TRANS_MSK                0x38
49 #define HMEM_TYPE_LAST_TRANS_SHFT               3
50 #define USE_HMEMTYPE_LAST_ON_DESC_OR_CHAIN_MSK  0xc0
51 #define USE_HMEMTYPE_LAST_ON_DESC_OR_CHAIN_SHFT 6
52 #define HMEMTYPE_READ_TRANS_MSK                 0x700
53 #define HMEMTYPE_READ_TRANS_SHFT                8
54 #define HSHARED                                 BIT(11)
55 #define HINNERSHARED                            BIT(12)
56
57 #define MSTR_INT_EN             0x000C
58 #define MSTR_INT_STATUS         0x0010
59 #define RESP_FIFO_UNDERRUN      BIT(0)
60 #define RESP_FIFO_NOT_EMPTY     BIT(1)
61 #define RESP_FIFO_RDY           BIT(2)
62 #define HRESP_FROM_NOC_ERR      BIT(3)
63 #define WR_FIFO_EMPTY           BIT(9)
64 #define WR_FIFO_FULL            BIT(10)
65 #define WR_FIFO_OVERRUN         BIT(11)
66 #define TRANSACTION_DONE        BIT(16)
67 #define DMA_CHAIN_DONE          BIT(31)
68 #define QSPI_ERR_IRQS           (RESP_FIFO_UNDERRUN | HRESP_FROM_NOC_ERR | \
69                                  WR_FIFO_OVERRUN)
70 #define QSPI_ALL_IRQS           (QSPI_ERR_IRQS | RESP_FIFO_RDY | \
71                                  WR_FIFO_EMPTY | WR_FIFO_FULL | \
72                                  TRANSACTION_DONE | DMA_CHAIN_DONE)
73
74 #define PIO_XFER_CTRL           0x0014
75 #define REQUEST_COUNT_MSK       0xffff
76
77 #define PIO_XFER_CFG            0x0018
78 #define TRANSFER_DIRECTION      BIT(0)
79 #define MULTI_IO_MODE_MSK       0xe
80 #define MULTI_IO_MODE_SHFT      1
81 #define TRANSFER_FRAGMENT       BIT(8)
82 #define SDR_1BIT                1
83 #define SDR_2BIT                2
84 #define SDR_4BIT                3
85 #define DDR_1BIT                5
86 #define DDR_2BIT                6
87 #define DDR_4BIT                7
88 #define DMA_DESC_SINGLE_SPI     1
89 #define DMA_DESC_DUAL_SPI       2
90 #define DMA_DESC_QUAD_SPI       3
91
92 #define PIO_XFER_STATUS         0x001c
93 #define WR_FIFO_BYTES_MSK       0xffff0000
94 #define WR_FIFO_BYTES_SHFT      16
95
96 #define PIO_DATAOUT_1B          0x0020
97 #define PIO_DATAOUT_4B          0x0024
98
99 #define RD_FIFO_CFG             0x0028
100 #define CONTINUOUS_MODE         BIT(0)
101
102 #define RD_FIFO_STATUS  0x002c
103 #define FIFO_EMPTY      BIT(11)
104 #define WR_CNTS_MSK     0x7f0
105 #define WR_CNTS_SHFT    4
106 #define RDY_64BYTE      BIT(3)
107 #define RDY_32BYTE      BIT(2)
108 #define RDY_16BYTE      BIT(1)
109 #define FIFO_RDY        BIT(0)
110
111 #define RD_FIFO_RESET           0x0030
112 #define RESET_FIFO              BIT(0)
113
114 #define NEXT_DMA_DESC_ADDR      0x0040
115 #define CURRENT_DMA_DESC_ADDR   0x0044
116 #define CURRENT_MEM_ADDR        0x0048
117
118 #define CUR_MEM_ADDR            0x0048
119 #define HW_VERSION              0x004c
120 #define RD_FIFO                 0x0050
121 #define SAMPLING_CLK_CFG        0x0090
122 #define SAMPLING_CLK_STATUS     0x0094
123
124 #define QSPI_ALIGN_REQ  32
125
126 enum qspi_dir {
127         QSPI_READ,
128         QSPI_WRITE,
129 };
130
131 struct qspi_cmd_desc {
132         u32 data_address;
133         u32 next_descriptor;
134         u32 direction:1;
135         u32 multi_io_mode:3;
136         u32 reserved1:4;
137         u32 fragment:1;
138         u32 reserved2:7;
139         u32 length:16;
140 };
141
142 struct qspi_xfer {
143         union {
144                 const void *tx_buf;
145                 void *rx_buf;
146         };
147         unsigned int rem_bytes;
148         unsigned int buswidth;
149         enum qspi_dir dir;
150         bool is_last;
151 };
152
153 enum qspi_clocks {
154         QSPI_CLK_CORE,
155         QSPI_CLK_IFACE,
156         QSPI_NUM_CLKS
157 };
158
159 /*
160  * Number of entries in sgt returned from spi framework that-
161  * will be supported. Can be modified as required.
162  * In practice, given max_dma_len is 64KB, the number of
163  * entries is not expected to exceed 1.
164  */
165 #define QSPI_MAX_SG 5
166
167 struct qcom_qspi {
168         void __iomem *base;
169         struct device *dev;
170         struct clk_bulk_data *clks;
171         struct qspi_xfer xfer;
172         struct dma_pool *dma_cmd_pool;
173         dma_addr_t dma_cmd_desc[QSPI_MAX_SG];
174         void *virt_cmd_desc[QSPI_MAX_SG];
175         unsigned int n_cmd_desc;
176         struct icc_path *icc_path_cpu_to_qspi;
177         unsigned long last_speed;
178         /* Lock to protect data accessed by IRQs */
179         spinlock_t lock;
180 };
181
182 static u32 qspi_buswidth_to_iomode(struct qcom_qspi *ctrl,
183                                    unsigned int buswidth)
184 {
185         switch (buswidth) {
186         case 1:
187                 return SDR_1BIT;
188         case 2:
189                 return SDR_2BIT;
190         case 4:
191                 return SDR_4BIT;
192         default:
193                 dev_warn_once(ctrl->dev,
194                                 "Unexpected bus width: %u\n", buswidth);
195                 return SDR_1BIT;
196         }
197 }
198
199 static void qcom_qspi_pio_xfer_cfg(struct qcom_qspi *ctrl)
200 {
201         u32 pio_xfer_cfg;
202         u32 iomode;
203         const struct qspi_xfer *xfer;
204
205         xfer = &ctrl->xfer;
206         pio_xfer_cfg = readl(ctrl->base + PIO_XFER_CFG);
207         pio_xfer_cfg &= ~TRANSFER_DIRECTION;
208         pio_xfer_cfg |= xfer->dir;
209         if (xfer->is_last)
210                 pio_xfer_cfg &= ~TRANSFER_FRAGMENT;
211         else
212                 pio_xfer_cfg |= TRANSFER_FRAGMENT;
213         pio_xfer_cfg &= ~MULTI_IO_MODE_MSK;
214         iomode = qspi_buswidth_to_iomode(ctrl, xfer->buswidth);
215         pio_xfer_cfg |= iomode << MULTI_IO_MODE_SHFT;
216
217         writel(pio_xfer_cfg, ctrl->base + PIO_XFER_CFG);
218 }
219
220 static void qcom_qspi_pio_xfer_ctrl(struct qcom_qspi *ctrl)
221 {
222         u32 pio_xfer_ctrl;
223
224         pio_xfer_ctrl = readl(ctrl->base + PIO_XFER_CTRL);
225         pio_xfer_ctrl &= ~REQUEST_COUNT_MSK;
226         pio_xfer_ctrl |= ctrl->xfer.rem_bytes;
227         writel(pio_xfer_ctrl, ctrl->base + PIO_XFER_CTRL);
228 }
229
230 static void qcom_qspi_pio_xfer(struct qcom_qspi *ctrl)
231 {
232         u32 ints;
233
234         qcom_qspi_pio_xfer_cfg(ctrl);
235
236         /* Ack any previous interrupts that might be hanging around */
237         writel(QSPI_ALL_IRQS, ctrl->base + MSTR_INT_STATUS);
238
239         /* Setup new interrupts */
240         if (ctrl->xfer.dir == QSPI_WRITE)
241                 ints = QSPI_ERR_IRQS | WR_FIFO_EMPTY;
242         else
243                 ints = QSPI_ERR_IRQS | RESP_FIFO_RDY;
244         writel(ints, ctrl->base + MSTR_INT_EN);
245
246         /* Kick off the transfer */
247         qcom_qspi_pio_xfer_ctrl(ctrl);
248 }
249
250 static void qcom_qspi_handle_err(struct spi_controller *host,
251                                  struct spi_message *msg)
252 {
253         u32 int_status;
254         struct qcom_qspi *ctrl = spi_controller_get_devdata(host);
255         unsigned long flags;
256         int i;
257
258         spin_lock_irqsave(&ctrl->lock, flags);
259         writel(0, ctrl->base + MSTR_INT_EN);
260         int_status = readl(ctrl->base + MSTR_INT_STATUS);
261         writel(int_status, ctrl->base + MSTR_INT_STATUS);
262         ctrl->xfer.rem_bytes = 0;
263
264         /* free cmd descriptors if they are around (DMA mode) */
265         for (i = 0; i < ctrl->n_cmd_desc; i++)
266                 dma_pool_free(ctrl->dma_cmd_pool, ctrl->virt_cmd_desc[i],
267                                   ctrl->dma_cmd_desc[i]);
268         ctrl->n_cmd_desc = 0;
269         spin_unlock_irqrestore(&ctrl->lock, flags);
270 }
271
272 static int qcom_qspi_set_speed(struct qcom_qspi *ctrl, unsigned long speed_hz)
273 {
274         int ret;
275         unsigned int avg_bw_cpu;
276
277         if (speed_hz == ctrl->last_speed)
278                 return 0;
279
280         /* In regular operation (SBL_EN=1) core must be 4x transfer clock */
281         ret = dev_pm_opp_set_rate(ctrl->dev, speed_hz * 4);
282         if (ret) {
283                 dev_err(ctrl->dev, "Failed to set core clk %d\n", ret);
284                 return ret;
285         }
286
287         /*
288          * Set BW quota for CPU.
289          * We don't have explicit peak requirement so keep it equal to avg_bw.
290          */
291         avg_bw_cpu = Bps_to_icc(speed_hz);
292         ret = icc_set_bw(ctrl->icc_path_cpu_to_qspi, avg_bw_cpu, avg_bw_cpu);
293         if (ret) {
294                 dev_err(ctrl->dev, "%s: ICC BW voting failed for cpu: %d\n",
295                         __func__, ret);
296                 return ret;
297         }
298
299         ctrl->last_speed = speed_hz;
300
301         return 0;
302 }
303
304 static int qcom_qspi_alloc_desc(struct qcom_qspi *ctrl, dma_addr_t dma_ptr,
305                         uint32_t n_bytes)
306 {
307         struct qspi_cmd_desc *virt_cmd_desc, *prev;
308         dma_addr_t dma_cmd_desc;
309
310         /* allocate for dma cmd descriptor */
311         virt_cmd_desc = dma_pool_alloc(ctrl->dma_cmd_pool, GFP_ATOMIC | __GFP_ZERO, &dma_cmd_desc);
312         if (!virt_cmd_desc) {
313                 dev_warn_once(ctrl->dev, "Couldn't find memory for descriptor\n");
314                 return -EAGAIN;
315         }
316
317         ctrl->virt_cmd_desc[ctrl->n_cmd_desc] = virt_cmd_desc;
318         ctrl->dma_cmd_desc[ctrl->n_cmd_desc] = dma_cmd_desc;
319         ctrl->n_cmd_desc++;
320
321         /* setup cmd descriptor */
322         virt_cmd_desc->data_address = dma_ptr;
323         virt_cmd_desc->direction = ctrl->xfer.dir;
324         virt_cmd_desc->multi_io_mode = qspi_buswidth_to_iomode(ctrl, ctrl->xfer.buswidth);
325         virt_cmd_desc->fragment = !ctrl->xfer.is_last;
326         virt_cmd_desc->length = n_bytes;
327
328         /* update previous descriptor */
329         if (ctrl->n_cmd_desc >= 2) {
330                 prev = (ctrl->virt_cmd_desc)[ctrl->n_cmd_desc - 2];
331                 prev->next_descriptor = dma_cmd_desc;
332                 prev->fragment = 1;
333         }
334
335         return 0;
336 }
337
338 static int qcom_qspi_setup_dma_desc(struct qcom_qspi *ctrl,
339                                 struct spi_transfer *xfer)
340 {
341         int ret;
342         struct sg_table *sgt;
343         dma_addr_t dma_ptr_sg;
344         unsigned int dma_len_sg;
345         int i;
346
347         if (ctrl->n_cmd_desc) {
348                 dev_err(ctrl->dev, "Remnant dma buffers n_cmd_desc-%d\n", ctrl->n_cmd_desc);
349                 return -EIO;
350         }
351
352         sgt = (ctrl->xfer.dir == QSPI_READ) ? &xfer->rx_sg : &xfer->tx_sg;
353         if (!sgt->nents || sgt->nents > QSPI_MAX_SG) {
354                 dev_warn_once(ctrl->dev, "Cannot handle %d entries in scatter list\n", sgt->nents);
355                 return -EAGAIN;
356         }
357
358         for (i = 0; i < sgt->nents; i++) {
359                 dma_ptr_sg = sg_dma_address(sgt->sgl + i);
360                 dma_len_sg = sg_dma_len(sgt->sgl + i);
361                 if (!IS_ALIGNED(dma_ptr_sg, QSPI_ALIGN_REQ)) {
362                         dev_warn_once(ctrl->dev, "dma_address not aligned to %d\n", QSPI_ALIGN_REQ);
363                         return -EAGAIN;
364                 }
365                 /*
366                  * When reading with DMA the controller writes to memory 1 word
367                  * at a time. If the length isn't a multiple of 4 bytes then
368                  * the controller can clobber the things later in memory.
369                  * Fallback to PIO to be safe.
370                  */
371                 if (ctrl->xfer.dir == QSPI_READ && (dma_len_sg & 0x03)) {
372                         dev_warn_once(ctrl->dev, "fallback to PIO for read of size %#010x\n",
373                                       dma_len_sg);
374                         return -EAGAIN;
375                 }
376         }
377
378         for (i = 0; i < sgt->nents; i++) {
379                 dma_ptr_sg = sg_dma_address(sgt->sgl + i);
380                 dma_len_sg = sg_dma_len(sgt->sgl + i);
381
382                 ret = qcom_qspi_alloc_desc(ctrl, dma_ptr_sg, dma_len_sg);
383                 if (ret)
384                         goto cleanup;
385         }
386         return 0;
387
388 cleanup:
389         for (i = 0; i < ctrl->n_cmd_desc; i++)
390                 dma_pool_free(ctrl->dma_cmd_pool, ctrl->virt_cmd_desc[i],
391                                   ctrl->dma_cmd_desc[i]);
392         ctrl->n_cmd_desc = 0;
393         return ret;
394 }
395
396 static void qcom_qspi_dma_xfer(struct qcom_qspi *ctrl)
397 {
398         /* Setup new interrupts */
399         writel(DMA_CHAIN_DONE, ctrl->base + MSTR_INT_EN);
400
401         /* kick off transfer */
402         writel((u32)((ctrl->dma_cmd_desc)[0]), ctrl->base + NEXT_DMA_DESC_ADDR);
403 }
404
405 /* Switch to DMA if transfer length exceeds this */
406 #define QSPI_MAX_BYTES_FIFO 64
407
408 static bool qcom_qspi_can_dma(struct spi_controller *ctlr,
409                          struct spi_device *slv, struct spi_transfer *xfer)
410 {
411         return xfer->len > QSPI_MAX_BYTES_FIFO;
412 }
413
414 static int qcom_qspi_transfer_one(struct spi_controller *host,
415                                   struct spi_device *slv,
416                                   struct spi_transfer *xfer)
417 {
418         struct qcom_qspi *ctrl = spi_controller_get_devdata(host);
419         int ret;
420         unsigned long speed_hz;
421         unsigned long flags;
422         u32 mstr_cfg;
423
424         speed_hz = slv->max_speed_hz;
425         if (xfer->speed_hz)
426                 speed_hz = xfer->speed_hz;
427
428         ret = qcom_qspi_set_speed(ctrl, speed_hz);
429         if (ret)
430                 return ret;
431
432         spin_lock_irqsave(&ctrl->lock, flags);
433         mstr_cfg = readl(ctrl->base + MSTR_CONFIG);
434
435         /* We are half duplex, so either rx or tx will be set */
436         if (xfer->rx_buf) {
437                 ctrl->xfer.dir = QSPI_READ;
438                 ctrl->xfer.buswidth = xfer->rx_nbits;
439                 ctrl->xfer.rx_buf = xfer->rx_buf;
440         } else {
441                 ctrl->xfer.dir = QSPI_WRITE;
442                 ctrl->xfer.buswidth = xfer->tx_nbits;
443                 ctrl->xfer.tx_buf = xfer->tx_buf;
444         }
445         ctrl->xfer.is_last = list_is_last(&xfer->transfer_list,
446                                           &host->cur_msg->transfers);
447         ctrl->xfer.rem_bytes = xfer->len;
448
449         if (xfer->rx_sg.nents || xfer->tx_sg.nents) {
450                 /* do DMA transfer */
451                 if (!(mstr_cfg & DMA_ENABLE)) {
452                         mstr_cfg |= DMA_ENABLE;
453                         writel(mstr_cfg, ctrl->base + MSTR_CONFIG);
454                 }
455
456                 ret = qcom_qspi_setup_dma_desc(ctrl, xfer);
457                 if (ret != -EAGAIN) {
458                         if (!ret) {
459                                 dma_wmb();
460                                 qcom_qspi_dma_xfer(ctrl);
461                         }
462                         goto exit;
463                 }
464                 dev_warn_once(ctrl->dev, "DMA failure, falling back to PIO\n");
465                 ret = 0; /* We'll retry w/ PIO */
466         }
467
468         if (mstr_cfg & DMA_ENABLE) {
469                 mstr_cfg &= ~DMA_ENABLE;
470                 writel(mstr_cfg, ctrl->base + MSTR_CONFIG);
471         }
472         qcom_qspi_pio_xfer(ctrl);
473
474 exit:
475         spin_unlock_irqrestore(&ctrl->lock, flags);
476
477         if (ret)
478                 return ret;
479
480         /* We'll call spi_finalize_current_transfer() when done */
481         return 1;
482 }
483
484 static int qcom_qspi_prepare_message(struct spi_controller *host,
485                                      struct spi_message *message)
486 {
487         u32 mstr_cfg;
488         struct qcom_qspi *ctrl;
489         int tx_data_oe_delay = 1;
490         int tx_data_delay = 1;
491         unsigned long flags;
492
493         ctrl = spi_controller_get_devdata(host);
494         spin_lock_irqsave(&ctrl->lock, flags);
495
496         mstr_cfg = readl(ctrl->base + MSTR_CONFIG);
497         mstr_cfg &= ~CHIP_SELECT_NUM;
498         if (spi_get_chipselect(message->spi, 0))
499                 mstr_cfg |= CHIP_SELECT_NUM;
500
501         mstr_cfg |= FB_CLK_EN | PIN_WPN | PIN_HOLDN | SBL_EN | FULL_CYCLE_MODE;
502         mstr_cfg &= ~(SPI_MODE_MSK | TX_DATA_OE_DELAY_MSK | TX_DATA_DELAY_MSK);
503         mstr_cfg |= message->spi->mode << SPI_MODE_SHFT;
504         mstr_cfg |= tx_data_oe_delay << TX_DATA_OE_DELAY_SHFT;
505         mstr_cfg |= tx_data_delay << TX_DATA_DELAY_SHFT;
506         mstr_cfg &= ~DMA_ENABLE;
507
508         writel(mstr_cfg, ctrl->base + MSTR_CONFIG);
509         spin_unlock_irqrestore(&ctrl->lock, flags);
510
511         return 0;
512 }
513
514 static int qcom_qspi_alloc_dma(struct qcom_qspi *ctrl)
515 {
516         ctrl->dma_cmd_pool = dmam_pool_create("qspi cmd desc pool",
517                 ctrl->dev, sizeof(struct qspi_cmd_desc), 0, 0);
518         if (!ctrl->dma_cmd_pool)
519                 return -ENOMEM;
520
521         return 0;
522 }
523
524 static irqreturn_t pio_read(struct qcom_qspi *ctrl)
525 {
526         u32 rd_fifo_status;
527         u32 rd_fifo;
528         unsigned int wr_cnts;
529         unsigned int bytes_to_read;
530         unsigned int words_to_read;
531         u32 *word_buf;
532         u8 *byte_buf;
533         int i;
534
535         rd_fifo_status = readl(ctrl->base + RD_FIFO_STATUS);
536
537         if (!(rd_fifo_status & FIFO_RDY)) {
538                 dev_dbg(ctrl->dev, "Spurious IRQ %#x\n", rd_fifo_status);
539                 return IRQ_NONE;
540         }
541
542         wr_cnts = (rd_fifo_status & WR_CNTS_MSK) >> WR_CNTS_SHFT;
543         wr_cnts = min(wr_cnts, ctrl->xfer.rem_bytes);
544
545         words_to_read = wr_cnts / QSPI_BYTES_PER_WORD;
546         bytes_to_read = wr_cnts % QSPI_BYTES_PER_WORD;
547
548         if (words_to_read) {
549                 word_buf = ctrl->xfer.rx_buf;
550                 ctrl->xfer.rem_bytes -= words_to_read * QSPI_BYTES_PER_WORD;
551                 ioread32_rep(ctrl->base + RD_FIFO, word_buf, words_to_read);
552                 ctrl->xfer.rx_buf = word_buf + words_to_read;
553         }
554
555         if (bytes_to_read) {
556                 byte_buf = ctrl->xfer.rx_buf;
557                 rd_fifo = readl(ctrl->base + RD_FIFO);
558                 ctrl->xfer.rem_bytes -= bytes_to_read;
559                 for (i = 0; i < bytes_to_read; i++)
560                         *byte_buf++ = rd_fifo >> (i * BITS_PER_BYTE);
561                 ctrl->xfer.rx_buf = byte_buf;
562         }
563
564         return IRQ_HANDLED;
565 }
566
567 static irqreturn_t pio_write(struct qcom_qspi *ctrl)
568 {
569         const void *xfer_buf = ctrl->xfer.tx_buf;
570         const int *word_buf;
571         const char *byte_buf;
572         unsigned int wr_fifo_bytes;
573         unsigned int wr_fifo_words;
574         unsigned int wr_size;
575         unsigned int rem_words;
576
577         wr_fifo_bytes = readl(ctrl->base + PIO_XFER_STATUS);
578         wr_fifo_bytes >>= WR_FIFO_BYTES_SHFT;
579
580         if (ctrl->xfer.rem_bytes < QSPI_BYTES_PER_WORD) {
581                 /* Process the last 1-3 bytes */
582                 wr_size = min(wr_fifo_bytes, ctrl->xfer.rem_bytes);
583                 ctrl->xfer.rem_bytes -= wr_size;
584
585                 byte_buf = xfer_buf;
586                 while (wr_size--)
587                         writel(*byte_buf++,
588                                ctrl->base + PIO_DATAOUT_1B);
589                 ctrl->xfer.tx_buf = byte_buf;
590         } else {
591                 /*
592                  * Process all the whole words; to keep things simple we'll
593                  * just wait for the next interrupt to handle the last 1-3
594                  * bytes if we don't have an even number of words.
595                  */
596                 rem_words = ctrl->xfer.rem_bytes / QSPI_BYTES_PER_WORD;
597                 wr_fifo_words = wr_fifo_bytes / QSPI_BYTES_PER_WORD;
598
599                 wr_size = min(rem_words, wr_fifo_words);
600                 ctrl->xfer.rem_bytes -= wr_size * QSPI_BYTES_PER_WORD;
601
602                 word_buf = xfer_buf;
603                 iowrite32_rep(ctrl->base + PIO_DATAOUT_4B, word_buf, wr_size);
604                 ctrl->xfer.tx_buf = word_buf + wr_size;
605
606         }
607
608         return IRQ_HANDLED;
609 }
610
611 static irqreturn_t qcom_qspi_irq(int irq, void *dev_id)
612 {
613         u32 int_status;
614         struct qcom_qspi *ctrl = dev_id;
615         irqreturn_t ret = IRQ_NONE;
616
617         spin_lock(&ctrl->lock);
618
619         int_status = readl(ctrl->base + MSTR_INT_STATUS);
620         writel(int_status, ctrl->base + MSTR_INT_STATUS);
621
622         /* Ignore disabled interrupts */
623         int_status &= readl(ctrl->base + MSTR_INT_EN);
624
625         /* PIO mode handling */
626         if (ctrl->xfer.dir == QSPI_WRITE) {
627                 if (int_status & WR_FIFO_EMPTY)
628                         ret = pio_write(ctrl);
629         } else {
630                 if (int_status & RESP_FIFO_RDY)
631                         ret = pio_read(ctrl);
632         }
633
634         if (int_status & QSPI_ERR_IRQS) {
635                 if (int_status & RESP_FIFO_UNDERRUN)
636                         dev_err(ctrl->dev, "IRQ error: FIFO underrun\n");
637                 if (int_status & WR_FIFO_OVERRUN)
638                         dev_err(ctrl->dev, "IRQ error: FIFO overrun\n");
639                 if (int_status & HRESP_FROM_NOC_ERR)
640                         dev_err(ctrl->dev, "IRQ error: NOC response error\n");
641                 ret = IRQ_HANDLED;
642         }
643
644         if (!ctrl->xfer.rem_bytes) {
645                 writel(0, ctrl->base + MSTR_INT_EN);
646                 spi_finalize_current_transfer(dev_get_drvdata(ctrl->dev));
647         }
648
649         /* DMA mode handling */
650         if (int_status & DMA_CHAIN_DONE) {
651                 int i;
652
653                 writel(0, ctrl->base + MSTR_INT_EN);
654                 ctrl->xfer.rem_bytes = 0;
655
656                 for (i = 0; i < ctrl->n_cmd_desc; i++)
657                         dma_pool_free(ctrl->dma_cmd_pool, ctrl->virt_cmd_desc[i],
658                                           ctrl->dma_cmd_desc[i]);
659                 ctrl->n_cmd_desc = 0;
660
661                 ret = IRQ_HANDLED;
662                 spi_finalize_current_transfer(dev_get_drvdata(ctrl->dev));
663         }
664
665         spin_unlock(&ctrl->lock);
666         return ret;
667 }
668
669 static int qcom_qspi_adjust_op_size(struct spi_mem *mem, struct spi_mem_op *op)
670 {
671         /*
672          * If qcom_qspi_can_dma() is going to return false we don't need to
673          * adjust anything.
674          */
675         if (op->data.nbytes <= QSPI_MAX_BYTES_FIFO)
676                 return 0;
677
678         /*
679          * When reading, the transfer needs to be a multiple of 4 bytes so
680          * shrink the transfer if that's not true. The caller will then do a
681          * second transfer to finish things up.
682          */
683         if (op->data.dir == SPI_MEM_DATA_IN && (op->data.nbytes & 0x3))
684                 op->data.nbytes &= ~0x3;
685
686         return 0;
687 }
688
689 static const struct spi_controller_mem_ops qcom_qspi_mem_ops = {
690         .adjust_op_size = qcom_qspi_adjust_op_size,
691 };
692
693 static int qcom_qspi_probe(struct platform_device *pdev)
694 {
695         int ret;
696         struct device *dev;
697         struct spi_controller *host;
698         struct qcom_qspi *ctrl;
699
700         dev = &pdev->dev;
701
702         host = devm_spi_alloc_host(dev, sizeof(*ctrl));
703         if (!host)
704                 return -ENOMEM;
705
706         platform_set_drvdata(pdev, host);
707
708         ctrl = spi_controller_get_devdata(host);
709
710         spin_lock_init(&ctrl->lock);
711         ctrl->dev = dev;
712         ctrl->base = devm_platform_ioremap_resource(pdev, 0);
713         if (IS_ERR(ctrl->base))
714                 return PTR_ERR(ctrl->base);
715
716         ctrl->clks = devm_kcalloc(dev, QSPI_NUM_CLKS,
717                                   sizeof(*ctrl->clks), GFP_KERNEL);
718         if (!ctrl->clks)
719                 return -ENOMEM;
720
721         ctrl->clks[QSPI_CLK_CORE].id = "core";
722         ctrl->clks[QSPI_CLK_IFACE].id = "iface";
723         ret = devm_clk_bulk_get(dev, QSPI_NUM_CLKS, ctrl->clks);
724         if (ret)
725                 return ret;
726
727         ctrl->icc_path_cpu_to_qspi = devm_of_icc_get(dev, "qspi-config");
728         if (IS_ERR(ctrl->icc_path_cpu_to_qspi))
729                 return dev_err_probe(dev, PTR_ERR(ctrl->icc_path_cpu_to_qspi),
730                                      "Failed to get cpu path\n");
731
732         /* Set BW vote for register access */
733         ret = icc_set_bw(ctrl->icc_path_cpu_to_qspi, Bps_to_icc(1000),
734                                 Bps_to_icc(1000));
735         if (ret) {
736                 dev_err(ctrl->dev, "%s: ICC BW voting failed for cpu: %d\n",
737                                 __func__, ret);
738                 return ret;
739         }
740
741         ret = icc_disable(ctrl->icc_path_cpu_to_qspi);
742         if (ret) {
743                 dev_err(ctrl->dev, "%s: ICC disable failed for cpu: %d\n",
744                                 __func__, ret);
745                 return ret;
746         }
747
748         ret = platform_get_irq(pdev, 0);
749         if (ret < 0)
750                 return ret;
751         ret = devm_request_irq(dev, ret, qcom_qspi_irq, 0, dev_name(dev), ctrl);
752         if (ret) {
753                 dev_err(dev, "Failed to request irq %d\n", ret);
754                 return ret;
755         }
756
757         ret = dma_set_mask_and_coherent(dev, DMA_BIT_MASK(32));
758         if (ret)
759                 return dev_err_probe(dev, ret, "could not set DMA mask\n");
760
761         host->max_speed_hz = 300000000;
762         host->max_dma_len = 65536; /* as per HPG */
763         host->dma_alignment = QSPI_ALIGN_REQ;
764         host->num_chipselect = QSPI_NUM_CS;
765         host->bus_num = -1;
766         host->dev.of_node = pdev->dev.of_node;
767         host->mode_bits = SPI_MODE_0 |
768                           SPI_TX_DUAL | SPI_RX_DUAL |
769                           SPI_TX_QUAD | SPI_RX_QUAD;
770         host->flags = SPI_CONTROLLER_HALF_DUPLEX;
771         host->prepare_message = qcom_qspi_prepare_message;
772         host->transfer_one = qcom_qspi_transfer_one;
773         host->handle_err = qcom_qspi_handle_err;
774         if (of_property_read_bool(pdev->dev.of_node, "iommus"))
775                 host->can_dma = qcom_qspi_can_dma;
776         host->auto_runtime_pm = true;
777         host->mem_ops = &qcom_qspi_mem_ops;
778
779         ret = devm_pm_opp_set_clkname(&pdev->dev, "core");
780         if (ret)
781                 return ret;
782         /* OPP table is optional */
783         ret = devm_pm_opp_of_add_table(&pdev->dev);
784         if (ret && ret != -ENODEV) {
785                 dev_err(&pdev->dev, "invalid OPP table in device tree\n");
786                 return ret;
787         }
788
789         ret = qcom_qspi_alloc_dma(ctrl);
790         if (ret)
791                 return ret;
792
793         pm_runtime_use_autosuspend(dev);
794         pm_runtime_set_autosuspend_delay(dev, 250);
795         pm_runtime_enable(dev);
796
797         ret = spi_register_controller(host);
798         if (!ret)
799                 return 0;
800
801         pm_runtime_disable(dev);
802
803         return ret;
804 }
805
806 static void qcom_qspi_remove(struct platform_device *pdev)
807 {
808         struct spi_controller *host = platform_get_drvdata(pdev);
809
810         /* Unregister _before_ disabling pm_runtime() so we stop transfers */
811         spi_unregister_controller(host);
812
813         pm_runtime_disable(&pdev->dev);
814 }
815
816 static int __maybe_unused qcom_qspi_runtime_suspend(struct device *dev)
817 {
818         struct spi_controller *host = dev_get_drvdata(dev);
819         struct qcom_qspi *ctrl = spi_controller_get_devdata(host);
820         int ret;
821
822         /* Drop the performance state vote */
823         dev_pm_opp_set_rate(dev, 0);
824         clk_bulk_disable_unprepare(QSPI_NUM_CLKS, ctrl->clks);
825
826         ret = icc_disable(ctrl->icc_path_cpu_to_qspi);
827         if (ret) {
828                 dev_err_ratelimited(ctrl->dev, "%s: ICC disable failed for cpu: %d\n",
829                         __func__, ret);
830                 return ret;
831         }
832
833         pinctrl_pm_select_sleep_state(dev);
834
835         return 0;
836 }
837
838 static int __maybe_unused qcom_qspi_runtime_resume(struct device *dev)
839 {
840         struct spi_controller *host = dev_get_drvdata(dev);
841         struct qcom_qspi *ctrl = spi_controller_get_devdata(host);
842         int ret;
843
844         pinctrl_pm_select_default_state(dev);
845
846         ret = icc_enable(ctrl->icc_path_cpu_to_qspi);
847         if (ret) {
848                 dev_err_ratelimited(ctrl->dev, "%s: ICC enable failed for cpu: %d\n",
849                         __func__, ret);
850                 return ret;
851         }
852
853         ret = clk_bulk_prepare_enable(QSPI_NUM_CLKS, ctrl->clks);
854         if (ret)
855                 return ret;
856
857         return dev_pm_opp_set_rate(dev, ctrl->last_speed * 4);
858 }
859
860 static int __maybe_unused qcom_qspi_suspend(struct device *dev)
861 {
862         struct spi_controller *host = dev_get_drvdata(dev);
863         int ret;
864
865         ret = spi_controller_suspend(host);
866         if (ret)
867                 return ret;
868
869         ret = pm_runtime_force_suspend(dev);
870         if (ret)
871                 spi_controller_resume(host);
872
873         return ret;
874 }
875
876 static int __maybe_unused qcom_qspi_resume(struct device *dev)
877 {
878         struct spi_controller *host = dev_get_drvdata(dev);
879         int ret;
880
881         ret = pm_runtime_force_resume(dev);
882         if (ret)
883                 return ret;
884
885         ret = spi_controller_resume(host);
886         if (ret)
887                 pm_runtime_force_suspend(dev);
888
889         return ret;
890 }
891
892 static const struct dev_pm_ops qcom_qspi_dev_pm_ops = {
893         SET_RUNTIME_PM_OPS(qcom_qspi_runtime_suspend,
894                            qcom_qspi_runtime_resume, NULL)
895         SET_SYSTEM_SLEEP_PM_OPS(qcom_qspi_suspend, qcom_qspi_resume)
896 };
897
898 static const struct of_device_id qcom_qspi_dt_match[] = {
899         { .compatible = "qcom,qspi-v1", },
900         { }
901 };
902 MODULE_DEVICE_TABLE(of, qcom_qspi_dt_match);
903
904 static struct platform_driver qcom_qspi_driver = {
905         .driver = {
906                 .name           = "qcom_qspi",
907                 .pm             = &qcom_qspi_dev_pm_ops,
908                 .of_match_table = qcom_qspi_dt_match,
909         },
910         .probe = qcom_qspi_probe,
911         .remove_new = qcom_qspi_remove,
912 };
913 module_platform_driver(qcom_qspi_driver);
914
915 MODULE_DESCRIPTION("SPI driver for QSPI cores");
916 MODULE_LICENSE("GPL v2");