1 // SPDX-License-Identifier: GPL-2.0-only
3 // Driver for Cadence QSPI Controller
5 // Copyright Altera Corporation (C) 2012-2014. All rights reserved.
6 // Copyright Intel Corporation (C) 2019-2020. All rights reserved.
7 // Copyright (C) 2020 Texas Instruments Incorporated - http://www.ti.com
10 #include <linux/completion.h>
11 #include <linux/delay.h>
12 #include <linux/dma-mapping.h>
13 #include <linux/dmaengine.h>
14 #include <linux/err.h>
15 #include <linux/errno.h>
16 #include <linux/firmware/xlnx-zynqmp.h>
17 #include <linux/interrupt.h>
19 #include <linux/iopoll.h>
20 #include <linux/jiffies.h>
21 #include <linux/kernel.h>
22 #include <linux/log2.h>
23 #include <linux/module.h>
24 #include <linux/of_device.h>
26 #include <linux/platform_device.h>
27 #include <linux/pm_runtime.h>
28 #include <linux/reset.h>
29 #include <linux/sched.h>
30 #include <linux/spi/spi.h>
31 #include <linux/spi/spi-mem.h>
32 #include <linux/timer.h>
34 #define CQSPI_NAME "cadence-qspi"
35 #define CQSPI_MAX_CHIPSELECT 16
38 #define CQSPI_NEEDS_WR_DELAY BIT(0)
39 #define CQSPI_DISABLE_DAC_MODE BIT(1)
40 #define CQSPI_SUPPORT_EXTERNAL_DMA BIT(2)
41 #define CQSPI_NO_SUPPORT_WR_COMPLETION BIT(3)
44 #define CQSPI_SUPPORTS_OCTAL BIT(0)
48 struct cqspi_flash_pdata {
49 struct cqspi_st *cqspi;
64 struct platform_device *pdev;
70 void __iomem *ahb_base;
71 resource_size_t ahb_size;
72 struct completion transfer_complete;
74 struct dma_chan *rx_chan;
75 struct completion rx_dma_complete;
76 dma_addr_t mmap_phys_base;
79 unsigned long master_ref_clk_hz;
88 struct cqspi_flash_pdata f_pdata[CQSPI_MAX_CHIPSELECT];
94 struct cqspi_driver_platdata {
97 int (*indirect_read_dma)(struct cqspi_flash_pdata *f_pdata,
98 u_char *rxbuf, loff_t from_addr, size_t n_rx);
99 u32 (*get_dma_status)(struct cqspi_st *cqspi);
102 /* Operation timeout value */
103 #define CQSPI_TIMEOUT_MS 500
104 #define CQSPI_READ_TIMEOUT_MS 10
106 #define CQSPI_DUMMY_CLKS_PER_BYTE 8
107 #define CQSPI_DUMMY_BYTES_MAX 4
108 #define CQSPI_DUMMY_CLKS_MAX 31
110 #define CQSPI_STIG_DATA_LEN_MAX 8
113 #define CQSPI_REG_CONFIG 0x00
114 #define CQSPI_REG_CONFIG_ENABLE_MASK BIT(0)
115 #define CQSPI_REG_CONFIG_ENB_DIR_ACC_CTRL BIT(7)
116 #define CQSPI_REG_CONFIG_DECODE_MASK BIT(9)
117 #define CQSPI_REG_CONFIG_CHIPSELECT_LSB 10
118 #define CQSPI_REG_CONFIG_DMA_MASK BIT(15)
119 #define CQSPI_REG_CONFIG_BAUD_LSB 19
120 #define CQSPI_REG_CONFIG_DTR_PROTO BIT(24)
121 #define CQSPI_REG_CONFIG_DUAL_OPCODE BIT(30)
122 #define CQSPI_REG_CONFIG_IDLE_LSB 31
123 #define CQSPI_REG_CONFIG_CHIPSELECT_MASK 0xF
124 #define CQSPI_REG_CONFIG_BAUD_MASK 0xF
126 #define CQSPI_REG_RD_INSTR 0x04
127 #define CQSPI_REG_RD_INSTR_OPCODE_LSB 0
128 #define CQSPI_REG_RD_INSTR_TYPE_INSTR_LSB 8
129 #define CQSPI_REG_RD_INSTR_TYPE_ADDR_LSB 12
130 #define CQSPI_REG_RD_INSTR_TYPE_DATA_LSB 16
131 #define CQSPI_REG_RD_INSTR_MODE_EN_LSB 20
132 #define CQSPI_REG_RD_INSTR_DUMMY_LSB 24
133 #define CQSPI_REG_RD_INSTR_TYPE_INSTR_MASK 0x3
134 #define CQSPI_REG_RD_INSTR_TYPE_ADDR_MASK 0x3
135 #define CQSPI_REG_RD_INSTR_TYPE_DATA_MASK 0x3
136 #define CQSPI_REG_RD_INSTR_DUMMY_MASK 0x1F
138 #define CQSPI_REG_WR_INSTR 0x08
139 #define CQSPI_REG_WR_INSTR_OPCODE_LSB 0
140 #define CQSPI_REG_WR_INSTR_TYPE_ADDR_LSB 12
141 #define CQSPI_REG_WR_INSTR_TYPE_DATA_LSB 16
143 #define CQSPI_REG_DELAY 0x0C
144 #define CQSPI_REG_DELAY_TSLCH_LSB 0
145 #define CQSPI_REG_DELAY_TCHSH_LSB 8
146 #define CQSPI_REG_DELAY_TSD2D_LSB 16
147 #define CQSPI_REG_DELAY_TSHSL_LSB 24
148 #define CQSPI_REG_DELAY_TSLCH_MASK 0xFF
149 #define CQSPI_REG_DELAY_TCHSH_MASK 0xFF
150 #define CQSPI_REG_DELAY_TSD2D_MASK 0xFF
151 #define CQSPI_REG_DELAY_TSHSL_MASK 0xFF
153 #define CQSPI_REG_READCAPTURE 0x10
154 #define CQSPI_REG_READCAPTURE_BYPASS_LSB 0
155 #define CQSPI_REG_READCAPTURE_DELAY_LSB 1
156 #define CQSPI_REG_READCAPTURE_DELAY_MASK 0xF
158 #define CQSPI_REG_SIZE 0x14
159 #define CQSPI_REG_SIZE_ADDRESS_LSB 0
160 #define CQSPI_REG_SIZE_PAGE_LSB 4
161 #define CQSPI_REG_SIZE_BLOCK_LSB 16
162 #define CQSPI_REG_SIZE_ADDRESS_MASK 0xF
163 #define CQSPI_REG_SIZE_PAGE_MASK 0xFFF
164 #define CQSPI_REG_SIZE_BLOCK_MASK 0x3F
166 #define CQSPI_REG_SRAMPARTITION 0x18
167 #define CQSPI_REG_INDIRECTTRIGGER 0x1C
169 #define CQSPI_REG_DMA 0x20
170 #define CQSPI_REG_DMA_SINGLE_LSB 0
171 #define CQSPI_REG_DMA_BURST_LSB 8
172 #define CQSPI_REG_DMA_SINGLE_MASK 0xFF
173 #define CQSPI_REG_DMA_BURST_MASK 0xFF
175 #define CQSPI_REG_REMAP 0x24
176 #define CQSPI_REG_MODE_BIT 0x28
178 #define CQSPI_REG_SDRAMLEVEL 0x2C
179 #define CQSPI_REG_SDRAMLEVEL_RD_LSB 0
180 #define CQSPI_REG_SDRAMLEVEL_WR_LSB 16
181 #define CQSPI_REG_SDRAMLEVEL_RD_MASK 0xFFFF
182 #define CQSPI_REG_SDRAMLEVEL_WR_MASK 0xFFFF
184 #define CQSPI_REG_WR_COMPLETION_CTRL 0x38
185 #define CQSPI_REG_WR_DISABLE_AUTO_POLL BIT(14)
187 #define CQSPI_REG_IRQSTATUS 0x40
188 #define CQSPI_REG_IRQMASK 0x44
190 #define CQSPI_REG_INDIRECTRD 0x60
191 #define CQSPI_REG_INDIRECTRD_START_MASK BIT(0)
192 #define CQSPI_REG_INDIRECTRD_CANCEL_MASK BIT(1)
193 #define CQSPI_REG_INDIRECTRD_DONE_MASK BIT(5)
195 #define CQSPI_REG_INDIRECTRDWATERMARK 0x64
196 #define CQSPI_REG_INDIRECTRDSTARTADDR 0x68
197 #define CQSPI_REG_INDIRECTRDBYTES 0x6C
199 #define CQSPI_REG_CMDCTRL 0x90
200 #define CQSPI_REG_CMDCTRL_EXECUTE_MASK BIT(0)
201 #define CQSPI_REG_CMDCTRL_INPROGRESS_MASK BIT(1)
202 #define CQSPI_REG_CMDCTRL_DUMMY_LSB 7
203 #define CQSPI_REG_CMDCTRL_WR_BYTES_LSB 12
204 #define CQSPI_REG_CMDCTRL_WR_EN_LSB 15
205 #define CQSPI_REG_CMDCTRL_ADD_BYTES_LSB 16
206 #define CQSPI_REG_CMDCTRL_ADDR_EN_LSB 19
207 #define CQSPI_REG_CMDCTRL_RD_BYTES_LSB 20
208 #define CQSPI_REG_CMDCTRL_RD_EN_LSB 23
209 #define CQSPI_REG_CMDCTRL_OPCODE_LSB 24
210 #define CQSPI_REG_CMDCTRL_WR_BYTES_MASK 0x7
211 #define CQSPI_REG_CMDCTRL_ADD_BYTES_MASK 0x3
212 #define CQSPI_REG_CMDCTRL_RD_BYTES_MASK 0x7
213 #define CQSPI_REG_CMDCTRL_DUMMY_MASK 0x1F
215 #define CQSPI_REG_INDIRECTWR 0x70
216 #define CQSPI_REG_INDIRECTWR_START_MASK BIT(0)
217 #define CQSPI_REG_INDIRECTWR_CANCEL_MASK BIT(1)
218 #define CQSPI_REG_INDIRECTWR_DONE_MASK BIT(5)
220 #define CQSPI_REG_INDIRECTWRWATERMARK 0x74
221 #define CQSPI_REG_INDIRECTWRSTARTADDR 0x78
222 #define CQSPI_REG_INDIRECTWRBYTES 0x7C
224 #define CQSPI_REG_INDTRIG_ADDRRANGE 0x80
226 #define CQSPI_REG_CMDADDRESS 0x94
227 #define CQSPI_REG_CMDREADDATALOWER 0xA0
228 #define CQSPI_REG_CMDREADDATAUPPER 0xA4
229 #define CQSPI_REG_CMDWRITEDATALOWER 0xA8
230 #define CQSPI_REG_CMDWRITEDATAUPPER 0xAC
232 #define CQSPI_REG_POLLING_STATUS 0xB0
233 #define CQSPI_REG_POLLING_STATUS_DUMMY_LSB 16
235 #define CQSPI_REG_OP_EXT_LOWER 0xE0
236 #define CQSPI_REG_OP_EXT_READ_LSB 24
237 #define CQSPI_REG_OP_EXT_WRITE_LSB 16
238 #define CQSPI_REG_OP_EXT_STIG_LSB 0
240 #define CQSPI_REG_VERSAL_DMA_SRC_ADDR 0x1000
242 #define CQSPI_REG_VERSAL_DMA_DST_ADDR 0x1800
243 #define CQSPI_REG_VERSAL_DMA_DST_SIZE 0x1804
245 #define CQSPI_REG_VERSAL_DMA_DST_CTRL 0x180C
247 #define CQSPI_REG_VERSAL_DMA_DST_I_STS 0x1814
248 #define CQSPI_REG_VERSAL_DMA_DST_I_EN 0x1818
249 #define CQSPI_REG_VERSAL_DMA_DST_I_DIS 0x181C
250 #define CQSPI_REG_VERSAL_DMA_DST_DONE_MASK BIT(1)
252 #define CQSPI_REG_VERSAL_DMA_DST_ADDR_MSB 0x1828
254 #define CQSPI_REG_VERSAL_DMA_DST_CTRL_VAL 0xF43FFA00
255 #define CQSPI_REG_VERSAL_ADDRRANGE_WIDTH_VAL 0x6
257 /* Interrupt status bits */
258 #define CQSPI_REG_IRQ_MODE_ERR BIT(0)
259 #define CQSPI_REG_IRQ_UNDERFLOW BIT(1)
260 #define CQSPI_REG_IRQ_IND_COMP BIT(2)
261 #define CQSPI_REG_IRQ_IND_RD_REJECT BIT(3)
262 #define CQSPI_REG_IRQ_WR_PROTECTED_ERR BIT(4)
263 #define CQSPI_REG_IRQ_ILLEGAL_AHB_ERR BIT(5)
264 #define CQSPI_REG_IRQ_WATERMARK BIT(6)
265 #define CQSPI_REG_IRQ_IND_SRAM_FULL BIT(12)
267 #define CQSPI_IRQ_MASK_RD (CQSPI_REG_IRQ_WATERMARK | \
268 CQSPI_REG_IRQ_IND_SRAM_FULL | \
269 CQSPI_REG_IRQ_IND_COMP)
271 #define CQSPI_IRQ_MASK_WR (CQSPI_REG_IRQ_IND_COMP | \
272 CQSPI_REG_IRQ_WATERMARK | \
273 CQSPI_REG_IRQ_UNDERFLOW)
275 #define CQSPI_IRQ_STATUS_MASK 0x1FFFF
276 #define CQSPI_DMA_UNALIGN 0x3
278 #define CQSPI_REG_VERSAL_DMA_VAL 0x602
280 static int cqspi_wait_for_bit(void __iomem *reg, const u32 mask, bool clr)
284 return readl_relaxed_poll_timeout(reg, val,
285 (((clr ? ~val : val) & mask) == mask),
286 10, CQSPI_TIMEOUT_MS * 1000);
289 static bool cqspi_is_idle(struct cqspi_st *cqspi)
291 u32 reg = readl(cqspi->iobase + CQSPI_REG_CONFIG);
293 return reg & (1UL << CQSPI_REG_CONFIG_IDLE_LSB);
296 static u32 cqspi_get_rd_sram_level(struct cqspi_st *cqspi)
298 u32 reg = readl(cqspi->iobase + CQSPI_REG_SDRAMLEVEL);
300 reg >>= CQSPI_REG_SDRAMLEVEL_RD_LSB;
301 return reg & CQSPI_REG_SDRAMLEVEL_RD_MASK;
304 static u32 cqspi_get_versal_dma_status(struct cqspi_st *cqspi)
308 dma_status = readl(cqspi->iobase +
309 CQSPI_REG_VERSAL_DMA_DST_I_STS);
310 writel(dma_status, cqspi->iobase +
311 CQSPI_REG_VERSAL_DMA_DST_I_STS);
313 return dma_status & CQSPI_REG_VERSAL_DMA_DST_DONE_MASK;
316 static irqreturn_t cqspi_irq_handler(int this_irq, void *dev)
318 struct cqspi_st *cqspi = dev;
319 unsigned int irq_status;
320 struct device *device = &cqspi->pdev->dev;
321 const struct cqspi_driver_platdata *ddata;
323 ddata = of_device_get_match_data(device);
325 /* Read interrupt status */
326 irq_status = readl(cqspi->iobase + CQSPI_REG_IRQSTATUS);
328 /* Clear interrupt */
329 writel(irq_status, cqspi->iobase + CQSPI_REG_IRQSTATUS);
331 if (cqspi->use_dma_read && ddata && ddata->get_dma_status) {
332 if (ddata->get_dma_status(cqspi)) {
333 complete(&cqspi->transfer_complete);
338 irq_status &= CQSPI_IRQ_MASK_RD | CQSPI_IRQ_MASK_WR;
341 complete(&cqspi->transfer_complete);
346 static unsigned int cqspi_calc_rdreg(struct cqspi_flash_pdata *f_pdata)
350 rdreg |= f_pdata->inst_width << CQSPI_REG_RD_INSTR_TYPE_INSTR_LSB;
351 rdreg |= f_pdata->addr_width << CQSPI_REG_RD_INSTR_TYPE_ADDR_LSB;
352 rdreg |= f_pdata->data_width << CQSPI_REG_RD_INSTR_TYPE_DATA_LSB;
357 static unsigned int cqspi_calc_dummy(const struct spi_mem_op *op, bool dtr)
359 unsigned int dummy_clk;
361 if (!op->dummy.nbytes)
364 dummy_clk = op->dummy.nbytes * (8 / op->dummy.buswidth);
371 static int cqspi_set_protocol(struct cqspi_flash_pdata *f_pdata,
372 const struct spi_mem_op *op)
375 * For an op to be DTR, cmd phase along with every other non-empty
376 * phase should have dtr field set to 1. If an op phase has zero
377 * nbytes, ignore its dtr field; otherwise, check its dtr field.
379 f_pdata->dtr = op->cmd.dtr &&
380 (!op->addr.nbytes || op->addr.dtr) &&
381 (!op->data.nbytes || op->data.dtr);
383 f_pdata->inst_width = 0;
384 if (op->cmd.buswidth)
385 f_pdata->inst_width = ilog2(op->cmd.buswidth);
387 f_pdata->addr_width = 0;
388 if (op->addr.buswidth)
389 f_pdata->addr_width = ilog2(op->addr.buswidth);
391 f_pdata->data_width = 0;
392 if (op->data.buswidth)
393 f_pdata->data_width = ilog2(op->data.buswidth);
395 /* Right now we only support 8-8-8 DTR mode. */
397 switch (op->cmd.buswidth) {
405 switch (op->addr.buswidth) {
413 switch (op->data.buswidth) {
425 static int cqspi_wait_idle(struct cqspi_st *cqspi)
427 const unsigned int poll_idle_retry = 3;
428 unsigned int count = 0;
429 unsigned long timeout;
431 timeout = jiffies + msecs_to_jiffies(CQSPI_TIMEOUT_MS);
434 * Read few times in succession to ensure the controller
435 * is indeed idle, that is, the bit does not transition
438 if (cqspi_is_idle(cqspi))
443 if (count >= poll_idle_retry)
446 if (time_after(jiffies, timeout)) {
447 /* Timeout, in busy mode. */
448 dev_err(&cqspi->pdev->dev,
449 "QSPI is still busy after %dms timeout.\n",
458 static int cqspi_exec_flash_cmd(struct cqspi_st *cqspi, unsigned int reg)
460 void __iomem *reg_base = cqspi->iobase;
463 /* Write the CMDCTRL without start execution. */
464 writel(reg, reg_base + CQSPI_REG_CMDCTRL);
466 reg |= CQSPI_REG_CMDCTRL_EXECUTE_MASK;
467 writel(reg, reg_base + CQSPI_REG_CMDCTRL);
469 /* Polling for completion. */
470 ret = cqspi_wait_for_bit(reg_base + CQSPI_REG_CMDCTRL,
471 CQSPI_REG_CMDCTRL_INPROGRESS_MASK, 1);
473 dev_err(&cqspi->pdev->dev,
474 "Flash command execution timed out.\n");
478 /* Polling QSPI idle status. */
479 return cqspi_wait_idle(cqspi);
482 static int cqspi_setup_opcode_ext(struct cqspi_flash_pdata *f_pdata,
483 const struct spi_mem_op *op,
486 struct cqspi_st *cqspi = f_pdata->cqspi;
487 void __iomem *reg_base = cqspi->iobase;
491 if (op->cmd.nbytes != 2)
494 /* Opcode extension is the LSB. */
495 ext = op->cmd.opcode & 0xff;
497 reg = readl(reg_base + CQSPI_REG_OP_EXT_LOWER);
498 reg &= ~(0xff << shift);
500 writel(reg, reg_base + CQSPI_REG_OP_EXT_LOWER);
505 static int cqspi_enable_dtr(struct cqspi_flash_pdata *f_pdata,
506 const struct spi_mem_op *op, unsigned int shift,
509 struct cqspi_st *cqspi = f_pdata->cqspi;
510 void __iomem *reg_base = cqspi->iobase;
514 reg = readl(reg_base + CQSPI_REG_CONFIG);
517 * We enable dual byte opcode here. The callers have to set up the
518 * extension opcode based on which type of operation it is.
521 reg |= CQSPI_REG_CONFIG_DTR_PROTO;
522 reg |= CQSPI_REG_CONFIG_DUAL_OPCODE;
524 /* Set up command opcode extension. */
525 ret = cqspi_setup_opcode_ext(f_pdata, op, shift);
529 reg &= ~CQSPI_REG_CONFIG_DTR_PROTO;
530 reg &= ~CQSPI_REG_CONFIG_DUAL_OPCODE;
533 writel(reg, reg_base + CQSPI_REG_CONFIG);
535 return cqspi_wait_idle(cqspi);
538 static int cqspi_command_read(struct cqspi_flash_pdata *f_pdata,
539 const struct spi_mem_op *op)
541 struct cqspi_st *cqspi = f_pdata->cqspi;
542 void __iomem *reg_base = cqspi->iobase;
543 u8 *rxbuf = op->data.buf.in;
545 size_t n_rx = op->data.nbytes;
548 unsigned int dummy_clk;
552 status = cqspi_set_protocol(f_pdata, op);
556 status = cqspi_enable_dtr(f_pdata, op, CQSPI_REG_OP_EXT_STIG_LSB,
561 if (!n_rx || n_rx > CQSPI_STIG_DATA_LEN_MAX || !rxbuf) {
562 dev_err(&cqspi->pdev->dev,
563 "Invalid input argument, len %zu rxbuf 0x%p\n",
569 opcode = op->cmd.opcode >> 8;
571 opcode = op->cmd.opcode;
573 reg = opcode << CQSPI_REG_CMDCTRL_OPCODE_LSB;
575 rdreg = cqspi_calc_rdreg(f_pdata);
576 writel(rdreg, reg_base + CQSPI_REG_RD_INSTR);
578 dummy_clk = cqspi_calc_dummy(op, f_pdata->dtr);
579 if (dummy_clk > CQSPI_DUMMY_CLKS_MAX)
583 reg |= (dummy_clk & CQSPI_REG_CMDCTRL_DUMMY_MASK)
584 << CQSPI_REG_CMDCTRL_DUMMY_LSB;
586 reg |= (0x1 << CQSPI_REG_CMDCTRL_RD_EN_LSB);
588 /* 0 means 1 byte. */
589 reg |= (((n_rx - 1) & CQSPI_REG_CMDCTRL_RD_BYTES_MASK)
590 << CQSPI_REG_CMDCTRL_RD_BYTES_LSB);
591 status = cqspi_exec_flash_cmd(cqspi, reg);
595 reg = readl(reg_base + CQSPI_REG_CMDREADDATALOWER);
597 /* Put the read value into rx_buf */
598 read_len = (n_rx > 4) ? 4 : n_rx;
599 memcpy(rxbuf, ®, read_len);
603 reg = readl(reg_base + CQSPI_REG_CMDREADDATAUPPER);
605 read_len = n_rx - read_len;
606 memcpy(rxbuf, ®, read_len);
612 static int cqspi_command_write(struct cqspi_flash_pdata *f_pdata,
613 const struct spi_mem_op *op)
615 struct cqspi_st *cqspi = f_pdata->cqspi;
616 void __iomem *reg_base = cqspi->iobase;
618 const u8 *txbuf = op->data.buf.out;
619 size_t n_tx = op->data.nbytes;
625 ret = cqspi_set_protocol(f_pdata, op);
629 ret = cqspi_enable_dtr(f_pdata, op, CQSPI_REG_OP_EXT_STIG_LSB,
634 if (n_tx > CQSPI_STIG_DATA_LEN_MAX || (n_tx && !txbuf)) {
635 dev_err(&cqspi->pdev->dev,
636 "Invalid input argument, cmdlen %zu txbuf 0x%p\n",
641 reg = cqspi_calc_rdreg(f_pdata);
642 writel(reg, reg_base + CQSPI_REG_RD_INSTR);
645 opcode = op->cmd.opcode >> 8;
647 opcode = op->cmd.opcode;
649 reg = opcode << CQSPI_REG_CMDCTRL_OPCODE_LSB;
651 if (op->addr.nbytes) {
652 reg |= (0x1 << CQSPI_REG_CMDCTRL_ADDR_EN_LSB);
653 reg |= ((op->addr.nbytes - 1) &
654 CQSPI_REG_CMDCTRL_ADD_BYTES_MASK)
655 << CQSPI_REG_CMDCTRL_ADD_BYTES_LSB;
657 writel(op->addr.val, reg_base + CQSPI_REG_CMDADDRESS);
661 reg |= (0x1 << CQSPI_REG_CMDCTRL_WR_EN_LSB);
662 reg |= ((n_tx - 1) & CQSPI_REG_CMDCTRL_WR_BYTES_MASK)
663 << CQSPI_REG_CMDCTRL_WR_BYTES_LSB;
665 write_len = (n_tx > 4) ? 4 : n_tx;
666 memcpy(&data, txbuf, write_len);
668 writel(data, reg_base + CQSPI_REG_CMDWRITEDATALOWER);
672 write_len = n_tx - 4;
673 memcpy(&data, txbuf, write_len);
674 writel(data, reg_base + CQSPI_REG_CMDWRITEDATAUPPER);
678 return cqspi_exec_flash_cmd(cqspi, reg);
681 static int cqspi_read_setup(struct cqspi_flash_pdata *f_pdata,
682 const struct spi_mem_op *op)
684 struct cqspi_st *cqspi = f_pdata->cqspi;
685 void __iomem *reg_base = cqspi->iobase;
686 unsigned int dummy_clk = 0;
691 ret = cqspi_enable_dtr(f_pdata, op, CQSPI_REG_OP_EXT_READ_LSB,
697 opcode = op->cmd.opcode >> 8;
699 opcode = op->cmd.opcode;
701 reg = opcode << CQSPI_REG_RD_INSTR_OPCODE_LSB;
702 reg |= cqspi_calc_rdreg(f_pdata);
704 /* Setup dummy clock cycles */
705 dummy_clk = cqspi_calc_dummy(op, f_pdata->dtr);
707 if (dummy_clk > CQSPI_DUMMY_CLKS_MAX)
711 reg |= (dummy_clk & CQSPI_REG_RD_INSTR_DUMMY_MASK)
712 << CQSPI_REG_RD_INSTR_DUMMY_LSB;
714 writel(reg, reg_base + CQSPI_REG_RD_INSTR);
716 /* Set address width */
717 reg = readl(reg_base + CQSPI_REG_SIZE);
718 reg &= ~CQSPI_REG_SIZE_ADDRESS_MASK;
719 reg |= (op->addr.nbytes - 1);
720 writel(reg, reg_base + CQSPI_REG_SIZE);
724 static int cqspi_indirect_read_execute(struct cqspi_flash_pdata *f_pdata,
725 u8 *rxbuf, loff_t from_addr,
728 struct cqspi_st *cqspi = f_pdata->cqspi;
729 struct device *dev = &cqspi->pdev->dev;
730 void __iomem *reg_base = cqspi->iobase;
731 void __iomem *ahb_base = cqspi->ahb_base;
732 unsigned int remaining = n_rx;
733 unsigned int mod_bytes = n_rx % 4;
734 unsigned int bytes_to_read = 0;
735 u8 *rxbuf_end = rxbuf + n_rx;
738 writel(from_addr, reg_base + CQSPI_REG_INDIRECTRDSTARTADDR);
739 writel(remaining, reg_base + CQSPI_REG_INDIRECTRDBYTES);
741 /* Clear all interrupts. */
742 writel(CQSPI_IRQ_STATUS_MASK, reg_base + CQSPI_REG_IRQSTATUS);
744 writel(CQSPI_IRQ_MASK_RD, reg_base + CQSPI_REG_IRQMASK);
746 reinit_completion(&cqspi->transfer_complete);
747 writel(CQSPI_REG_INDIRECTRD_START_MASK,
748 reg_base + CQSPI_REG_INDIRECTRD);
750 while (remaining > 0) {
751 if (!wait_for_completion_timeout(&cqspi->transfer_complete,
752 msecs_to_jiffies(CQSPI_READ_TIMEOUT_MS)))
755 bytes_to_read = cqspi_get_rd_sram_level(cqspi);
757 if (ret && bytes_to_read == 0) {
758 dev_err(dev, "Indirect read timeout, no bytes\n");
762 while (bytes_to_read != 0) {
763 unsigned int word_remain = round_down(remaining, 4);
765 bytes_to_read *= cqspi->fifo_width;
766 bytes_to_read = bytes_to_read > remaining ?
767 remaining : bytes_to_read;
768 bytes_to_read = round_down(bytes_to_read, 4);
769 /* Read 4 byte word chunks then single bytes */
771 ioread32_rep(ahb_base, rxbuf,
772 (bytes_to_read / 4));
773 } else if (!word_remain && mod_bytes) {
774 unsigned int temp = ioread32(ahb_base);
776 bytes_to_read = mod_bytes;
777 memcpy(rxbuf, &temp, min((unsigned int)
781 rxbuf += bytes_to_read;
782 remaining -= bytes_to_read;
783 bytes_to_read = cqspi_get_rd_sram_level(cqspi);
787 reinit_completion(&cqspi->transfer_complete);
790 /* Check indirect done status */
791 ret = cqspi_wait_for_bit(reg_base + CQSPI_REG_INDIRECTRD,
792 CQSPI_REG_INDIRECTRD_DONE_MASK, 0);
794 dev_err(dev, "Indirect read completion error (%i)\n", ret);
798 /* Disable interrupt */
799 writel(0, reg_base + CQSPI_REG_IRQMASK);
801 /* Clear indirect completion status */
802 writel(CQSPI_REG_INDIRECTRD_DONE_MASK, reg_base + CQSPI_REG_INDIRECTRD);
807 /* Disable interrupt */
808 writel(0, reg_base + CQSPI_REG_IRQMASK);
810 /* Cancel the indirect read */
811 writel(CQSPI_REG_INDIRECTWR_CANCEL_MASK,
812 reg_base + CQSPI_REG_INDIRECTRD);
816 static int cqspi_versal_indirect_read_dma(struct cqspi_flash_pdata *f_pdata,
817 u_char *rxbuf, loff_t from_addr,
820 struct cqspi_st *cqspi = f_pdata->cqspi;
821 struct device *dev = &cqspi->pdev->dev;
822 void __iomem *reg_base = cqspi->iobase;
823 u32 reg, bytes_to_dma;
824 loff_t addr = from_addr;
830 bytes_rem = n_rx % 4;
831 bytes_to_dma = (n_rx - bytes_rem);
836 ret = zynqmp_pm_ospi_mux_select(cqspi->pd_dev_id, PM_OSPI_MUX_SEL_DMA);
840 reg = readl(cqspi->iobase + CQSPI_REG_CONFIG);
841 reg |= CQSPI_REG_CONFIG_DMA_MASK;
842 writel(reg, cqspi->iobase + CQSPI_REG_CONFIG);
844 dma_addr = dma_map_single(dev, rxbuf, bytes_to_dma, DMA_FROM_DEVICE);
845 if (dma_mapping_error(dev, dma_addr)) {
846 dev_err(dev, "dma mapping failed\n");
850 writel(from_addr, reg_base + CQSPI_REG_INDIRECTRDSTARTADDR);
851 writel(bytes_to_dma, reg_base + CQSPI_REG_INDIRECTRDBYTES);
852 writel(CQSPI_REG_VERSAL_ADDRRANGE_WIDTH_VAL,
853 reg_base + CQSPI_REG_INDTRIG_ADDRRANGE);
855 /* Clear all interrupts. */
856 writel(CQSPI_IRQ_STATUS_MASK, reg_base + CQSPI_REG_IRQSTATUS);
858 /* Enable DMA done interrupt */
859 writel(CQSPI_REG_VERSAL_DMA_DST_DONE_MASK,
860 reg_base + CQSPI_REG_VERSAL_DMA_DST_I_EN);
862 /* Default DMA periph configuration */
863 writel(CQSPI_REG_VERSAL_DMA_VAL, reg_base + CQSPI_REG_DMA);
865 /* Configure DMA Dst address */
866 writel(lower_32_bits(dma_addr),
867 reg_base + CQSPI_REG_VERSAL_DMA_DST_ADDR);
868 writel(upper_32_bits(dma_addr),
869 reg_base + CQSPI_REG_VERSAL_DMA_DST_ADDR_MSB);
871 /* Configure DMA Src address */
872 writel(cqspi->trigger_address, reg_base +
873 CQSPI_REG_VERSAL_DMA_SRC_ADDR);
875 /* Set DMA destination size */
876 writel(bytes_to_dma, reg_base + CQSPI_REG_VERSAL_DMA_DST_SIZE);
878 /* Set DMA destination control */
879 writel(CQSPI_REG_VERSAL_DMA_DST_CTRL_VAL,
880 reg_base + CQSPI_REG_VERSAL_DMA_DST_CTRL);
882 writel(CQSPI_REG_INDIRECTRD_START_MASK,
883 reg_base + CQSPI_REG_INDIRECTRD);
885 reinit_completion(&cqspi->transfer_complete);
887 if (!wait_for_completion_timeout(&cqspi->transfer_complete,
888 msecs_to_jiffies(CQSPI_READ_TIMEOUT_MS))) {
893 /* Disable DMA interrupt */
894 writel(0x0, cqspi->iobase + CQSPI_REG_VERSAL_DMA_DST_I_DIS);
896 /* Clear indirect completion status */
897 writel(CQSPI_REG_INDIRECTRD_DONE_MASK,
898 cqspi->iobase + CQSPI_REG_INDIRECTRD);
899 dma_unmap_single(dev, dma_addr, bytes_to_dma, DMA_FROM_DEVICE);
901 reg = readl(cqspi->iobase + CQSPI_REG_CONFIG);
902 reg &= ~CQSPI_REG_CONFIG_DMA_MASK;
903 writel(reg, cqspi->iobase + CQSPI_REG_CONFIG);
905 ret = zynqmp_pm_ospi_mux_select(cqspi->pd_dev_id,
906 PM_OSPI_MUX_SEL_LINEAR);
912 addr += bytes_to_dma;
914 ret = cqspi_indirect_read_execute(f_pdata, buf, addr,
923 /* Disable DMA interrupt */
924 writel(0x0, reg_base + CQSPI_REG_VERSAL_DMA_DST_I_DIS);
926 /* Cancel the indirect read */
927 writel(CQSPI_REG_INDIRECTWR_CANCEL_MASK,
928 reg_base + CQSPI_REG_INDIRECTRD);
930 dma_unmap_single(dev, dma_addr, bytes_to_dma, DMA_FROM_DEVICE);
932 reg = readl(cqspi->iobase + CQSPI_REG_CONFIG);
933 reg &= ~CQSPI_REG_CONFIG_DMA_MASK;
934 writel(reg, cqspi->iobase + CQSPI_REG_CONFIG);
936 zynqmp_pm_ospi_mux_select(cqspi->pd_dev_id, PM_OSPI_MUX_SEL_LINEAR);
941 static int cqspi_write_setup(struct cqspi_flash_pdata *f_pdata,
942 const struct spi_mem_op *op)
946 struct cqspi_st *cqspi = f_pdata->cqspi;
947 void __iomem *reg_base = cqspi->iobase;
950 ret = cqspi_enable_dtr(f_pdata, op, CQSPI_REG_OP_EXT_WRITE_LSB,
956 opcode = op->cmd.opcode >> 8;
958 opcode = op->cmd.opcode;
961 reg = opcode << CQSPI_REG_WR_INSTR_OPCODE_LSB;
962 reg |= f_pdata->data_width << CQSPI_REG_WR_INSTR_TYPE_DATA_LSB;
963 reg |= f_pdata->addr_width << CQSPI_REG_WR_INSTR_TYPE_ADDR_LSB;
964 writel(reg, reg_base + CQSPI_REG_WR_INSTR);
965 reg = cqspi_calc_rdreg(f_pdata);
966 writel(reg, reg_base + CQSPI_REG_RD_INSTR);
969 * SPI NAND flashes require the address of the status register to be
970 * passed in the Read SR command. Also, some SPI NOR flashes like the
971 * cypress Semper flash expect a 4-byte dummy address in the Read SR
972 * command in DTR mode.
974 * But this controller does not support address phase in the Read SR
975 * command when doing auto-HW polling. So, disable write completion
976 * polling on the controller's side. spinand and spi-nor will take
977 * care of polling the status register.
979 if (cqspi->wr_completion) {
980 reg = readl(reg_base + CQSPI_REG_WR_COMPLETION_CTRL);
981 reg |= CQSPI_REG_WR_DISABLE_AUTO_POLL;
982 writel(reg, reg_base + CQSPI_REG_WR_COMPLETION_CTRL);
985 reg = readl(reg_base + CQSPI_REG_SIZE);
986 reg &= ~CQSPI_REG_SIZE_ADDRESS_MASK;
987 reg |= (op->addr.nbytes - 1);
988 writel(reg, reg_base + CQSPI_REG_SIZE);
992 static int cqspi_indirect_write_execute(struct cqspi_flash_pdata *f_pdata,
993 loff_t to_addr, const u8 *txbuf,
996 struct cqspi_st *cqspi = f_pdata->cqspi;
997 struct device *dev = &cqspi->pdev->dev;
998 void __iomem *reg_base = cqspi->iobase;
999 unsigned int remaining = n_tx;
1000 unsigned int write_bytes;
1003 writel(to_addr, reg_base + CQSPI_REG_INDIRECTWRSTARTADDR);
1004 writel(remaining, reg_base + CQSPI_REG_INDIRECTWRBYTES);
1006 /* Clear all interrupts. */
1007 writel(CQSPI_IRQ_STATUS_MASK, reg_base + CQSPI_REG_IRQSTATUS);
1009 writel(CQSPI_IRQ_MASK_WR, reg_base + CQSPI_REG_IRQMASK);
1011 reinit_completion(&cqspi->transfer_complete);
1012 writel(CQSPI_REG_INDIRECTWR_START_MASK,
1013 reg_base + CQSPI_REG_INDIRECTWR);
1015 * As per 66AK2G02 TRM SPRUHY8F section 11.15.5.3 Indirect Access
1016 * Controller programming sequence, couple of cycles of
1017 * QSPI_REF_CLK delay is required for the above bit to
1018 * be internally synchronized by the QSPI module. Provide 5
1021 if (cqspi->wr_delay)
1022 ndelay(cqspi->wr_delay);
1024 while (remaining > 0) {
1025 size_t write_words, mod_bytes;
1027 write_bytes = remaining;
1028 write_words = write_bytes / 4;
1029 mod_bytes = write_bytes % 4;
1030 /* Write 4 bytes at a time then single bytes. */
1032 iowrite32_rep(cqspi->ahb_base, txbuf, write_words);
1033 txbuf += (write_words * 4);
1036 unsigned int temp = 0xFFFFFFFF;
1038 memcpy(&temp, txbuf, mod_bytes);
1039 iowrite32(temp, cqspi->ahb_base);
1043 if (!wait_for_completion_timeout(&cqspi->transfer_complete,
1044 msecs_to_jiffies(CQSPI_TIMEOUT_MS))) {
1045 dev_err(dev, "Indirect write timeout\n");
1050 remaining -= write_bytes;
1053 reinit_completion(&cqspi->transfer_complete);
1056 /* Check indirect done status */
1057 ret = cqspi_wait_for_bit(reg_base + CQSPI_REG_INDIRECTWR,
1058 CQSPI_REG_INDIRECTWR_DONE_MASK, 0);
1060 dev_err(dev, "Indirect write completion error (%i)\n", ret);
1064 /* Disable interrupt. */
1065 writel(0, reg_base + CQSPI_REG_IRQMASK);
1067 /* Clear indirect completion status */
1068 writel(CQSPI_REG_INDIRECTWR_DONE_MASK, reg_base + CQSPI_REG_INDIRECTWR);
1070 cqspi_wait_idle(cqspi);
1075 /* Disable interrupt. */
1076 writel(0, reg_base + CQSPI_REG_IRQMASK);
1078 /* Cancel the indirect write */
1079 writel(CQSPI_REG_INDIRECTWR_CANCEL_MASK,
1080 reg_base + CQSPI_REG_INDIRECTWR);
1084 static void cqspi_chipselect(struct cqspi_flash_pdata *f_pdata)
1086 struct cqspi_st *cqspi = f_pdata->cqspi;
1087 void __iomem *reg_base = cqspi->iobase;
1088 unsigned int chip_select = f_pdata->cs;
1091 reg = readl(reg_base + CQSPI_REG_CONFIG);
1092 if (cqspi->is_decoded_cs) {
1093 reg |= CQSPI_REG_CONFIG_DECODE_MASK;
1095 reg &= ~CQSPI_REG_CONFIG_DECODE_MASK;
1097 /* Convert CS if without decoder.
1103 chip_select = 0xF & ~(1 << chip_select);
1106 reg &= ~(CQSPI_REG_CONFIG_CHIPSELECT_MASK
1107 << CQSPI_REG_CONFIG_CHIPSELECT_LSB);
1108 reg |= (chip_select & CQSPI_REG_CONFIG_CHIPSELECT_MASK)
1109 << CQSPI_REG_CONFIG_CHIPSELECT_LSB;
1110 writel(reg, reg_base + CQSPI_REG_CONFIG);
1113 static unsigned int calculate_ticks_for_ns(const unsigned int ref_clk_hz,
1114 const unsigned int ns_val)
1118 ticks = ref_clk_hz / 1000; /* kHz */
1119 ticks = DIV_ROUND_UP(ticks * ns_val, 1000000);
1124 static void cqspi_delay(struct cqspi_flash_pdata *f_pdata)
1126 struct cqspi_st *cqspi = f_pdata->cqspi;
1127 void __iomem *iobase = cqspi->iobase;
1128 const unsigned int ref_clk_hz = cqspi->master_ref_clk_hz;
1129 unsigned int tshsl, tchsh, tslch, tsd2d;
1133 /* calculate the number of ref ticks for one sclk tick */
1134 tsclk = DIV_ROUND_UP(ref_clk_hz, cqspi->sclk);
1136 tshsl = calculate_ticks_for_ns(ref_clk_hz, f_pdata->tshsl_ns);
1137 /* this particular value must be at least one sclk */
1141 tchsh = calculate_ticks_for_ns(ref_clk_hz, f_pdata->tchsh_ns);
1142 tslch = calculate_ticks_for_ns(ref_clk_hz, f_pdata->tslch_ns);
1143 tsd2d = calculate_ticks_for_ns(ref_clk_hz, f_pdata->tsd2d_ns);
1145 reg = (tshsl & CQSPI_REG_DELAY_TSHSL_MASK)
1146 << CQSPI_REG_DELAY_TSHSL_LSB;
1147 reg |= (tchsh & CQSPI_REG_DELAY_TCHSH_MASK)
1148 << CQSPI_REG_DELAY_TCHSH_LSB;
1149 reg |= (tslch & CQSPI_REG_DELAY_TSLCH_MASK)
1150 << CQSPI_REG_DELAY_TSLCH_LSB;
1151 reg |= (tsd2d & CQSPI_REG_DELAY_TSD2D_MASK)
1152 << CQSPI_REG_DELAY_TSD2D_LSB;
1153 writel(reg, iobase + CQSPI_REG_DELAY);
1156 static void cqspi_config_baudrate_div(struct cqspi_st *cqspi)
1158 const unsigned int ref_clk_hz = cqspi->master_ref_clk_hz;
1159 void __iomem *reg_base = cqspi->iobase;
1162 /* Recalculate the baudrate divisor based on QSPI specification. */
1163 div = DIV_ROUND_UP(ref_clk_hz, 2 * cqspi->sclk) - 1;
1165 reg = readl(reg_base + CQSPI_REG_CONFIG);
1166 reg &= ~(CQSPI_REG_CONFIG_BAUD_MASK << CQSPI_REG_CONFIG_BAUD_LSB);
1167 reg |= (div & CQSPI_REG_CONFIG_BAUD_MASK) << CQSPI_REG_CONFIG_BAUD_LSB;
1168 writel(reg, reg_base + CQSPI_REG_CONFIG);
1171 static void cqspi_readdata_capture(struct cqspi_st *cqspi,
1173 const unsigned int delay)
1175 void __iomem *reg_base = cqspi->iobase;
1178 reg = readl(reg_base + CQSPI_REG_READCAPTURE);
1181 reg |= (1 << CQSPI_REG_READCAPTURE_BYPASS_LSB);
1183 reg &= ~(1 << CQSPI_REG_READCAPTURE_BYPASS_LSB);
1185 reg &= ~(CQSPI_REG_READCAPTURE_DELAY_MASK
1186 << CQSPI_REG_READCAPTURE_DELAY_LSB);
1188 reg |= (delay & CQSPI_REG_READCAPTURE_DELAY_MASK)
1189 << CQSPI_REG_READCAPTURE_DELAY_LSB;
1191 writel(reg, reg_base + CQSPI_REG_READCAPTURE);
1194 static void cqspi_controller_enable(struct cqspi_st *cqspi, bool enable)
1196 void __iomem *reg_base = cqspi->iobase;
1199 reg = readl(reg_base + CQSPI_REG_CONFIG);
1202 reg |= CQSPI_REG_CONFIG_ENABLE_MASK;
1204 reg &= ~CQSPI_REG_CONFIG_ENABLE_MASK;
1206 writel(reg, reg_base + CQSPI_REG_CONFIG);
1209 static void cqspi_configure(struct cqspi_flash_pdata *f_pdata,
1212 struct cqspi_st *cqspi = f_pdata->cqspi;
1213 int switch_cs = (cqspi->current_cs != f_pdata->cs);
1214 int switch_ck = (cqspi->sclk != sclk);
1216 if (switch_cs || switch_ck)
1217 cqspi_controller_enable(cqspi, 0);
1219 /* Switch chip select. */
1221 cqspi->current_cs = f_pdata->cs;
1222 cqspi_chipselect(f_pdata);
1225 /* Setup baudrate divisor and delays */
1228 cqspi_config_baudrate_div(cqspi);
1229 cqspi_delay(f_pdata);
1230 cqspi_readdata_capture(cqspi, !cqspi->rclk_en,
1231 f_pdata->read_delay);
1234 if (switch_cs || switch_ck)
1235 cqspi_controller_enable(cqspi, 1);
1238 static ssize_t cqspi_write(struct cqspi_flash_pdata *f_pdata,
1239 const struct spi_mem_op *op)
1241 struct cqspi_st *cqspi = f_pdata->cqspi;
1242 loff_t to = op->addr.val;
1243 size_t len = op->data.nbytes;
1244 const u_char *buf = op->data.buf.out;
1247 ret = cqspi_set_protocol(f_pdata, op);
1251 ret = cqspi_write_setup(f_pdata, op);
1256 * Some flashes like the Cypress Semper flash expect a dummy 4-byte
1257 * address (all 0s) with the read status register command in DTR mode.
1258 * But this controller does not support sending dummy address bytes to
1259 * the flash when it is polling the write completion register in DTR
1260 * mode. So, we can not use direct mode when in DTR mode for writing
1263 if (!f_pdata->dtr && cqspi->use_direct_mode &&
1264 ((to + len) <= cqspi->ahb_size)) {
1265 memcpy_toio(cqspi->ahb_base + to, buf, len);
1266 return cqspi_wait_idle(cqspi);
1269 return cqspi_indirect_write_execute(f_pdata, to, buf, len);
1272 static void cqspi_rx_dma_callback(void *param)
1274 struct cqspi_st *cqspi = param;
1276 complete(&cqspi->rx_dma_complete);
1279 static int cqspi_direct_read_execute(struct cqspi_flash_pdata *f_pdata,
1280 u_char *buf, loff_t from, size_t len)
1282 struct cqspi_st *cqspi = f_pdata->cqspi;
1283 struct device *dev = &cqspi->pdev->dev;
1284 enum dma_ctrl_flags flags = DMA_CTRL_ACK | DMA_PREP_INTERRUPT;
1285 dma_addr_t dma_src = (dma_addr_t)cqspi->mmap_phys_base + from;
1287 struct dma_async_tx_descriptor *tx;
1288 dma_cookie_t cookie;
1290 struct device *ddev;
1292 if (!cqspi->rx_chan || !virt_addr_valid(buf)) {
1293 memcpy_fromio(buf, cqspi->ahb_base + from, len);
1297 ddev = cqspi->rx_chan->device->dev;
1298 dma_dst = dma_map_single(ddev, buf, len, DMA_FROM_DEVICE);
1299 if (dma_mapping_error(ddev, dma_dst)) {
1300 dev_err(dev, "dma mapping failed\n");
1303 tx = dmaengine_prep_dma_memcpy(cqspi->rx_chan, dma_dst, dma_src,
1306 dev_err(dev, "device_prep_dma_memcpy error\n");
1311 tx->callback = cqspi_rx_dma_callback;
1312 tx->callback_param = cqspi;
1313 cookie = tx->tx_submit(tx);
1314 reinit_completion(&cqspi->rx_dma_complete);
1316 ret = dma_submit_error(cookie);
1318 dev_err(dev, "dma_submit_error %d\n", cookie);
1323 dma_async_issue_pending(cqspi->rx_chan);
1324 if (!wait_for_completion_timeout(&cqspi->rx_dma_complete,
1325 msecs_to_jiffies(max_t(size_t, len, 500)))) {
1326 dmaengine_terminate_sync(cqspi->rx_chan);
1327 dev_err(dev, "DMA wait_for_completion_timeout\n");
1333 dma_unmap_single(ddev, dma_dst, len, DMA_FROM_DEVICE);
1338 static ssize_t cqspi_read(struct cqspi_flash_pdata *f_pdata,
1339 const struct spi_mem_op *op)
1341 struct cqspi_st *cqspi = f_pdata->cqspi;
1342 struct device *dev = &cqspi->pdev->dev;
1343 const struct cqspi_driver_platdata *ddata;
1344 loff_t from = op->addr.val;
1345 size_t len = op->data.nbytes;
1346 u_char *buf = op->data.buf.in;
1347 u64 dma_align = (u64)(uintptr_t)buf;
1350 ddata = of_device_get_match_data(dev);
1351 ret = cqspi_set_protocol(f_pdata, op);
1355 ret = cqspi_read_setup(f_pdata, op);
1359 if (cqspi->use_direct_mode && ((from + len) <= cqspi->ahb_size))
1360 return cqspi_direct_read_execute(f_pdata, buf, from, len);
1362 if (cqspi->use_dma_read && ddata && ddata->indirect_read_dma &&
1363 virt_addr_valid(buf) && ((dma_align & CQSPI_DMA_UNALIGN) == 0))
1364 return ddata->indirect_read_dma(f_pdata, buf, from, len);
1366 return cqspi_indirect_read_execute(f_pdata, buf, from, len);
1369 static int cqspi_mem_process(struct spi_mem *mem, const struct spi_mem_op *op)
1371 struct cqspi_st *cqspi = spi_master_get_devdata(mem->spi->master);
1372 struct cqspi_flash_pdata *f_pdata;
1374 f_pdata = &cqspi->f_pdata[mem->spi->chip_select];
1375 cqspi_configure(f_pdata, mem->spi->max_speed_hz);
1377 if (op->data.dir == SPI_MEM_DATA_IN && op->data.buf.in) {
1378 if (!op->addr.nbytes)
1379 return cqspi_command_read(f_pdata, op);
1381 return cqspi_read(f_pdata, op);
1384 if (!op->addr.nbytes || !op->data.buf.out)
1385 return cqspi_command_write(f_pdata, op);
1387 return cqspi_write(f_pdata, op);
1390 static int cqspi_exec_mem_op(struct spi_mem *mem, const struct spi_mem_op *op)
1394 ret = cqspi_mem_process(mem, op);
1396 dev_err(&mem->spi->dev, "operation failed with %d\n", ret);
1401 static bool cqspi_supports_mem_op(struct spi_mem *mem,
1402 const struct spi_mem_op *op)
1404 bool all_true, all_false;
1407 * op->dummy.dtr is required for converting nbytes into ncycles.
1408 * Also, don't check the dtr field of the op phase having zero nbytes.
1410 all_true = op->cmd.dtr &&
1411 (!op->addr.nbytes || op->addr.dtr) &&
1412 (!op->dummy.nbytes || op->dummy.dtr) &&
1413 (!op->data.nbytes || op->data.dtr);
1415 all_false = !op->cmd.dtr && !op->addr.dtr && !op->dummy.dtr &&
1419 /* Right now we only support 8-8-8 DTR mode. */
1420 if (op->cmd.nbytes && op->cmd.buswidth != 8)
1422 if (op->addr.nbytes && op->addr.buswidth != 8)
1424 if (op->data.nbytes && op->data.buswidth != 8)
1426 } else if (all_false) {
1427 /* Only 1-1-X ops are supported without DTR */
1428 if (op->cmd.nbytes && op->cmd.buswidth > 1)
1430 if (op->addr.nbytes && op->addr.buswidth > 1)
1433 /* Mixed DTR modes are not supported. */
1437 return spi_mem_default_supports_op(mem, op);
1440 static int cqspi_of_get_flash_pdata(struct platform_device *pdev,
1441 struct cqspi_flash_pdata *f_pdata,
1442 struct device_node *np)
1444 if (of_property_read_u32(np, "cdns,read-delay", &f_pdata->read_delay)) {
1445 dev_err(&pdev->dev, "couldn't determine read-delay\n");
1449 if (of_property_read_u32(np, "cdns,tshsl-ns", &f_pdata->tshsl_ns)) {
1450 dev_err(&pdev->dev, "couldn't determine tshsl-ns\n");
1454 if (of_property_read_u32(np, "cdns,tsd2d-ns", &f_pdata->tsd2d_ns)) {
1455 dev_err(&pdev->dev, "couldn't determine tsd2d-ns\n");
1459 if (of_property_read_u32(np, "cdns,tchsh-ns", &f_pdata->tchsh_ns)) {
1460 dev_err(&pdev->dev, "couldn't determine tchsh-ns\n");
1464 if (of_property_read_u32(np, "cdns,tslch-ns", &f_pdata->tslch_ns)) {
1465 dev_err(&pdev->dev, "couldn't determine tslch-ns\n");
1469 if (of_property_read_u32(np, "spi-max-frequency", &f_pdata->clk_rate)) {
1470 dev_err(&pdev->dev, "couldn't determine spi-max-frequency\n");
1477 static int cqspi_of_get_pdata(struct cqspi_st *cqspi)
1479 struct device *dev = &cqspi->pdev->dev;
1480 struct device_node *np = dev->of_node;
1483 cqspi->is_decoded_cs = of_property_read_bool(np, "cdns,is-decoded-cs");
1485 if (of_property_read_u32(np, "cdns,fifo-depth", &cqspi->fifo_depth)) {
1486 dev_err(dev, "couldn't determine fifo-depth\n");
1490 if (of_property_read_u32(np, "cdns,fifo-width", &cqspi->fifo_width)) {
1491 dev_err(dev, "couldn't determine fifo-width\n");
1495 if (of_property_read_u32(np, "cdns,trigger-address",
1496 &cqspi->trigger_address)) {
1497 dev_err(dev, "couldn't determine trigger-address\n");
1501 if (of_property_read_u32(np, "num-cs", &cqspi->num_chipselect))
1502 cqspi->num_chipselect = CQSPI_MAX_CHIPSELECT;
1504 cqspi->rclk_en = of_property_read_bool(np, "cdns,rclk-en");
1506 if (!of_property_read_u32_array(np, "power-domains", id,
1508 cqspi->pd_dev_id = id[1];
1513 static void cqspi_controller_init(struct cqspi_st *cqspi)
1517 cqspi_controller_enable(cqspi, 0);
1519 /* Configure the remap address register, no remap */
1520 writel(0, cqspi->iobase + CQSPI_REG_REMAP);
1522 /* Disable all interrupts. */
1523 writel(0, cqspi->iobase + CQSPI_REG_IRQMASK);
1525 /* Configure the SRAM split to 1:1 . */
1526 writel(cqspi->fifo_depth / 2, cqspi->iobase + CQSPI_REG_SRAMPARTITION);
1528 /* Load indirect trigger address. */
1529 writel(cqspi->trigger_address,
1530 cqspi->iobase + CQSPI_REG_INDIRECTTRIGGER);
1532 /* Program read watermark -- 1/2 of the FIFO. */
1533 writel(cqspi->fifo_depth * cqspi->fifo_width / 2,
1534 cqspi->iobase + CQSPI_REG_INDIRECTRDWATERMARK);
1535 /* Program write watermark -- 1/8 of the FIFO. */
1536 writel(cqspi->fifo_depth * cqspi->fifo_width / 8,
1537 cqspi->iobase + CQSPI_REG_INDIRECTWRWATERMARK);
1539 /* Disable direct access controller */
1540 if (!cqspi->use_direct_mode) {
1541 reg = readl(cqspi->iobase + CQSPI_REG_CONFIG);
1542 reg &= ~CQSPI_REG_CONFIG_ENB_DIR_ACC_CTRL;
1543 writel(reg, cqspi->iobase + CQSPI_REG_CONFIG);
1546 /* Enable DMA interface */
1547 if (cqspi->use_dma_read) {
1548 reg = readl(cqspi->iobase + CQSPI_REG_CONFIG);
1549 reg |= CQSPI_REG_CONFIG_DMA_MASK;
1550 writel(reg, cqspi->iobase + CQSPI_REG_CONFIG);
1553 cqspi_controller_enable(cqspi, 1);
1556 static int cqspi_request_mmap_dma(struct cqspi_st *cqspi)
1558 dma_cap_mask_t mask;
1561 dma_cap_set(DMA_MEMCPY, mask);
1563 cqspi->rx_chan = dma_request_chan_by_mask(&mask);
1564 if (IS_ERR(cqspi->rx_chan)) {
1565 int ret = PTR_ERR(cqspi->rx_chan);
1566 cqspi->rx_chan = NULL;
1567 return dev_err_probe(&cqspi->pdev->dev, ret, "No Rx DMA available\n");
1569 init_completion(&cqspi->rx_dma_complete);
1574 static const char *cqspi_get_name(struct spi_mem *mem)
1576 struct cqspi_st *cqspi = spi_master_get_devdata(mem->spi->master);
1577 struct device *dev = &cqspi->pdev->dev;
1579 return devm_kasprintf(dev, GFP_KERNEL, "%s.%d", dev_name(dev), mem->spi->chip_select);
1582 static const struct spi_controller_mem_ops cqspi_mem_ops = {
1583 .exec_op = cqspi_exec_mem_op,
1584 .get_name = cqspi_get_name,
1585 .supports_op = cqspi_supports_mem_op,
1588 static const struct spi_controller_mem_caps cqspi_mem_caps = {
1592 static int cqspi_setup_flash(struct cqspi_st *cqspi)
1594 struct platform_device *pdev = cqspi->pdev;
1595 struct device *dev = &pdev->dev;
1596 struct device_node *np = dev->of_node;
1597 struct cqspi_flash_pdata *f_pdata;
1601 /* Get flash device data */
1602 for_each_available_child_of_node(dev->of_node, np) {
1603 ret = of_property_read_u32(np, "reg", &cs);
1605 dev_err(dev, "Couldn't determine chip select.\n");
1610 if (cs >= CQSPI_MAX_CHIPSELECT) {
1611 dev_err(dev, "Chip select %d out of range.\n", cs);
1616 f_pdata = &cqspi->f_pdata[cs];
1617 f_pdata->cqspi = cqspi;
1620 ret = cqspi_of_get_flash_pdata(pdev, f_pdata, np);
1630 static int cqspi_probe(struct platform_device *pdev)
1632 const struct cqspi_driver_platdata *ddata;
1633 struct reset_control *rstc, *rstc_ocp;
1634 struct device *dev = &pdev->dev;
1635 struct spi_master *master;
1636 struct resource *res_ahb;
1637 struct cqspi_st *cqspi;
1638 struct resource *res;
1642 master = spi_alloc_master(&pdev->dev, sizeof(*cqspi));
1644 dev_err(&pdev->dev, "spi_alloc_master failed\n");
1647 master->mode_bits = SPI_RX_QUAD | SPI_RX_DUAL;
1648 master->mem_ops = &cqspi_mem_ops;
1649 master->mem_caps = &cqspi_mem_caps;
1650 master->dev.of_node = pdev->dev.of_node;
1652 cqspi = spi_master_get_devdata(master);
1655 platform_set_drvdata(pdev, cqspi);
1657 /* Obtain configuration from OF. */
1658 ret = cqspi_of_get_pdata(cqspi);
1660 dev_err(dev, "Cannot get mandatory OF data.\n");
1662 goto probe_master_put;
1665 /* Obtain QSPI clock. */
1666 cqspi->clk = devm_clk_get(dev, NULL);
1667 if (IS_ERR(cqspi->clk)) {
1668 dev_err(dev, "Cannot claim QSPI clock.\n");
1669 ret = PTR_ERR(cqspi->clk);
1670 goto probe_master_put;
1673 /* Obtain and remap controller address. */
1674 res = platform_get_resource(pdev, IORESOURCE_MEM, 0);
1675 cqspi->iobase = devm_ioremap_resource(dev, res);
1676 if (IS_ERR(cqspi->iobase)) {
1677 dev_err(dev, "Cannot remap controller address.\n");
1678 ret = PTR_ERR(cqspi->iobase);
1679 goto probe_master_put;
1682 /* Obtain and remap AHB address. */
1683 res_ahb = platform_get_resource(pdev, IORESOURCE_MEM, 1);
1684 cqspi->ahb_base = devm_ioremap_resource(dev, res_ahb);
1685 if (IS_ERR(cqspi->ahb_base)) {
1686 dev_err(dev, "Cannot remap AHB address.\n");
1687 ret = PTR_ERR(cqspi->ahb_base);
1688 goto probe_master_put;
1690 cqspi->mmap_phys_base = (dma_addr_t)res_ahb->start;
1691 cqspi->ahb_size = resource_size(res_ahb);
1693 init_completion(&cqspi->transfer_complete);
1695 /* Obtain IRQ line. */
1696 irq = platform_get_irq(pdev, 0);
1699 goto probe_master_put;
1702 pm_runtime_enable(dev);
1703 ret = pm_runtime_get_sync(dev);
1705 pm_runtime_put_noidle(dev);
1706 goto probe_master_put;
1709 ret = clk_prepare_enable(cqspi->clk);
1711 dev_err(dev, "Cannot enable QSPI clock.\n");
1712 goto probe_clk_failed;
1715 /* Obtain QSPI reset control */
1716 rstc = devm_reset_control_get_optional_exclusive(dev, "qspi");
1718 ret = PTR_ERR(rstc);
1719 dev_err(dev, "Cannot get QSPI reset.\n");
1720 goto probe_reset_failed;
1723 rstc_ocp = devm_reset_control_get_optional_exclusive(dev, "qspi-ocp");
1724 if (IS_ERR(rstc_ocp)) {
1725 ret = PTR_ERR(rstc_ocp);
1726 dev_err(dev, "Cannot get QSPI OCP reset.\n");
1727 goto probe_reset_failed;
1730 reset_control_assert(rstc);
1731 reset_control_deassert(rstc);
1733 reset_control_assert(rstc_ocp);
1734 reset_control_deassert(rstc_ocp);
1736 cqspi->master_ref_clk_hz = clk_get_rate(cqspi->clk);
1737 master->max_speed_hz = cqspi->master_ref_clk_hz;
1739 /* write completion is supported by default */
1740 cqspi->wr_completion = true;
1742 ddata = of_device_get_match_data(dev);
1744 if (ddata->quirks & CQSPI_NEEDS_WR_DELAY)
1745 cqspi->wr_delay = 50 * DIV_ROUND_UP(NSEC_PER_SEC,
1746 cqspi->master_ref_clk_hz);
1747 if (ddata->hwcaps_mask & CQSPI_SUPPORTS_OCTAL)
1748 master->mode_bits |= SPI_RX_OCTAL | SPI_TX_OCTAL;
1749 if (!(ddata->quirks & CQSPI_DISABLE_DAC_MODE))
1750 cqspi->use_direct_mode = true;
1751 if (ddata->quirks & CQSPI_SUPPORT_EXTERNAL_DMA)
1752 cqspi->use_dma_read = true;
1753 if (ddata->quirks & CQSPI_NO_SUPPORT_WR_COMPLETION)
1754 cqspi->wr_completion = false;
1756 if (of_device_is_compatible(pdev->dev.of_node,
1757 "xlnx,versal-ospi-1.0"))
1758 dma_set_mask(&pdev->dev, DMA_BIT_MASK(64));
1761 ret = devm_request_irq(dev, irq, cqspi_irq_handler, 0,
1764 dev_err(dev, "Cannot request IRQ.\n");
1765 goto probe_reset_failed;
1768 cqspi_wait_idle(cqspi);
1769 cqspi_controller_init(cqspi);
1770 cqspi->current_cs = -1;
1773 master->num_chipselect = cqspi->num_chipselect;
1775 ret = cqspi_setup_flash(cqspi);
1777 dev_err(dev, "failed to setup flash parameters %d\n", ret);
1778 goto probe_setup_failed;
1781 if (cqspi->use_direct_mode) {
1782 ret = cqspi_request_mmap_dma(cqspi);
1783 if (ret == -EPROBE_DEFER)
1784 goto probe_setup_failed;
1787 ret = devm_spi_register_master(dev, master);
1789 dev_err(&pdev->dev, "failed to register SPI ctlr %d\n", ret);
1790 goto probe_setup_failed;
1795 cqspi_controller_enable(cqspi, 0);
1797 clk_disable_unprepare(cqspi->clk);
1799 pm_runtime_put_sync(dev);
1800 pm_runtime_disable(dev);
1802 spi_master_put(master);
1806 static int cqspi_remove(struct platform_device *pdev)
1808 struct cqspi_st *cqspi = platform_get_drvdata(pdev);
1810 cqspi_controller_enable(cqspi, 0);
1813 dma_release_channel(cqspi->rx_chan);
1815 clk_disable_unprepare(cqspi->clk);
1817 pm_runtime_put_sync(&pdev->dev);
1818 pm_runtime_disable(&pdev->dev);
1823 #ifdef CONFIG_PM_SLEEP
1824 static int cqspi_suspend(struct device *dev)
1826 struct cqspi_st *cqspi = dev_get_drvdata(dev);
1828 cqspi_controller_enable(cqspi, 0);
1832 static int cqspi_resume(struct device *dev)
1834 struct cqspi_st *cqspi = dev_get_drvdata(dev);
1836 cqspi_controller_enable(cqspi, 1);
1840 static const struct dev_pm_ops cqspi__dev_pm_ops = {
1841 .suspend = cqspi_suspend,
1842 .resume = cqspi_resume,
1845 #define CQSPI_DEV_PM_OPS (&cqspi__dev_pm_ops)
1847 #define CQSPI_DEV_PM_OPS NULL
1850 static const struct cqspi_driver_platdata cdns_qspi = {
1851 .quirks = CQSPI_DISABLE_DAC_MODE,
1854 static const struct cqspi_driver_platdata k2g_qspi = {
1855 .quirks = CQSPI_NEEDS_WR_DELAY,
1858 static const struct cqspi_driver_platdata am654_ospi = {
1859 .hwcaps_mask = CQSPI_SUPPORTS_OCTAL,
1860 .quirks = CQSPI_NEEDS_WR_DELAY,
1863 static const struct cqspi_driver_platdata intel_lgm_qspi = {
1864 .quirks = CQSPI_DISABLE_DAC_MODE,
1867 static const struct cqspi_driver_platdata socfpga_qspi = {
1868 .quirks = CQSPI_NO_SUPPORT_WR_COMPLETION,
1871 static const struct cqspi_driver_platdata versal_ospi = {
1872 .hwcaps_mask = CQSPI_SUPPORTS_OCTAL,
1873 .quirks = CQSPI_DISABLE_DAC_MODE | CQSPI_SUPPORT_EXTERNAL_DMA,
1874 .indirect_read_dma = cqspi_versal_indirect_read_dma,
1875 .get_dma_status = cqspi_get_versal_dma_status,
1878 static const struct of_device_id cqspi_dt_ids[] = {
1880 .compatible = "cdns,qspi-nor",
1884 .compatible = "ti,k2g-qspi",
1888 .compatible = "ti,am654-ospi",
1889 .data = &am654_ospi,
1892 .compatible = "intel,lgm-qspi",
1893 .data = &intel_lgm_qspi,
1896 .compatible = "xlnx,versal-ospi-1.0",
1897 .data = (void *)&versal_ospi,
1900 .compatible = "intel,socfpga-qspi",
1901 .data = (void *)&socfpga_qspi,
1903 { /* end of table */ }
1906 MODULE_DEVICE_TABLE(of, cqspi_dt_ids);
1908 static struct platform_driver cqspi_platform_driver = {
1909 .probe = cqspi_probe,
1910 .remove = cqspi_remove,
1913 .pm = CQSPI_DEV_PM_OPS,
1914 .of_match_table = cqspi_dt_ids,
1918 module_platform_driver(cqspi_platform_driver);
1920 MODULE_DESCRIPTION("Cadence QSPI Controller Driver");
1921 MODULE_LICENSE("GPL v2");
1922 MODULE_ALIAS("platform:" CQSPI_NAME);
1923 MODULE_AUTHOR("Ley Foon Tan <lftan@altera.com>");
1924 MODULE_AUTHOR("Graham Moore <grmoore@opensource.altera.com>");
1925 MODULE_AUTHOR("Vadivel Murugan R <vadivel.muruganx.ramuthevar@intel.com>");
1926 MODULE_AUTHOR("Vignesh Raghavendra <vigneshr@ti.com>");
1927 MODULE_AUTHOR("Pratyush Yadav <p.yadav@ti.com>");