spi_flash: extend non-bitbanged flash support

This commit adds support for memory mapped writes
in the same configuration as memory mapped reads
are currently supported.

It also adds support for accessing registers
and erasing sectors in non-bitbanged single SPI
mode.
This commit is contained in:
Jakub Cebulski 2020-03-09 12:28:42 +01:00 committed by Mateusz Holenko
parent a344e20b5e
commit 00f973ea35
1 changed files with 135 additions and 49 deletions

View File

@ -2,6 +2,7 @@
# This file is Copyright (c) 2014-2018 Florent Kermarrec <florent@enjoy-digital.fr> # This file is Copyright (c) 2014-2018 Florent Kermarrec <florent@enjoy-digital.fr>
# This file is Copyright (c) 2013-2014 Robert Jordens <jordens@gmail.com> # This file is Copyright (c) 2013-2014 Robert Jordens <jordens@gmail.com>
# This file is Copyright (c) 2015-2014 Sebastien Bourdeauducq <sb@m-labs.hk> # This file is Copyright (c) 2015-2014 Sebastien Bourdeauducq <sb@m-labs.hk>
# This file is Copyright (c) 2020 Antmicro <www.antmicro.com>
# License: BSD # License: BSD
@ -18,16 +19,13 @@ from litex.soc.cores.spi import SPIMaster
# SpiFlash Quad/Dual/Single (memory-mapped) -------------------------------------------------------- # SpiFlash Quad/Dual/Single (memory-mapped) --------------------------------------------------------
_FAST_READ = 0x0b
_DIOFR = 0xbb
_QIOFR = 0xeb _QIOFR = 0xeb
_QIOPP = 0x12
def _format_cmd(cmd, spi_width): def _format_cmd(cmd, spi_width):
""" """
`cmd` is the read instruction. Since everything is transmitted on all `cmd` is the read instruction. Since everything is transmitted on all
dq lines (cmd, adr and data), extend/interleave cmd to full pads.dq dq lines (cmd, adr and data), we need to reformat cmd in single spi mode.
width even if dq1-dq3 are don't care during the command phase:
For example, for N25Q128, 0xeb is the quad i/o fast read, and For example, for N25Q128, 0xeb is the quad i/o fast read, and
extended to 4 bits (dq1,dq2,dq3 high) is: 0xfffefeff extended to 4 bits (dq1,dq2,dq3 high) is: 0xfffefeff
""" """
@ -37,6 +35,12 @@ def _format_cmd(cmd, spi_width):
c &= ~(1<<(b*spi_width)) c &= ~(1<<(b*spi_width))
return c return c
def accumulate_timeline_deltas(seq):
t, tseq = 0, []
for dt, a in seq:
tseq.append((t, a))
t += dt
return tseq
class SpiFlashCommon(Module): class SpiFlashCommon(Module):
def __init__(self, pads): def __init__(self, pads):
@ -85,6 +89,7 @@ class SpiFlashDualQuad(SpiFlashCommon, AutoCSR):
SpiFlashCommon.__init__(self, pads) SpiFlashCommon.__init__(self, pads)
self.bus = bus = wishbone.Interface() self.bus = bus = wishbone.Interface()
spi_width = len(pads.dq) spi_width = len(pads.dq)
max_transfer_size = 8*8
assert spi_width >= 2 assert spi_width >= 2
if with_bitbang: if with_bitbang:
@ -104,24 +109,31 @@ class SpiFlashDualQuad(SpiFlashCommon, AutoCSR):
self.miso = CSRStatus(description="Incoming value of MISO signal.") self.miso = CSRStatus(description="Incoming value of MISO signal.")
self.bitbang_en = CSRStorage(description="Write a ``1`` here to disable memory-mapped mode and enable bitbang mode.") self.bitbang_en = CSRStorage(description="Write a ``1`` here to disable memory-mapped mode and enable bitbang mode.")
# # # queue = self.queue = CSRStatus(4)
in_len = self.in_len = CSRStorage(4)
out_len = self.out_len = CSRStorage(4)
in_left = self.in_left = Signal(max=2**8)
out_left = self.out_left = Signal(max=2**8)
self.quad_transfer = Signal(reset=0)
spi_in = self.spi_in = CSRStorage(max_transfer_size)
spi_out = self.spi_out = CSRStatus(max_transfer_size)
cs_n = Signal(reset=1) cs_n = Signal(reset=1)
clk = Signal() clk = Signal()
dq_oe = Signal() dq_oe = Signal()
wbone_width = len(bus.dat_r) wbone_width = len(bus.dat_r)
cmd_width = 8
read_cmd_params = {
4: (_format_cmd(_QIOFR, 4), 4*8),
2: (_format_cmd(_DIOFR, 2), 2*8),
1: (_format_cmd(_FAST_READ, 1), 1*8)
}
read_cmd, cmd_width = read_cmd_params[spi_width]
addr_width = 24 addr_width = 24
dq = TSTriple(spi_width) dq = TSTriple(spi_width)
sr = Signal(max(cmd_width, addr_width, wbone_width))
if endianness == "big":
self.comb += bus.dat_r.eq(sr)
else:
self.comb += bus.dat_r.eq(reverse_bytes(sr))
self.specials.dq0 = Tristate(pads.dq[0], o=dq.o[0], i=dq.i[0], oe=dq.oe) self.specials.dq0 = Tristate(pads.dq[0], o=dq.o[0], i=dq.i[0], oe=dq.oe)
self.specials.dq1 = Tristate(pads.dq[1], o=dq.o[1], i=dq.i[1], oe=dq.oe) self.specials.dq1 = Tristate(pads.dq[1], o=dq.o[1], i=dq.i[1], oe=dq.oe)
if with_bitbang: if with_bitbang:
@ -132,18 +144,24 @@ class SpiFlashDualQuad(SpiFlashCommon, AutoCSR):
self.specials.dq2 = Tristate(pads.dq[2], o=dq.o[2], i=dq.i[2], oe=dq.oe) self.specials.dq2 = Tristate(pads.dq[2], o=dq.o[2], i=dq.i[2], oe=dq.oe)
self.specials.dq3 = Tristate(pads.dq[3], o=dq.o[3], i=dq.i[3], oe=dq.oe) self.specials.dq3 = Tristate(pads.dq[3], o=dq.o[3], i=dq.i[3], oe=dq.oe)
sr = Signal(max(cmd_width, addr_width, wbone_width)) sr = Signal(max(cmd_width, addr_width, wbone_width, max_transfer_size))
if endianness == "big":
self.comb += bus.dat_r.eq(sr)
else:
self.comb += bus.dat_r.eq(reverse_bytes(sr))
hw_read_logic = [ if endianness == "big":
self.comb += bus.dat_r.eq(sr[:wbone_width])
else:
self.comb += bus.dat_r.eq(reverse_bytes(sr[:wbone_width]))
hw_read_logic_single = [
pads.clk.eq(clk), pads.clk.eq(clk),
pads.cs_n.eq(cs_n), pads.cs_n.eq(cs_n),
dq.o.eq(sr[-spi_width:]), dq.o.eq(sr[-spi_width:]),
dq.oe.eq(dq_oe) dq.oe.eq(dq_oe)
] ]
hw_read_logic_quad = [
pads.clk.eq(clk),
pads.cs_n.eq(cs_n),
dq.o.eq(Cat(sr[-1:], Replicate(1, 3))),
dq.oe.eq(dq_oe)
]
if with_bitbang: if with_bitbang:
bitbang_logic = [ bitbang_logic = [
@ -170,19 +188,33 @@ class SpiFlashDualQuad(SpiFlashCommon, AutoCSR):
self.comb += [ self.comb += [
If(self.bitbang_en.storage, If(self.bitbang_en.storage,
bitbang_logic bitbang_logic
).Elif(self.quad_transfer,
hw_read_logic_single
).Else( ).Else(
hw_read_logic hw_read_logic_quad
) )
] ]
else: else:
self.comb += hw_read_logic self.comb += [
If(self.quad_transfer,
hw_read_logic_single
).Else(
hw_read_logic_quad
)
]
if div < 2: if div < 2:
raise ValueError("Unsupported value \'{}\' for div parameter for SpiFlash core".format(div)) raise ValueError("Unsupported value \'{}\' for div parameter for SpiFlash core".format(div))
else:
# spi is byte-addressed, prefix by zeros
z = Replicate(0, log2_int(wbone_width//8))
i = Signal(max=div) i = Signal(max=div)
dqi = Signal(spi_width) dqi = Signal(spi_width)
# SPI or memmap mode
self.mode = Signal()
self.sync += [ self.sync += [
If(i == div//2 - 1, If(i == div//2 - 1,
clk.eq(1), clk.eq(1),
@ -191,37 +223,91 @@ class SpiFlashDualQuad(SpiFlashCommon, AutoCSR):
If(i == div - 1, If(i == div - 1,
i.eq(0), i.eq(0),
clk.eq(0), clk.eq(0),
If(self.quad_transfer,
sr.eq(Cat(dqi, sr[:-spi_width])) sr.eq(Cat(dqi, sr[:-spi_width]))
).Else(
sr.eq(Cat(dqi[1], sr[:-1]))
)
).Else( ).Else(
i.eq(i + 1), i.eq(i + 1),
), ),
] ]
# spi is byte-addressed, prefix by zeros read_seq = [
z = Replicate(0, log2_int(wbone_width//8)) (4*cmd_width//spi_width*div,
[dq_oe.eq(1), cs_n.eq(0), sr[-cmd_width:].eq(_QIOFR), self.quad_transfer.eq(0)]),
seq = [
(cmd_width//spi_width*div,
[dq_oe.eq(1), cs_n.eq(0), sr[-cmd_width:].eq(read_cmd)]),
(addr_width//spi_width*div, (addr_width//spi_width*div,
[sr[-addr_width:].eq(Cat(z, bus.adr))]), [sr[-addr_width:].eq(Cat(z, bus.adr)), self.quad_transfer.eq(1)]),
((dummy + wbone_width//spi_width)*div, ((1+dummy + wbone_width//spi_width)*div,
[dq_oe.eq(0)]), [dq_oe.eq(0)]),
(1, (1,
[bus.ack.eq(1), cs_n.eq(1)]), [bus.ack.eq(1), cs_n.eq(1)]),
(div, # tSHSL! (div, # tSHSL!
[bus.ack.eq(0)]), [bus.ack.eq(0)]),
(0, (0,
[]), [queue.status[0].eq(0)]),
] ]
# accumulate timeline deltas
t, tseq = 0, []
for dt, a in seq:
tseq.append((t, a))
t += dt
self.sync += timeline(bus.cyc & bus.stb & (i == div - 1), tseq) write_seq = [
(4*cmd_width//spi_width*div,
[dq_oe.eq(1), cs_n.eq(0), sr[-cmd_width:].eq(_QIOPP), self.quad_transfer.eq(0)]),
(addr_width//spi_width*div,
[sr[-addr_width:].eq(Cat(z, bus.adr)), self.quad_transfer.eq(1)]),
((wbone_width//spi_width)*div,
[sr[-wbone_width:].eq(reverse_bytes(bus.dat_w))]),
(1,
[bus.ack.eq(1), cs_n.eq(1)]),
(div,
[bus.ack.eq(0)]),
(0,
[queue.status[1].eq(0)]),
]
# prepare spi transfer
self.sync += If(self.out_len.re & (self.out_len.storage != 0) & self.en_quad.storage[0],
self.out_left.eq(Cat(1, self.out_len.storage)
)
)
self.sync += If(self.out_len.re & (self.out_len.storage == 0),
self.out_left.eq(0)
)
self.sync += If(self.out_len.re & (self.out_len.storage != 0) & ~self.en_quad.storage[0],
self.out_left.eq(Cat(1, Replicate(0, 2), self.out_len.storage))
)
self.sync += If(self.in_len.re & (self.in_len.storage != 0) & ~self.en_quad.storage[0],
[queue.status[2].eq(1),
self.in_left.eq(Cat(Replicate(0, 3), in_len.storage)),
self.quad_transfer.eq(0)]
)
# write data to sr
self.sync += If(queue.status[2] & (i == div - 1) & ~self.en_quad.storage[0],
sr[-max_transfer_size:].eq(self.spi_in.storage), queue.status[2].eq(0), queue.status[3].eq(1), cs_n.eq(0), dq_oe.eq(1))
# count spi to slave transfer cycles
self.sync += If(queue.status[3] & (self.in_left > 0) & (i == div - 1), self.in_left.eq(self.in_left - 1), dq_oe.eq(1))
# count spi to master transfer cycles
self.sync += If(queue.status[3] & (self.in_left < 1) & (self.out_left > 0) & (i == div - 1), self.out_left.eq(self.out_left - 1), dq_oe.eq(0))
#end transmision and read data from sr
self.sync += If(~self.in_len.re & (in_left < 1) & (out_left < 1) & queue.status[3], queue.status[3].eq(0), cs_n.eq(1),
If(self.out_len.storage == 1, self.spi_out.status.eq(Cat(Replicate(0, 8*7), sr))
).Elif(self.out_len.storage == 2, self.spi_out.status.eq(Cat(Replicate(0, 8*6), sr))
).Elif(self.out_len.storage == 3, self.spi_out.status.eq(Cat(Replicate(0, 8*5), sr))
).Elif(self.out_len.storage == 4, self.spi_out.status.eq(Cat(Replicate(0, 8*4), sr))
).Elif(self.out_len.storage == 5, self.spi_out.status.eq(Cat(Replicate(0, 8*3), sr))
).Elif(self.out_len.storage == 6, self.spi_out.status.eq(Cat(Replicate(0, 8*2), sr))
).Elif(self.out_len.storage == 7, self.spi_out.status.eq(Cat(Replicate(0, 8*1), sr))
).Else(self.spi_out.status.eq(sr)))
# detect mem map access
self.sync += If(~self.mode & bus.cyc & bus.stb & ~bus.we, queue.status[0].eq(1))
self.sync += If(~self.mode & bus.cyc & bus.stb & bus.we, queue.status[1].eq(1))
self.sync += timeline(queue.status[0] & ~self.en_quad.storage[0] & (i == div - 1), accumulate_timeline_deltas(read_seq))
self.sync += timeline(queue.status[1] & ~self.en_quad.storage[0] & (i == div - 1), accumulate_timeline_deltas(write_seq))
class SpiFlashSingle(SpiFlashCommon, AutoCSR): class SpiFlashSingle(SpiFlashCommon, AutoCSR):