1 """ LOAD / STORE Computation Unit. Also capable of doing ADD and ADD immediate
3 This module runs a "revolving door" set of four latches, based on
7 * Go_Write *OR* Go_Store
9 (Note that opc_l has been inverted (and qn used), due to SRLatch
10 default reset state being "0" rather than "1")
12 Also note: the LD/ST Comp Unit can act as a *standard ALU* doing
15 Stores are activated when Go_Store is enabled, and uses the ALU
16 to add the immediate (imm_i) to the address (src1_i), and then
17 when ready (go_st_i and the ALU ready) the operand (src2_i) is stored
18 in the computed address.
21 from nmigen
.compat
.sim
import run_simulation
22 from nmigen
.cli
import verilog
, rtlil
23 from nmigen
import Module
, Signal
, Mux
, Cat
, Elaboratable
25 from nmutil
.latch
import SRLatch
, latchregister
27 from testmem
import TestMemory
29 # internal opcodes. hypothetically this could do more combinations.
31 # * bit 0: 0 = ADD , 1 = SUB
32 # * bit 1: 0 = src1, 1 = IMM
39 # convenience thingies.
# Pre-combined opcode values built from the bit fields described above.
LDST_OP_ADD = 0b0000   # plain ADD (src1 + src2) - use this ALU as an ADD
LDST_OP_SUB = 0b0001   # plain SUB (src1 - src2) - use this ALU as a SUB
LDST_OP_ADDI = 0b0010  # immed ADD (imm + src1)
# NOTE(review): the unit feeds src1 to alu.a and the immediate to alu.b;
# confirm the operand order of the subtraction against the ALU.
LDST_OP_SUBI = 0b0011  # immed SUB (imm - src1)
LDST_OP_ST = 0b0110    # immed ADD plus ST op.  ADD result is address
LDST_OP_LD = 0b1010    # immed ADD plus LD op.  ADD result is address
49 class LDSTCompUnit(Elaboratable
):
50 """ LOAD / STORE / ADD / SUB Computation Unit
55 * :rwid: register width
57 * :mem: a Memory Module (read-write capable)
62 * :oper_i: operation being carried out (LDST_OP_ADD, LDST_OP_LD)
63 * :issue_i: LD/ST is being "issued".
64 * :isalu_i: ADD/SUB is being "issued" (aka issue_alu_i)
65 * :shadown_i: Inverted-shadow is being held (stops STORE *and* WRITE)
66 * :go_rd_i: read is being actioned (latches in src regs)
67 * :go_wr_i: write mode (exactly like ALU CompUnit)
68 * :go_ad_i: address is being actioned (triggers actual mem LD)
69 * :go_st_i: store is being actioned (triggers actual mem STORE)
70 * :go_die_i: resets the unit back to "wait for issue"
75 * :busy_o: function unit is busy
76 * :rd_rel_o: request src1/src2
77 * :adr_rel_o: request address (from mem)
78 * :sto_rel_o: request store (to mem)
79 * :req_rel_o: request write (result)
80 * :load_mem_o: activate memory LOAD
81 * :stwd_mem_o: activate memory STORE
83 Note: load_mem_o, stwd_mem_o and req_rel_o MUST all be acknowledged
84 in a single cycle and the CompUnit set back to doing another op.
85 This means deasserting go_st_i, go_ad_i or go_wr_i as appropriate
86 depending on whether the operation is a STORE, LD, or a straight
87 ALU operation respectively.
91 * :data_o: Dest out (LD or ALU)
92 * :addr_o: Address out (LD or ST)
def __init__(self, rwid, opwid, alu, mem):
    """Store the configuration and declare every port of the unit.

    * :rwid:  register width: width of imm_i, src1_i, src2_i, data_o
              and addr_o
    * :opwid: width of the oper_i opcode input
    * :alu:   ALU instance; elaborate() adds it as a submodule and
              drives its a / b / op ports
    * :mem:   memory object; elaborate() uses its wrport and rdport
    """
    # elaborate() reads all four of these back from self, so they
    # have to be recorded here.
    self.rwid = rwid
    self.opwid = opwid
    self.alu = alu
    self.mem = mem

    self.counter = Signal(4)

    # control inputs
    self.go_rd_i = Signal(reset_less=True)  # go read in
    self.go_ad_i = Signal(reset_less=True)  # go address in
    self.go_wr_i = Signal(reset_less=True)  # go write in
    self.go_st_i = Signal(reset_less=True)  # go store in
    self.issue_i = Signal(reset_less=True)  # fn issue in
    self.isalu_i = Signal(reset_less=True)  # fn issue as ALU in
    self.shadown_i = Signal(reset=1)  # shadow function, defaults to ON
    self.go_die_i = Signal()  # go die (reset)

    # operand inputs
    self.oper_i = Signal(opwid, reset_less=True)  # opcode in
    self.imm_i = Signal(rwid, reset_less=True)  # immediate in
    self.src1_i = Signal(rwid, reset_less=True)  # oper1 in
    self.src2_i = Signal(rwid, reset_less=True)  # oper2 in

    # status / release outputs
    self.busy_o = Signal(reset_less=True)  # fn busy out
    self.rd_rel_o = Signal(reset_less=True)  # request src1/src2
    self.adr_rel_o = Signal(reset_less=True)  # request address (from mem)
    self.sto_rel_o = Signal(reset_less=True)  # request store (to mem)
    self.req_rel_o = Signal(reset_less=True)  # request write (result)

    # data outputs
    self.data_o = Signal(rwid, reset_less=True)  # Dest out (LD or ALU)
    self.addr_o = Signal(rwid, reset_less=True)  # Address out (LD or ST)

    # hmm... TODO... move these to outside of LDSTCompUnit?
    self.load_mem_o = Signal(reset_less=True)  # activate memory LOAD
    self.stwd_mem_o = Signal(reset_less=True)  # activate memory STORE
    self.ld_o = Signal(reset_less=True)  # operation is a LD
    self.st_o = Signal(reset_less=True)  # operation is a ST
def elaborate(self, platform):
    """Build the latch chain, ALU hookup and memory port wiring.

    Returns the Module, so that a subclass can extend it (see
    TestLDSTCompUnit.elaborate, which adds the memory as a submodule).
    """
    m = Module()
    comb = m.d.comb
    sync = m.d.sync

    m.submodules.alu = self.alu
    #m.submodules.mem = self.mem
    m.submodules.src_l = src_l = SRLatch(sync=False, name="src")
    m.submodules.opc_l = opc_l = SRLatch(sync=False, name="opc")
    m.submodules.adr_l = adr_l = SRLatch(sync=False, name="adr")
    m.submodules.req_l = req_l = SRLatch(sync=False, name="req")
    m.submodules.sto_l = sto_l = SRLatch(sync=False, name="sto")

    # per-latch reset terms: go_die_i resets every latch
    reset_b = Signal(reset_less=True)
    reset_w = Signal(reset_less=True)
    reset_a = Signal(reset_less=True)
    reset_s = Signal(reset_less=True)
    reset_r = Signal(reset_less=True)
    comb += reset_b.eq(self.go_st_i | self.go_wr_i |
                       self.go_ad_i | self.go_die_i)
    comb += reset_w.eq(self.go_wr_i | self.go_die_i)
    comb += reset_s.eq(self.go_st_i | self.go_die_i)
    comb += reset_r.eq(self.go_rd_i | self.go_die_i)
    # this one is slightly different, issue_alu_i selects go_wr_i)
    a_sel = Mux(self.isalu_i, self.go_wr_i, self.go_ad_i)
    comb += reset_a.eq(a_sel | self.go_die_i)

    # decoded opcode bits (driven further down from the latched opcode)
    op_alu = Signal(reset_less=True)
    op_is_ld = Signal(reset_less=True)
    op_is_st = Signal(reset_less=True)
    op_ldst = Signal(reset_less=True)
    op_is_imm = Signal(reset_less=True)

    # latched copy of src2_i: this is the data written to memory on a ST
    src2_r = Signal(self.rwid, reset_less=True)

    # select immediate or src2 reg to add
    src2_or_imm = Signal(self.rwid, reset_less=True)
    src_sel = Signal(reset_less=True)

    # issue can be either issue_i or issue_alu_i (isalu_i)
    issue_i = Signal(reset_less=True)
    comb += issue_i.eq(self.issue_i | self.isalu_i)

    # Ripple-down the latches, each one set cancels the previous.
    # NOTE: use sync to stop combinatorial loops.

    # opcode latch - inverted so that busy resets to 0
    sync += opc_l.s.eq(issue_i)  # XXX NOTE: INVERTED FROM book!
    sync += opc_l.r.eq(reset_b)  # XXX NOTE: INVERTED FROM book!

    # src operand latch
    sync += src_l.s.eq(issue_i)
    sync += src_l.r.eq(reset_r)

    # addr latch
    sync += adr_l.s.eq(self.go_rd_i)
    sync += adr_l.r.eq(reset_a)

    # dest operand latch
    sync += req_l.s.eq(self.go_ad_i | self.go_st_i)
    sync += req_l.r.eq(reset_w)

    # store latch
    sync += sto_l.s.eq(issue_i)  # XXX hmmm... |self.go_st_i)
    sync += sto_l.r.eq(reset_s)

    # outputs: busy and release signals
    busy_o = self.busy_o
    comb += self.busy_o.eq(opc_l.q)  # busy out
    comb += self.rd_rel_o.eq(src_l.q & busy_o)  # src1/src2 req rel
    comb += self.sto_rel_o.eq(sto_l.q & busy_o & self.shadown_i & op_is_st)

    # request release enabled based on if op is a LD/ST or a plain ALU
    # if op is an ADD/SUB or a LD, req_rel activates.
    wr_q = Signal(reset_less=True)
    comb += wr_q.eq(req_l.q & (~op_ldst | op_is_ld))

    # ALU output is captured on adr_rel_o for LD/ST, req_rel_o otherwise
    alulatch = Signal(reset_less=True)
    comb += alulatch.eq((op_ldst & self.adr_rel_o) |
                        (~op_ldst & self.req_rel_o))

    # select immediate if opcode says so.  however also change the latch
    # to trigger *from* the opcode latch instead.
    comb += src_sel.eq(Mux(op_is_imm, opc_l.qn, src_l.q))
    comb += src2_or_imm.eq(Mux(op_is_imm, self.imm_i, self.src2_i))

    # create a latch/register for src1/src2 (include immediate select)
    latchregister(m, self.src1_i, self.alu.a, src_l.q, name="src1_r")
    latchregister(m, self.src2_i, src2_r, src_l.q, name="src2_r")
    latchregister(m, src2_or_imm, self.alu.b, src_sel, name="imm_r")

    # create a latch/register for the operand
    oper_r = Signal(self.opwid, reset_less=True)  # Dest register
    latchregister(m, self.oper_i, oper_r, self.issue_i, name="operi_r")
    alu_op = Cat(op_alu, 0, op_is_imm)  # using alu_hier, here.
    comb += self.alu.op.eq(alu_op)

    # and one for the output from the ALU
    data_r = Signal(self.rwid, reset_less=True)  # Dest register
    latchregister(m, self.alu.o, data_r, alulatch, "aluo_r")

    # decode bits of operand (latched)
    comb += op_alu.eq(oper_r[BIT0_ADD])  # ADD/SUB
    comb += op_is_imm.eq(oper_r[BIT1_SRC])  # IMMED/reg
    comb += op_is_st.eq(oper_r[BIT2_ST])  # OP is ST
    comb += op_is_ld.eq(oper_r[BIT3_LD])  # OP is LD
    comb += op_ldst.eq(op_is_ld | op_is_st)
    comb += self.load_mem_o.eq(op_is_ld & self.go_ad_i)
    comb += self.stwd_mem_o.eq(op_is_st & self.go_st_i)
    comb += self.ld_o.eq(op_is_ld)
    comb += self.st_o.eq(op_is_st)

    # on a go_read, tell the ALU we're accepting data.
    # NOTE: this spells TROUBLE if the ALU isn't ready!
    # go_read is only valid for one clock!
    with m.If(self.go_rd_i):  # src operands ready, GO!
        with m.If(~self.alu.p_ready_o):  # no ACK yet
            m.d.comb += self.alu.p_valid_i.eq(1)  # so indicate valid

    # only proceed if ALU says its output is valid
    with m.If(self.alu.n_valid_o):
        # write req release out.  waits until shadow is dropped.
        comb += self.req_rel_o.eq(wr_q & busy_o & self.shadown_i)
        # address release only happens on LD/ST, and is shadowed.
        # NOTE(review): the final shadown_i term is restored from the
        # "is shadowed" wording above and the req_rel_o line - confirm.
        comb += self.adr_rel_o.eq(adr_l.q & op_ldst & busy_o &
                                  self.shadown_i)

        # when output latch is ready, and ALU says ready, accept ALU output
        # (req_rel_o can only be high while n_valid_o is, so nesting this
        # test here is equivalent to testing it at the top level)
        with m.If(self.req_rel_o):
            m.d.comb += self.alu.n_ready_i.eq(1)  # tells ALU "thanks got it"

    # put the register directly onto the output bus on a go_write
    # this is "ALU mode".  go_wr_i *must* be deasserted on next clock
    with m.If(self.go_wr_i):
        comb += self.data_o.eq(data_r)

    # "LD/ST" mode: put the register directly onto the *address* bus
    with m.If(self.go_ad_i | self.go_st_i):
        comb += self.addr_o.eq(data_r)

    # TODO: think about moving these to another module

    # connect ST to memory.  NOTE: unit *must* be set back
    # to start again by dropping go_st_i on next clock
    with m.If(self.stwd_mem_o):
        wrport = self.mem.wrport
        comb += wrport.addr.eq(self.addr_o)
        comb += wrport.data.eq(src2_r)
        comb += wrport.en.eq(1)

    # connect LD to memory.  NOTE: unit *must* be set back
    # to start again by dropping go_ad_i on next clock
    with m.If(self.load_mem_o):
        rdport = self.mem.rdport
        comb += rdport.addr.eq(self.addr_o)
        comb += self.data_o.eq(rdport.data)
        # comb += rdport.en.eq(1) # only when transparent=False

    return m
309 yield self
.load_mem_o
310 yield self
.stwd_mem_o
317 print ("wait for", sig
, v
)
def store(dut, src1, src2, imm):
    """Simulation process: push one ST operation through the unit.

    * :dut:  the unit under test
    * :src1: value driven onto src1_i
    * :src2: value driven onto src2_i
    * :imm:  value driven onto imm_i

    Intended to be used with "yield from" inside a simulation process.
    A bare "yield" lets the simulation advance by one clock, so that a
    value set on the previous line is actually seen by the unit.
    """
    yield dut.oper_i.eq(LDST_OP_ST)
    yield dut.src1_i.eq(src1)
    yield dut.src2_i.eq(src2)
    yield dut.imm_i.eq(imm)

    # hold issue_i for a clock: setting and clearing it back-to-back
    # would leave nothing for the unit to sample
    yield dut.issue_i.eq(1)
    yield
    yield dut.issue_i.eq(0)
    yield

    yield dut.go_rd_i.eq(1)
    yield from wait_for(dut.rd_rel_o)
    yield dut.go_rd_i.eq(0)
    yield from wait_for(dut.adr_rel_o)
    yield dut.go_st_i.eq(1)
    yield from wait_for(dut.sto_rel_o)
    # wait_for is a generator: it only runs when delegated to
    yield from wait_for(dut.stwd_mem_o)
    yield dut.go_st_i.eq(0)
    yield
def load(dut, src1, src2, imm):
    """Simulation process: push one LD operation through the unit.

    * :dut:  the unit under test
    * :src1: value driven onto src1_i
    * :src2: value driven onto src2_i
    * :imm:  value driven onto imm_i

    Returns the value sampled from data_o, so that a caller can write
    "data = yield from load(...)".
    """
    yield dut.oper_i.eq(LDST_OP_LD)
    yield dut.src1_i.eq(src1)
    yield dut.src2_i.eq(src2)
    yield dut.imm_i.eq(imm)

    # hold issue_i for a clock: setting and clearing it back-to-back
    # would leave nothing for the unit to sample
    yield dut.issue_i.eq(1)
    yield
    yield dut.issue_i.eq(0)
    yield

    yield dut.go_rd_i.eq(1)
    yield from wait_for(dut.rd_rel_o)
    yield dut.go_rd_i.eq(0)
    yield from wait_for(dut.adr_rel_o)
    yield dut.go_ad_i.eq(1)
    yield from wait_for(dut.busy_o)
    # presumably the memory read needs a clock with go_ad_i asserted
    # before data_o is meaningful - TODO confirm against the memory model
    yield
    data = (yield dut.data_o)
    yield dut.go_ad_i.eq(0)
    yield
    return data
def scoreboard_sim(dut):
    """Simulation process: two stores, then read both back and check.

    Every operation uses an immediate of 2.  The loads reuse the src1
    values of the stores and must return the stored src2 values.
    """
    # (src1, src2) for each store
    for base, value in ((4, 3), (2, 9)):
        yield from store(dut, base, value, 2)

    # (src1, expected data) for each load
    for base, expected in ((4, 0x0003), (2, 0x0009)):
        data = yield from load(dut, base, 0, 2)
        assert data == expected
class TestLDSTCompUnit(LDSTCompUnit):
    """LDSTCompUnit that creates its own ALU and TestMemory."""

    def __init__(self, rwid, opwid):
        """Create the ALU and memory, then initialise the base unit.

        * :rwid:  register width, passed to the ALU, the memory and
                  the base class
        * :opwid: opcode width, passed to the base class
        """
        from alu_hier import ALU
        self.alu = alu = ALU(rwid)
        self.mem = mem = TestMemory(rwid, 8)
        LDSTCompUnit.__init__(self, rwid, opwid, alu, mem)

    def elaborate(self, platform):
        """Elaborate the base unit and add the memory as a submodule."""
        m = LDSTCompUnit.elaborate(self, platform)
        m.submodules.mem = self.mem
        # elaborate() has to hand the module back to its caller
        return m
def test_scoreboard():
    """Write the unit out as RTLIL, then run the scoreboard simulation.

    Writes "test_ldst_comp.il" and passes 'test_ldst_comp.vcd' to
    run_simulation as the VCD name.
    """
    dut = TestLDSTCompUnit(16, 4)
    vl = rtlil.convert(dut, ports=dut.ports())
    with open("test_ldst_comp.il", "w") as f:
        # the converted text has to be written, otherwise the file is
        # created empty
        f.write(vl)

    run_simulation(dut, scoreboard_sim(dut), vcd_name='test_ldst_comp.vcd')
400 if __name__
== '__main__':