Parameterize the issuer on the number of operands and results
[soc.git] / src / soc / experiment / test / test_compalu_multi.py
1 """Computation Unit (aka "ALU Manager").
2
3 Manages a Pipeline or FSM, ensuring that the start and end time are 100%
4 monitored. At no time may the ALU proceed without this module notifying
5 the Dependency Matrices. At no time is a result production "abandoned".
6 This module blocks (indicates busy) starting from when it first receives
7 an opcode until it receives notification that
8 its result(s) have been successfully stored in the regfile(s)
9
10 Documented at http://libre-soc.org/3d_gpu/architecture/compunit
11 """
12
13 from soc.experiment.alu_fsm import Shifter, CompFSMOpSubset
14 from soc.fu.alu.alu_input_record import CompALUOpSubset
15 from soc.experiment.alu_hier import ALU, DummyALU
16 from soc.experiment.compalu_multi import MultiCompUnit
17 from soc.decoder.power_enums import MicrOp
18 from nmutil.gtkw import write_gtkw
19 from nmigen import Module, Signal
20 from nmigen.cli import rtlil
21
22 # NOTE: to use cxxsim, export NMIGEN_SIM_MODE=cxxsim from the shell
23 # Also, check out the cxxsim nmigen branch, and latest yosys from git
24 from nmutil.sim_tmp_alternative import (Simulator, Settle, is_engine_pysim,
25 Passive)
26
27
28 def wrap(process):
29 def wrapper():
30 yield from process
31 return wrapper
32
33
34 class OperandProducer:
35 """
36 Produces an operand when requested by the Computation Unit
37 (`dut` parameter), using the `rel_o` / `go_i` handshake.
38
39 Attaches itself to the `dut` operand indexed by `op_index`.
40
41 Has a programmable delay between the assertion of `rel_o` and the
42 `go_i` pulse.
43
44 Data is presented only during the cycle in which `go_i` is active.
45
46 It adds itself as a passive process to the simulation (`sim` parameter).
47 Since it is passive, it will not hang the simulation, and does not need a
48 flag to terminate itself.
49 """
50 def __init__(self, sim, dut, op_index):
51 self.count = Signal(8, name=f"src{op_index + 1}_count")
52 """ transaction counter"""
53 # data and handshake signals from the DUT
54 self.port = dut.src_i[op_index]
55 self.go_i = dut.rd.go_i[op_index]
56 self.rel_o = dut.rd.rel_o[op_index]
57 # transaction parameters, passed via signals
58 self.delay = Signal(8)
59 self.data = Signal.like(self.port)
60 # add ourselves to the simulation process list
61 sim.add_sync_process(self._process)
62
63 def _process(self):
64 yield Passive()
65 while True:
66 # Settle() is needed to give a quick response to
67 # the zero delay case
68 yield Settle()
69 # wait for rel_o to become active
70 while not (yield self.rel_o):
71 yield
72 yield Settle()
73 # read the transaction parameters
74 delay = (yield self.delay)
75 data = (yield self.data)
76 # wait for `delay` cycles
77 for _ in range(delay):
78 yield
79 # activate go_i and present data, for one cycle
80 yield self.go_i.eq(1)
81 yield self.port.eq(data)
82 yield self.count.eq(self.count + 1)
83 yield
84 yield self.go_i.eq(0)
85 yield self.port.eq(0)
86
87 def send(self, data, delay):
88 """
89 Schedules the module to send some `data`, counting `delay` cycles after
90 `rel_i` becomes active.
91
92 To be called from the main test-bench process,
93 it returns in the same cycle.
94
95 Communication with the worker process is done by means of
96 combinatorial simulation-only signals.
97
98 """
99 yield self.data.eq(data)
100 yield self.delay.eq(delay)
101
102
103 class ResultConsumer:
104 """
105 Consumes a result when requested by the Computation Unit
106 (`dut` parameter), using the `rel_o` / `go_i` handshake.
107
108 Attaches itself to the `dut` result indexed by `op_index`.
109
110 Has a programmable delay between the assertion of `rel_o` and the
111 `go_i` pulse.
112
113 Data is retrieved only during the cycle in which `go_i` is active.
114
115 It adds itself as a passive process to the simulation (`sim` parameter).
116 Since it is passive, it will not hang the simulation, and does not need a
117 flag to terminate itself.
118 """
119 def __init__(self, sim, dut, op_index):
120 self.count = Signal(8, name=f"dest{op_index + 1}_count")
121 """ transaction counter"""
122 # data and handshake signals from the DUT
123 self.port = dut.dest[op_index]
124 self.go_i = dut.wr.go_i[op_index]
125 self.rel_o = dut.wr.rel_o[op_index]
126 # transaction parameters, passed via signals
127 self.delay = Signal(8)
128 self.expected = Signal.like(self.port)
129 # add ourselves to the simulation process list
130 sim.add_sync_process(self._process)
131
132 def _process(self):
133 yield Passive()
134 while True:
135 # Settle() is needed to give a quick response to
136 # the zero delay case
137 yield Settle()
138 # wait for rel_o to become active
139 while not (yield self.rel_o):
140 yield
141 yield Settle()
142 # read the transaction parameters
143 delay = (yield self.delay)
144 expected = (yield self.expected)
145 # wait for `delay` cycles
146 for _ in range(delay):
147 yield
148 # activate go_i for one cycle
149 yield self.go_i.eq(1)
150 yield self.count.eq(self.count + 1)
151 yield
152 # check received data against the expected value
153 result = (yield self.port)
154 assert result == expected,\
155 f"expected {expected}, received {result}"
156 yield self.go_i.eq(0)
157 yield self.port.eq(0)
158
159 def receive(self, expected, delay):
160 """
161 Schedules the module to receive some result,
162 counting `delay` cycles after `rel_i` becomes active.
163 As 'go_i' goes active, check the result with `expected`.
164
165 To be called from the main test-bench process,
166 it returns in the same cycle.
167
168 Communication with the worker process is done by means of
169 combinatorial simulation-only signals.
170 """
171 yield self.expected.eq(expected)
172 yield self.delay.eq(delay)
173
174
175 def op_sim(dut, a, b, op, inv_a=0, imm=0, imm_ok=0, zero_a=0):
176 yield dut.issue_i.eq(0)
177 yield
178 yield dut.src_i[0].eq(a)
179 yield dut.src_i[1].eq(b)
180 yield dut.oper_i.insn_type.eq(op)
181 yield dut.oper_i.invert_in.eq(inv_a)
182 yield dut.oper_i.imm_data.data.eq(imm)
183 yield dut.oper_i.imm_data.ok.eq(imm_ok)
184 yield dut.oper_i.zero_a.eq(zero_a)
185 yield dut.issue_i.eq(1)
186 yield
187 yield dut.issue_i.eq(0)
188 yield
189 if not imm_ok or not zero_a:
190 yield dut.rd.go_i.eq(0b11)
191 while True:
192 yield
193 rd_rel_o = yield dut.rd.rel_o
194 print("rd_rel", rd_rel_o)
195 if rd_rel_o:
196 break
197 yield dut.rd.go_i.eq(0)
198 else:
199 print("no go rd")
200
201 if len(dut.src_i) == 3:
202 yield dut.rd.go_i.eq(0b100)
203 while True:
204 yield
205 rd_rel_o = yield dut.rd.rel_o
206 print("rd_rel", rd_rel_o)
207 if rd_rel_o:
208 break
209 yield dut.rd.go_i.eq(0)
210 else:
211 print("no 3rd rd")
212
213 req_rel_o = yield dut.wr.rel_o
214 result = yield dut.data_o
215 print("req_rel", req_rel_o, result)
216 while True:
217 req_rel_o = yield dut.wr.rel_o
218 result = yield dut.data_o
219 print("req_rel", req_rel_o, result)
220 if req_rel_o:
221 break
222 yield
223 yield dut.wr.go_i[0].eq(1)
224 yield Settle()
225 result = yield dut.data_o
226 yield
227 print("result", result)
228 yield dut.wr.go_i[0].eq(0)
229 yield
230 return result
231
232
233 def scoreboard_sim_fsm(dut, producers, consumers):
234
235 # stores the operation count
236 op_count = 0
237
238 def op_sim_fsm(a, b, direction, expected, delays):
239 print("op_sim_fsm", a, b, direction, expected)
240 yield dut.issue_i.eq(0)
241 yield
242 # forward data and delays to the producers and consumers
243 yield from producers[0].send(a, delays[0])
244 yield from producers[1].send(b, delays[1])
245 yield from consumers[0].receive(expected, delays[2])
246 # submit operation, and assert issue_i for one cycle
247 yield dut.oper_i.sdir.eq(direction)
248 yield dut.issue_i.eq(1)
249 yield
250 yield dut.issue_i.eq(0)
251 # wait for busy to be negated
252 yield Settle()
253 while (yield dut.busy_o):
254 yield
255 yield Settle()
256 # update the operation count
257 nonlocal op_count
258 op_count = (op_count + 1) & 255
259 # check that producers and consumers have the same count
260 # this assures that no data was left unused or was lost
261 assert (yield producers[0].count) == op_count
262 assert (yield producers[1].count) == op_count
263 assert (yield consumers[0].count) == op_count
264
265 # 13 >> 2 = 3
266 # operand 1 arrives immediately
267 # operand 2 arrives after operand 1
268 # write data is accepted immediately
269 yield from op_sim_fsm(13, 2, 1, 3, [0, 2, 0])
270 # 3 << 4 = 48
271 # operand 2 arrives immediately
272 # operand 1 arrives after operand 2
273 # write data is accepted after some delay
274 yield from op_sim_fsm(3, 4, 0, 48, [2, 0, 2])
275 # 21 << 0 = 21
276 # operands 1 and 2 arrive at the same time
277 # write data is accepted after some delay
278 yield from op_sim_fsm(21, 0, 0, 21, [1, 1, 1])
279
280
281 def scoreboard_sim_dummy(dut):
282 result = yield from op_sim(dut, 5, 2, MicrOp.OP_NOP, inv_a=0,
283 imm=8, imm_ok=1)
284 assert result == 5, result
285
286 result = yield from op_sim(dut, 9, 2, MicrOp.OP_NOP, inv_a=0,
287 imm=8, imm_ok=1)
288 assert result == 9, result
289
290
291 class OpSim:
292 """ALU Operation issuer
293
294 Issues operations to the DUT"""
295 def __init__(self, dut, sim):
296 self.op_count = 0
297 self.zero_a_count = 0
298 self.imm_ok_count = 0
299 self.dut = dut
300 # create one operand producer for each input port
301 self.producers = list()
302 for i in range(len(dut.src_i)):
303 self.producers.append(OperandProducer(sim, dut, i))
304 # create one result consumer for each output port
305 self.consumers = list()
306 for i in range(len(dut.dest)):
307 self.consumers.append(ResultConsumer(sim, dut, i))
308 def issue(self, src_i, op, expected, src_delays, dest_delays,
309 inv_a=0, imm=0, imm_ok=0, zero_a=0):
310 """Executes the issue operation"""
311 dut = self.dut
312 producers = self.producers
313 consumers = self.consumers
314 yield dut.issue_i.eq(0)
315 yield
316 # forward data and delays to the producers and consumers
317 # first, send special cases (with zero_a and/or imm_ok)
318 if not zero_a:
319 yield from producers[0].send(src_i[0], src_delays[0])
320 if not imm_ok:
321 yield from producers[1].send(src_i[1], src_delays[1])
322 # then, send the rest (if any)
323 for i in range(2, len(producers)):
324 yield from producers[i].send(src_i[i], src_delays[i])
325 for i in range(len(consumers)):
326 yield from consumers[i].receive(expected, dest_delays[i])
327 # submit operation, and assert issue_i for one cycle
328 yield dut.oper_i.insn_type.eq(op)
329 yield dut.oper_i.invert_in.eq(inv_a)
330 yield dut.oper_i.imm_data.data.eq(imm)
331 yield dut.oper_i.imm_data.ok.eq(imm_ok)
332 yield dut.oper_i.zero_a.eq(zero_a)
333 yield dut.issue_i.eq(1)
334 yield
335 yield dut.issue_i.eq(0)
336 # wait for busy to be negated
337 yield Settle()
338 while (yield dut.busy_o):
339 yield
340 yield Settle()
341 # update the operation count
342 self.op_count = (self.op_count + 1) & 255
343 # On zero_a and imm_ok executions, the producer counters will fall
344 # behind. But, by summing the following counts, the invariant is
345 # preserved.
346 if zero_a:
347 self.zero_a_count = self.zero_a_count + 1
348 if imm_ok:
349 self.imm_ok_count = self.imm_ok_count + 1
350 # check that producers and consumers have the same count
351 # this assures that no data was left unused or was lost
352 # first, check special cases (zero_a and imm_ok)
353 assert (yield producers[0].count) + self.zero_a_count == self.op_count
354 assert (yield producers[1].count) + self.imm_ok_count == self.op_count
355 # then, check the rest (if any)
356 for i in range(2, len(producers)):
357 assert (yield producers[i].count) == self.op_count
358 for i in range(len(consumers)):
359 assert (yield consumers[i].count) == self.op_count
360
361
362 def scoreboard_sim(op):
363 # zero (no) input operands test
364 # 0 + 8 = 8
365 yield from op.issue([5, 2], MicrOp.OP_ADD,
366 zero_a=1, imm=8, imm_ok=1,
367 expected=8,
368 src_delays=[0, 2], dest_delays=[0])
369 # 5 + 8 = 13
370 yield from op.issue([5, 2], MicrOp.OP_ADD,
371 inv_a=0, imm=8, imm_ok=1,
372 expected=13,
373 src_delays=[2, 0], dest_delays=[2])
374 # 5 + 2 = 7
375 yield from op.issue([5, 2], MicrOp.OP_ADD,
376 expected=7,
377 src_delays=[1, 1], dest_delays=[1])
378 # (-6) + 2 = (-4)
379 yield from op.issue([5, 2], MicrOp.OP_ADD, inv_a=1,
380 expected=65532,
381 src_delays=[1, 2], dest_delays=[0])
382 # 0 + 2 = 2
383 yield from op.issue([5, 2], MicrOp.OP_ADD, zero_a=1,
384 expected=2,
385 src_delays=[2, 0], dest_delays=[1])
386
387 # test combinatorial zero-delay operation
388 # In the test ALU, any operation other than ADD, MUL or SHR
389 # is zero-delay, and do a subtraction.
390 yield from op.issue([5, 2], MicrOp.OP_NOP,
391 expected=3,
392 src_delays=[0, 1], dest_delays=[2])
393
394
395 def test_compunit_fsm():
396 top = "top.cu" if is_engine_pysim() else "cu"
397 style = {
398 'in': {'color': 'orange'},
399 'out': {'color': 'yellow'},
400 }
401 traces = [
402 'clk',
403 ('operation port', {'color': 'red'}, [
404 'cu_issue_i', 'cu_busy_o',
405 {'comment': 'operation'},
406 'oper_i_None__sdir']),
407 ('operand 1 port', 'in', [
408 ('cu_rd__rel_o[1:0]', {'bit': 1}),
409 ('cu_rd__go_i[1:0]', {'bit': 1}),
410 'src1_i[7:0]']),
411 ('operand 2 port', 'in', [
412 ('cu_rd__rel_o[1:0]', {'bit': 0}),
413 ('cu_rd__go_i[1:0]', {'bit': 0}),
414 'src2_i[7:0]']),
415 ('result port', 'out', [
416 'cu_wr__rel_o', 'cu_wr__go_i', 'dest1_o[7:0]']),
417 ('alu', {'module': top+'.alu'}, [
418 ('prev port', 'in', [
419 'op__sdir', 'p_data_i[7:0]', 'p_shift_i[7:0]',
420 'p_valid_i', 'p_ready_o']),
421 ('next port', 'out', [
422 'n_data_o[7:0]', 'n_valid_o', 'n_ready_i']),
423 ]),
424 ('debug', {'module': 'top'},
425 ['src1_count[7:0]', 'src2_count[7:0]', 'dest1_count[7:0]'])
426
427 ]
428 write_gtkw(
429 "test_compunit_fsm1.gtkw",
430 "test_compunit_fsm1.vcd",
431 traces, style,
432 module=top
433 )
434 m = Module()
435 alu = Shifter(8)
436 dut = MultiCompUnit(8, alu, CompFSMOpSubset)
437 m.submodules.cu = dut
438
439 vl = rtlil.convert(dut, ports=dut.ports())
440 with open("test_compunit_fsm1.il", "w") as f:
441 f.write(vl)
442
443 sim = Simulator(m)
444 sim.add_clock(1e-6)
445
446 # create one operand producer for each input port
447 prod_a = OperandProducer(sim, dut, 0)
448 prod_b = OperandProducer(sim, dut, 1)
449 # create an result consumer for the output port
450 cons = ResultConsumer(sim, dut, 0)
451 sim.add_sync_process(wrap(scoreboard_sim_fsm(dut,
452 [prod_a, prod_b],
453 [cons])))
454 sim_writer = sim.write_vcd('test_compunit_fsm1.vcd',
455 traces=[prod_a.count,
456 prod_b.count,
457 cons.count])
458 with sim_writer:
459 sim.run()
460
461
462 def test_compunit():
463
464 m = Module()
465 alu = ALU(16)
466 dut = MultiCompUnit(16, alu, CompALUOpSubset)
467 m.submodules.cu = dut
468
469 vl = rtlil.convert(dut, ports=dut.ports())
470 with open("test_compunit1.il", "w") as f:
471 f.write(vl)
472
473 sim = Simulator(m)
474 sim.add_clock(1e-6)
475
476 # create an operation issuer
477 op = OpSim(dut, sim)
478 sim.add_sync_process(wrap(scoreboard_sim(op)))
479 sim_writer = sim.write_vcd('test_compunit1.vcd')
480 with sim_writer:
481 sim.run()
482
483
484 class CompUnitParallelTest:
485 def __init__(self, dut):
486 self.dut = dut
487
488 # Operation cycle should not take longer than this:
489 self.MAX_BUSY_WAIT = 50
490
491 # Minimum duration in which issue_i will be kept inactive,
492 # during which busy_o must remain low.
493 self.MIN_BUSY_LOW = 5
494
495 # Number of cycles to stall until the assertion of go.
496 # One value, for each port. Can be zero, for no delay.
497 self.RD_GO_DELAY = [0, 3]
498
499 # store common data for the input operation of the processes
500 # input operation:
501 self.op = 0
502 self.inv_a = self.zero_a = 0
503 self.imm = self.imm_ok = 0
504 self.imm_control = (0, 0)
505 self.rdmaskn = (0, 0)
506 # input data:
507 self.operands = (0, 0)
508
509 # Indicates completion of the sub-processes
510 self.rd_complete = [False, False]
511
512 def driver(self):
513 print("Begin parallel test.")
514 yield from self.operation(5, 2, MicrOp.OP_ADD)
515
516 def operation(self, a, b, op, inv_a=0, imm=0, imm_ok=0, zero_a=0,
517 rdmaskn=(0, 0)):
518 # store data for the operation
519 self.operands = (a, b)
520 self.op = op
521 self.inv_a = inv_a
522 self.imm = imm
523 self.imm_ok = imm_ok
524 self.zero_a = zero_a
525 self.imm_control = (zero_a, imm_ok)
526 self.rdmaskn = rdmaskn
527
528 # Initialize completion flags
529 self.rd_complete = [False, False]
530
531 # trigger operation cycle
532 yield from self.issue()
533
534 # check that the sub-processes completed, before the busy_o cycle ended
535 for completion in self.rd_complete:
536 assert completion
537
538 def issue(self):
539 # issue_i starts inactive
540 yield self.dut.issue_i.eq(0)
541
542 for n in range(self.MIN_BUSY_LOW):
543 yield
544 # busy_o must remain inactive. It cannot rise on its own.
545 busy_o = yield self.dut.busy_o
546 assert not busy_o
547
548 # activate issue_i to begin the operation cycle
549 yield self.dut.issue_i.eq(1)
550
551 # at the same time, present the operation
552 yield self.dut.oper_i.insn_type.eq(self.op)
553 yield self.dut.oper_i.invert_in.eq(self.inv_a)
554 yield self.dut.oper_i.imm_data.data.eq(self.imm)
555 yield self.dut.oper_i.imm_data.ok.eq(self.imm_ok)
556 yield self.dut.oper_i.zero_a.eq(self.zero_a)
557 rdmaskn = self.rdmaskn[0] | (self.rdmaskn[1] << 1)
558 yield self.dut.rdmaskn.eq(rdmaskn)
559
560 # give one cycle for the CompUnit to latch the data
561 yield
562
563 # busy_o must keep being low in this cycle, because issue_i was
564 # low on the previous cycle.
565 # It cannot rise on its own.
566 # Also, busy_o and issue_i must never be active at the same time, ever.
567 busy_o = yield self.dut.busy_o
568 assert not busy_o
569
570 # Lower issue_i
571 yield self.dut.issue_i.eq(0)
572
573 # deactivate inputs along with issue_i, so we can be sure the data
574 # was latched at the correct cycle
575 # note: rdmaskn must be held, while busy_o is active
576 # TODO: deactivate rdmaskn when the busy_o cycle ends
577 yield self.dut.oper_i.insn_type.eq(0)
578 yield self.dut.oper_i.invert_in.eq(0)
579 yield self.dut.oper_i.imm_data.data.eq(0)
580 yield self.dut.oper_i.imm_data.ok.eq(0)
581 yield self.dut.oper_i.zero_a.eq(0)
582 yield
583
584 # wait for busy_o to lower
585 # timeout after self.MAX_BUSY_WAIT cycles
586 for n in range(self.MAX_BUSY_WAIT):
587 # sample busy_o in the current cycle
588 busy_o = yield self.dut.busy_o
589 if not busy_o:
590 # operation cycle ends when busy_o becomes inactive
591 break
592 yield
593
594 # if busy_o is still active, a timeout has occurred
595 # TODO: Uncomment this, once the test is complete:
596 # assert not busy_o
597
598 if busy_o:
599 print("If you are reading this, "
600 "it's because the above test failed, as expected,\n"
601 "with a timeout. It must pass, once the test is complete.")
602 return
603
604 print("If you are reading this, "
605 "it's because the above test unexpectedly passed.")
606
607 def rd(self, rd_idx):
608 # wait for issue_i to rise
609 while True:
610 issue_i = yield self.dut.issue_i
611 if issue_i:
612 break
613 # issue_i has not risen yet, so rd must keep low
614 rel = yield self.dut.rd.rel_o[rd_idx]
615 assert not rel
616 yield
617
618 # we do not want rd to rise on an immediate operand
619 # if it is immediate, exit the process
620 # likewise, if the read mask is active
621 # TODO: don't exit the process, monitor rd instead to ensure it
622 # doesn't rise on its own
623 if self.rdmaskn[rd_idx] or self.imm_control[rd_idx]:
624 self.rd_complete[rd_idx] = True
625 return
626
627 # issue_i has risen. rel must rise on the next cycle
628 rel = yield self.dut.rd.rel_o[rd_idx]
629 assert not rel
630
631 # stall for additional cycles. Check that rel doesn't fall on its own
632 for n in range(self.RD_GO_DELAY[rd_idx]):
633 yield
634 rel = yield self.dut.rd.rel_o[rd_idx]
635 assert rel
636
637 # Before asserting "go", make sure "rel" has risen.
638 # The use of Settle allows "go" to be set combinatorially,
639 # rising on the same cycle as "rel".
640 yield Settle()
641 rel = yield self.dut.rd.rel_o[rd_idx]
642 assert rel
643
644 # assert go for one cycle, passing along the operand value
645 yield self.dut.rd.go_i[rd_idx].eq(1)
646 yield self.dut.src_i[rd_idx].eq(self.operands[rd_idx])
647 # check that the operand was sent to the alu
648 # TODO: Properly check the alu protocol
649 yield Settle()
650 alu_input = yield self.dut.get_in(rd_idx)
651 assert alu_input == self.operands[rd_idx]
652 yield
653
654 # rel must keep high, since go was inactive in the last cycle
655 rel = yield self.dut.rd.rel_o[rd_idx]
656 assert rel
657
658 # finish the go one-clock pulse
659 yield self.dut.rd.go_i[rd_idx].eq(0)
660 yield self.dut.src_i[rd_idx].eq(0)
661 yield
662
663 # rel must have gone low in response to go being high
664 # on the previous cycle
665 rel = yield self.dut.rd.rel_o[rd_idx]
666 assert not rel
667
668 self.rd_complete[rd_idx] = True
669
670 # TODO: check that rel doesn't rise again until the end of the
671 # busy_o cycle
672
673 def wr(self, wr_idx):
674 # monitor self.dut.wr.req[rd_idx] and sets dut.wr.go[idx] for one cycle
675 yield
676 # TODO: also when dut.wr.go is set, check the output against the
677 # self.expected_o and assert. use dut.get_out(wr_idx) to do so.
678
679 def run_simulation(self, vcd_name):
680 m = Module()
681 m.submodules.cu = self.dut
682 sim = Simulator(m)
683 sim.add_clock(1e-6)
684
685 sim.add_sync_process(wrap(self.driver()))
686 sim.add_sync_process(wrap(self.rd(0)))
687 sim.add_sync_process(wrap(self.rd(1)))
688 sim.add_sync_process(wrap(self.wr(0)))
689 sim_writer = sim.write_vcd(vcd_name)
690 with sim_writer:
691 sim.run()
692
693
694 def test_compunit_regspec2_fsm():
695
696 inspec = [('INT', 'data', '0:15'),
697 ('INT', 'shift', '0:15'),
698 ]
699 outspec = [('INT', 'data', '0:15'),
700 ]
701
702 regspec = (inspec, outspec)
703
704 m = Module()
705 alu = Shifter(8)
706 dut = MultiCompUnit(regspec, alu, CompFSMOpSubset)
707 m.submodules.cu = dut
708
709 sim = Simulator(m)
710 sim.add_clock(1e-6)
711
712 # create one operand producer for each input port
713 prod_a = OperandProducer(sim, dut, 0)
714 prod_b = OperandProducer(sim, dut, 1)
715 # create an result consumer for the output port
716 cons = ResultConsumer(sim, dut, 0)
717 sim.add_sync_process(wrap(scoreboard_sim_fsm(dut,
718 [prod_a, prod_b],
719 [cons])))
720 sim_writer = sim.write_vcd('test_compunit_regspec2_fsm.vcd',
721 traces=[prod_a.count,
722 prod_b.count,
723 cons.count])
724 with sim_writer:
725 sim.run()
726
727
728 def test_compunit_regspec3():
729
730 inspec = [('INT', 'a', '0:15'),
731 ('INT', 'b', '0:15'),
732 ('INT', 'c', '0:15')]
733 outspec = [('INT', 'o', '0:15'),
734 ]
735
736 regspec = (inspec, outspec)
737
738 m = Module()
739 alu = DummyALU(16)
740 dut = MultiCompUnit(regspec, alu, CompALUOpSubset)
741 m.submodules.cu = dut
742
743 sim = Simulator(m)
744 sim.add_clock(1e-6)
745
746 sim.add_sync_process(wrap(scoreboard_sim_dummy(dut)))
747 sim_writer = sim.write_vcd('test_compunit_regspec3.vcd')
748 with sim_writer:
749 sim.run()
750
751
752 def test_compunit_regspec1():
753
754 style = {
755 'in': {'color': 'orange'},
756 'out': {'color': 'yellow'},
757 }
758 traces = [
759 'clk',
760 ('operation port', {'color': 'red'}, [
761 'cu_issue_i', 'cu_busy_o',
762 {'comment': 'operation'},
763 ('oper_i_None__insn_type', {'display': 'insn_type'}),
764 ('oper_i_None__invert_in', {'display': 'invert_in'}),
765 ('oper_i_None__imm_data__data[63:0]', {'display': 'data[63:0]'}),
766 ('oper_i_None__imm_data__imm_ok', {'display': 'imm_ok'}),
767 ('oper_i_None__zero_a', {'display': 'zero_a'})]),
768 ('operand 1 port', 'in', [
769 ('cu_rd__rel_o[1:0]', {'bit': 1}),
770 ('cu_rd__go_i[1:0]', {'bit': 1}),
771 'src1_i[15:0]']),
772 ('operand 2 port', 'in', [
773 ('cu_rd__rel_o[1:0]', {'bit': 0}),
774 ('cu_rd__go_i[1:0]', {'bit': 0}),
775 'src2_i[15:0]']),
776 ('result port', 'out', [
777 'cu_wr__rel_o', 'cu_wr__go_i', 'dest1_o[15:0]']),
778 ('alu', {'module': 'top.cu.alu'}, [
779 ('prev port', 'in', [
780 'op__insn_type', 'op__invert_i', 'a[15:0]', 'b[15:0]',
781 'valid_i', 'ready_o']),
782 ('next port', 'out', [
783 'alu_o[15:0]', 'valid_o', 'ready_i'])]),
784 ('debug', {'module': 'top'},
785 ['src1_count[7:0]', 'src2_count[7:0]', 'dest1_count[7:0]'])]
786
787 write_gtkw("test_compunit_regspec1.gtkw",
788 "test_compunit_regspec1.vcd",
789 traces, style,
790 clk_period=1e-6,
791 module='top.cu')
792
793 inspec = [('INT', 'a', '0:15'),
794 ('INT', 'b', '0:15')]
795 outspec = [('INT', 'o', '0:15'),
796 ]
797
798 regspec = (inspec, outspec)
799
800 m = Module()
801 alu = ALU(16)
802 dut = MultiCompUnit(regspec, alu, CompALUOpSubset)
803 m.submodules.cu = dut
804
805 vl = rtlil.convert(dut, ports=dut.ports())
806 with open("test_compunit_regspec1.il", "w") as f:
807 f.write(vl)
808
809 sim = Simulator(m)
810 sim.add_clock(1e-6)
811
812 # create an operation issuer
813 op = OpSim(dut, sim)
814 sim.add_sync_process(wrap(scoreboard_sim(op)))
815 sim_writer = sim.write_vcd('test_compunit_regspec1.vcd',
816 traces=[op.producers[0].count,
817 op.producers[1].count,
818 op.consumers[0].count])
819 with sim_writer:
820 sim.run()
821
822 test = CompUnitParallelTest(dut)
823 test.run_simulation("test_compunit_parallel.vcd")
824
825
826 if __name__ == '__main__':
827 test_compunit()
828 test_compunit_fsm()
829 test_compunit_regspec1()
830 test_compunit_regspec2_fsm()
831 test_compunit_regspec3()