Add expected state to case_0_adde in alu_cases unit test
[openpower-isa.git] / src / openpower / decoder / isa / caller.py
1 # SPDX-License-Identifier: LGPLv3+
2 # Copyright (C) 2020, 2021 Luke Kenneth Casson Leighton <lkcl@lkcl.net>
3 # Copyright (C) 2020 Michael Nolan
4 # Funded by NLnet http://nlnet.nl
5 """core of the python-based POWER9 simulator
6
7 this is part of a cycle-accurate POWER9 simulator. its primary purpose is
8 not speed, it is for both learning and educational purposes, as well as
9 a method of verifying the HDL.
10
11 related bugs:
12
13 * https://bugs.libre-soc.org/show_bug.cgi?id=424
14 """
15
16 from nmigen.back.pysim import Settle
17 from functools import wraps
18 from copy import copy, deepcopy
19 from openpower.decoder.orderedset import OrderedSet
20 from openpower.decoder.selectable_int import (FieldSelectableInt, SelectableInt,
21 selectconcat)
22 from openpower.decoder.power_enums import (spr_dict, spr_byname, XER_bits,
23 insns, MicrOp, In1Sel, In2Sel, In3Sel,
24 OutSel, CRInSel, CROutSel, LDSTMode,
25 SVP64RMMode, SVP64PredMode,
26 SVP64PredInt, SVP64PredCR,
27 SVP64LDSTmode)
28
29 from openpower.decoder.power_enums import SVPtype
30
31 from openpower.decoder.helpers import (exts, gtu, ltu, undefined,
32 ISACallerHelper, ISAFPHelpers)
33 from openpower.consts import PIb, MSRb # big-endian (PowerISA versions)
34 from openpower.consts import (SVP64MODE,
35 SVP64CROffs,
36 )
37 from openpower.decoder.power_svp64 import SVP64RM, decode_extra
38
39 from openpower.decoder.isa.radixmmu import RADIX
40 from openpower.decoder.isa.mem import Mem, swap_order, MemException
41 from openpower.decoder.isa.svshape import SVSHAPE
42 from openpower.decoder.isa.svstate import SVP64State
43
44
45 from openpower.util import log
46
47 from collections import namedtuple
48 import math
49 import sys
50
51 instruction_info = namedtuple('instruction_info',
52 'func read_regs uninit_regs write_regs ' +
53 'special_regs op_fields form asmregs')
54
55 special_sprs = {
56 'LR': 8,
57 'CTR': 9,
58 'TAR': 815,
59 'XER': 1,
60 'VRSAVE': 256}
61
62
63 REG_SORT_ORDER = {
64 # TODO (lkcl): adjust other registers that should be in a particular order
65 # probably CA, CA32, and CR
66 "FRT": 0,
67 "FRA": 0,
68 "FRB": 0,
69 "FRC": 0,
70 "FRS": 0,
71 "RT": 0,
72 "RA": 0,
73 "RB": 0,
74 "RC": 0,
75 "RS": 0,
76 "BI": 0,
77 "CR": 0,
78 "LR": 0,
79 "CTR": 0,
80 "TAR": 0,
81 "MSR": 0,
82 "SVSTATE": 0,
83 "SVSHAPE0": 0,
84 "SVSHAPE1": 0,
85 "SVSHAPE2": 0,
86 "SVSHAPE3": 0,
87
88 "CA": 0,
89 "CA32": 0,
90
91 "overflow": 7, # should definitely be last
92 }
93
94 fregs = ['FRA', 'FRB', 'FRC', 'FRS', 'FRT']
95
96
97 def create_args(reglist, extra=None):
98 retval = list(OrderedSet(reglist))
99 retval.sort(key=lambda reg: REG_SORT_ORDER.get(reg, 0))
100 if extra is not None:
101 return [extra] + retval
102 return retval
103
104
105
106 class GPR(dict):
107 def __init__(self, decoder, isacaller, svstate, regfile):
108 dict.__init__(self)
109 self.sd = decoder
110 self.isacaller = isacaller
111 self.svstate = svstate
112 for i in range(len(regfile)):
113 self[i] = SelectableInt(regfile[i], 64)
114
115 def __call__(self, ridx):
116 if isinstance(ridx, SelectableInt):
117 ridx = ridx.value
118 return self[ridx]
119
120 def set_form(self, form):
121 self.form = form
122
123 def __setitem__(self, rnum, value):
124 # rnum = rnum.value # only SelectableInt allowed
125 log("GPR setitem", rnum, value)
126 if isinstance(rnum, SelectableInt):
127 rnum = rnum.value
128 dict.__setitem__(self, rnum, value)
129
130 def getz(self, rnum):
131 # rnum = rnum.value # only SelectableInt allowed
132 log("GPR getzero?", rnum)
133 if rnum == 0:
134 return SelectableInt(0, 64)
135 return self[rnum]
136
137 def _get_regnum(self, attr):
138 getform = self.sd.sigforms[self.form]
139 rnum = getattr(getform, attr)
140 return rnum
141
142 def ___getitem__(self, attr):
143 """ XXX currently not used
144 """
145 rnum = self._get_regnum(attr)
146 log("GPR getitem", attr, rnum)
147 return self.regfile[rnum]
148
149 def dump(self, printout=True):
150 res = []
151 for i in range(len(self)):
152 res.append(self[i].value)
153 if printout:
154 for i in range(0, len(res), 8):
155 s = []
156 for j in range(8):
157 s.append("%08x" % res[i+j])
158 s = ' '.join(s)
159 print("reg", "%2d" % i, s)
160 return res
161
162
163 class SPR(dict):
164 def __init__(self, dec2, initial_sprs={}):
165 self.sd = dec2
166 dict.__init__(self)
167 for key, v in initial_sprs.items():
168 if isinstance(key, SelectableInt):
169 key = key.value
170 key = special_sprs.get(key, key)
171 if isinstance(key, int):
172 info = spr_dict[key]
173 else:
174 info = spr_byname[key]
175 if not isinstance(v, SelectableInt):
176 v = SelectableInt(v, info.length)
177 self[key] = v
178
179 def __getitem__(self, key):
180 log("get spr", key)
181 log("dict", self.items())
182 # if key in special_sprs get the special spr, otherwise return key
183 if isinstance(key, SelectableInt):
184 key = key.value
185 if isinstance(key, int):
186 key = spr_dict[key].SPR
187 key = special_sprs.get(key, key)
188 if key == 'HSRR0': # HACK!
189 key = 'SRR0'
190 if key == 'HSRR1': # HACK!
191 key = 'SRR1'
192 if key in self:
193 res = dict.__getitem__(self, key)
194 else:
195 if isinstance(key, int):
196 info = spr_dict[key]
197 else:
198 info = spr_byname[key]
199 dict.__setitem__(self, key, SelectableInt(0, info.length))
200 res = dict.__getitem__(self, key)
201 log("spr returning", key, res)
202 return res
203
204 def __setitem__(self, key, value):
205 if isinstance(key, SelectableInt):
206 key = key.value
207 if isinstance(key, int):
208 key = spr_dict[key].SPR
209 log("spr key", key)
210 key = special_sprs.get(key, key)
211 if key == 'HSRR0': # HACK!
212 self.__setitem__('SRR0', value)
213 if key == 'HSRR1': # HACK!
214 self.__setitem__('SRR1', value)
215 log("setting spr", key, value)
216 dict.__setitem__(self, key, value)
217
218 def __call__(self, ridx):
219 return self[ridx]
220
221 def dump(self, printout=True):
222 res = []
223 keys = list(self.keys())
224 #keys.sort()
225 for k in keys:
226 sprname = spr_dict.get(k, None)
227 if sprname is None:
228 sprname = k
229 else:
230 sprname = sprname.SPR
231 res.append((sprname, self[k].value))
232 if printout:
233 for sprname, value in res:
234 print(" ", sprname, hex(value))
235 return res
236
237
238 class PC:
239 def __init__(self, pc_init=0):
240 self.CIA = SelectableInt(pc_init, 64)
241 self.NIA = self.CIA + SelectableInt(4, 64) # only true for v3.0B!
242
243 def update_nia(self, is_svp64):
244 increment = 8 if is_svp64 else 4
245 self.NIA = self.CIA + SelectableInt(increment, 64)
246
247 def update(self, namespace, is_svp64):
248 """updates the program counter (PC) by 4 if v3.0B mode or 8 if SVP64
249 """
250 self.CIA = namespace['NIA'].narrow(64)
251 self.update_nia(is_svp64)
252 namespace['CIA'] = self.CIA
253 namespace['NIA'] = self.NIA
254
255
256 # SVP64 ReMap field
257 class SVP64RMFields:
258 def __init__(self, init=0):
259 self.spr = SelectableInt(init, 24)
260 # SVP64 RM fields: see https://libre-soc.org/openpower/sv/svp64/
261 self.mmode = FieldSelectableInt(self.spr, [0])
262 self.mask = FieldSelectableInt(self.spr, tuple(range(1,4)))
263 self.elwidth = FieldSelectableInt(self.spr, tuple(range(4,6)))
264 self.ewsrc = FieldSelectableInt(self.spr, tuple(range(6,8)))
265 self.subvl = FieldSelectableInt(self.spr, tuple(range(8,10)))
266 self.extra = FieldSelectableInt(self.spr, tuple(range(10,19)))
267 self.mode = FieldSelectableInt(self.spr, tuple(range(19,24)))
268 # these cover the same extra field, split into parts as EXTRA2
269 self.extra2 = list(range(4))
270 self.extra2[0] = FieldSelectableInt(self.spr, tuple(range(10,12)))
271 self.extra2[1] = FieldSelectableInt(self.spr, tuple(range(12,14)))
272 self.extra2[2] = FieldSelectableInt(self.spr, tuple(range(14,16)))
273 self.extra2[3] = FieldSelectableInt(self.spr, tuple(range(16,18)))
274 self.smask = FieldSelectableInt(self.spr, tuple(range(16,19)))
275 # and here as well, but EXTRA3
276 self.extra3 = list(range(3))
277 self.extra3[0] = FieldSelectableInt(self.spr, tuple(range(10,13)))
278 self.extra3[1] = FieldSelectableInt(self.spr, tuple(range(13,16)))
279 self.extra3[2] = FieldSelectableInt(self.spr, tuple(range(16,19)))
280
281
282 SVP64RM_MMODE_SIZE = len(SVP64RMFields().mmode.br)
283 SVP64RM_MASK_SIZE = len(SVP64RMFields().mask.br)
284 SVP64RM_ELWIDTH_SIZE = len(SVP64RMFields().elwidth.br)
285 SVP64RM_EWSRC_SIZE = len(SVP64RMFields().ewsrc.br)
286 SVP64RM_SUBVL_SIZE = len(SVP64RMFields().subvl.br)
287 SVP64RM_EXTRA2_SPEC_SIZE = len(SVP64RMFields().extra2[0].br)
288 SVP64RM_EXTRA3_SPEC_SIZE = len(SVP64RMFields().extra3[0].br)
289 SVP64RM_SMASK_SIZE = len(SVP64RMFields().smask.br)
290 SVP64RM_MODE_SIZE = len(SVP64RMFields().mode.br)
291
292
293 # SVP64 Prefix fields: see https://libre-soc.org/openpower/sv/svp64/
294 class SVP64PrefixFields:
295 def __init__(self):
296 self.insn = SelectableInt(0, 32)
297 # 6 bit major opcode EXT001, 2 bits "identifying" (7, 9), 24 SV ReMap
298 self.major = FieldSelectableInt(self.insn, tuple(range(0,6)))
299 self.pid = FieldSelectableInt(self.insn, (7, 9)) # must be 0b11
300 rmfields = [6, 8] + list(range(10,32)) # SVP64 24-bit RM (ReMap)
301 self.rm = FieldSelectableInt(self.insn, rmfields)
302
303
304 SV64P_MAJOR_SIZE = len(SVP64PrefixFields().major.br)
305 SV64P_PID_SIZE = len(SVP64PrefixFields().pid.br)
306 SV64P_RM_SIZE = len(SVP64PrefixFields().rm.br)
307
308
309 # CR register fields
310 # See PowerISA Version 3.0 B Book 1
311 # Section 2.3.1 Condition Register pages 30 - 31
312 class CRFields:
313 LT = FL = 0 # negative, less than, floating-point less than
314 GT = FG = 1 # positive, greater than, floating-point greater than
315 EQ = FE = 2 # equal, floating-point equal
316 SO = FU = 3 # summary overflow, floating-point unordered
317
318 def __init__(self, init=0):
319 # rev_cr = int('{:016b}'.format(initial_cr)[::-1], 2)
320 # self.cr = FieldSelectableInt(self._cr, list(range(32, 64)))
321 self.cr = SelectableInt(init, 64) # underlying reg
322 # field-selectable versions of Condition Register TODO check bitranges?
323 self.crl = []
324 for i in range(8):
325 bits = tuple(range(i*4+32, (i+1)*4+32))
326 _cr = FieldSelectableInt(self.cr, bits)
327 self.crl.append(_cr)
328
329 # decode SVP64 predicate integer to reg number and invert
330 def get_predint(gpr, mask):
331 r10 = gpr(10)
332 r30 = gpr(30)
333 log ("get_predint", mask, SVP64PredInt.ALWAYS.value)
334 if mask == SVP64PredInt.ALWAYS.value:
335 return 0xffff_ffff_ffff_ffff
336 if mask == SVP64PredInt.R3_UNARY.value:
337 return 1 << (gpr(3).value & 0b111111)
338 if mask == SVP64PredInt.R3.value:
339 return gpr(3).value
340 if mask == SVP64PredInt.R3_N.value:
341 return ~gpr(3).value
342 if mask == SVP64PredInt.R10.value:
343 return gpr(10).value
344 if mask == SVP64PredInt.R10_N.value:
345 return ~gpr(10).value
346 if mask == SVP64PredInt.R30.value:
347 return gpr(30).value
348 if mask == SVP64PredInt.R30_N.value:
349 return ~gpr(30).value
350
351 # decode SVP64 predicate CR to reg number and invert status
352 def _get_predcr(mask):
353 if mask == SVP64PredCR.LT.value:
354 return 0, 1
355 if mask == SVP64PredCR.GE.value:
356 return 0, 0
357 if mask == SVP64PredCR.GT.value:
358 return 1, 1
359 if mask == SVP64PredCR.LE.value:
360 return 1, 0
361 if mask == SVP64PredCR.EQ.value:
362 return 2, 1
363 if mask == SVP64PredCR.NE.value:
364 return 2, 0
365 if mask == SVP64PredCR.SO.value:
366 return 3, 1
367 if mask == SVP64PredCR.NS.value:
368 return 3, 0
369
370 # read individual CR fields (0..VL-1), extract the required bit
371 # and construct the mask
372 def get_predcr(crl, mask, vl):
373 idx, noninv = _get_predcr(mask)
374 mask = 0
375 for i in range(vl):
376 cr = crl[i+SVP64CROffs.CRPred]
377 if cr[idx].value == noninv:
378 mask |= (1<<i)
379 return mask
380
381
382 # TODO, really should just be using PowerDecoder2
383 def get_pdecode_idx_in(dec2, name):
384 op = dec2.dec.op
385 in1_sel = yield op.in1_sel
386 in2_sel = yield op.in2_sel
387 in3_sel = yield op.in3_sel
388 # get the IN1/2/3 from the decoder (includes SVP64 remap and isvec)
389 in1 = yield dec2.e.read_reg1.data
390 in2 = yield dec2.e.read_reg2.data
391 in3 = yield dec2.e.read_reg3.data
392 in1_isvec = yield dec2.in1_isvec
393 in2_isvec = yield dec2.in2_isvec
394 in3_isvec = yield dec2.in3_isvec
395 log ("get_pdecode_idx_in in1", name, in1_sel, In1Sel.RA.value,
396 in1, in1_isvec)
397 log ("get_pdecode_idx_in in2", name, in2_sel, In2Sel.RB.value,
398 in2, in2_isvec)
399 log ("get_pdecode_idx_in in3", name, in3_sel, In3Sel.RS.value,
400 in3, in3_isvec)
401 log ("get_pdecode_idx_in FRS in3", name, in3_sel, In3Sel.FRS.value,
402 in3, in3_isvec)
403 log ("get_pdecode_idx_in FRB in2", name, in2_sel, In2Sel.FRB.value,
404 in2, in2_isvec)
405 log ("get_pdecode_idx_in FRC in3", name, in3_sel, In3Sel.FRC.value,
406 in3, in3_isvec)
407 # identify which regnames map to in1/2/3
408 if name == 'RA':
409 if (in1_sel == In1Sel.RA.value or
410 (in1_sel == In1Sel.RA_OR_ZERO.value and in1 != 0)):
411 return in1, in1_isvec
412 if in1_sel == In1Sel.RA_OR_ZERO.value:
413 return in1, in1_isvec
414 elif name == 'RB':
415 if in2_sel == In2Sel.RB.value:
416 return in2, in2_isvec
417 if in3_sel == In3Sel.RB.value:
418 return in3, in3_isvec
419 # XXX TODO, RC doesn't exist yet!
420 elif name == 'RC':
421 assert False, "RC does not exist yet"
422 elif name == 'RS':
423 if in1_sel == In1Sel.RS.value:
424 return in1, in1_isvec
425 if in2_sel == In2Sel.RS.value:
426 return in2, in2_isvec
427 if in3_sel == In3Sel.RS.value:
428 return in3, in3_isvec
429 elif name == 'FRA':
430 if in1_sel == In1Sel.FRA.value:
431 return in1, in1_isvec
432 elif name == 'FRB':
433 if in2_sel == In2Sel.FRB.value:
434 return in2, in2_isvec
435 elif name == 'FRC':
436 if in3_sel == In3Sel.FRC.value:
437 return in3, in3_isvec
438 elif name == 'FRS':
439 if in1_sel == In1Sel.FRS.value:
440 return in1, in1_isvec
441 if in3_sel == In3Sel.FRS.value:
442 return in3, in3_isvec
443 return None, False
444
445
446 # TODO, really should just be using PowerDecoder2
447 def get_pdecode_cr_in(dec2, name):
448 op = dec2.dec.op
449 in_sel = yield op.cr_in
450 in_bitfield = yield dec2.dec_cr_in.cr_bitfield.data
451 sv_cr_in = yield op.sv_cr_in
452 spec = yield dec2.crin_svdec.spec
453 sv_override = yield dec2.dec_cr_in.sv_override
454 # get the IN1/2/3 from the decoder (includes SVP64 remap and isvec)
455 in1 = yield dec2.e.read_cr1.data
456 cr_isvec = yield dec2.cr_in_isvec
457 log ("get_pdecode_cr_in", in_sel, CROutSel.CR0.value, in1, cr_isvec)
458 log (" sv_cr_in", sv_cr_in)
459 log (" cr_bf", in_bitfield)
460 log (" spec", spec)
461 log (" override", sv_override)
462 # identify which regnames map to in / o2
463 if name == 'BI':
464 if in_sel == CRInSel.BI.value:
465 return in1, cr_isvec
466 log ("get_pdecode_cr_in not found", name)
467 return None, False
468
469
470 # TODO, really should just be using PowerDecoder2
471 def get_pdecode_cr_out(dec2, name):
472 op = dec2.dec.op
473 out_sel = yield op.cr_out
474 out_bitfield = yield dec2.dec_cr_out.cr_bitfield.data
475 sv_cr_out = yield op.sv_cr_out
476 spec = yield dec2.crout_svdec.spec
477 sv_override = yield dec2.dec_cr_out.sv_override
478 # get the IN1/2/3 from the decoder (includes SVP64 remap and isvec)
479 out = yield dec2.e.write_cr.data
480 o_isvec = yield dec2.o_isvec
481 log ("get_pdecode_cr_out", out_sel, CROutSel.CR0.value, out, o_isvec)
482 log (" sv_cr_out", sv_cr_out)
483 log (" cr_bf", out_bitfield)
484 log (" spec", spec)
485 log (" override", sv_override)
486 # identify which regnames map to out / o2
487 if name == 'CR0':
488 if out_sel == CROutSel.CR0.value:
489 return out, o_isvec
490 log ("get_pdecode_cr_out not found", name)
491 return None, False
492
493
494 # TODO, really should just be using PowerDecoder2
495 def get_pdecode_idx_out(dec2, name):
496 op = dec2.dec.op
497 out_sel = yield op.out_sel
498 # get the IN1/2/3 from the decoder (includes SVP64 remap and isvec)
499 out = yield dec2.e.write_reg.data
500 o_isvec = yield dec2.o_isvec
501 # identify which regnames map to out / o2
502 if name == 'RA':
503 log ("get_pdecode_idx_out", out_sel, OutSel.RA.value, out, o_isvec)
504 if out_sel == OutSel.RA.value:
505 return out, o_isvec
506 elif name == 'RT':
507 log ("get_pdecode_idx_out", out_sel, OutSel.RT.value,
508 OutSel.RT_OR_ZERO.value, out, o_isvec,
509 dec2.dec.RT)
510 if out_sel == OutSel.RT.value:
511 return out, o_isvec
512 elif name == 'RT_OR_ZERO':
513 log ("get_pdecode_idx_out", out_sel, OutSel.RT.value,
514 OutSel.RT_OR_ZERO.value, out, o_isvec,
515 dec2.dec.RT)
516 if out_sel == OutSel.RT_OR_ZERO.value:
517 return out, o_isvec
518 elif name == 'FRA':
519 log ("get_pdecode_idx_out", out_sel, OutSel.FRA.value, out, o_isvec)
520 if out_sel == OutSel.FRA.value:
521 return out, o_isvec
522 elif name == 'FRT':
523 log ("get_pdecode_idx_out", out_sel, OutSel.FRT.value,
524 OutSel.FRT.value, out, o_isvec)
525 if out_sel == OutSel.FRT.value:
526 return out, o_isvec
527 log ("get_pdecode_idx_out not found", name, out_sel, out, o_isvec)
528 return None, False
529
530
531 # TODO, really should just be using PowerDecoder2
532 def get_pdecode_idx_out2(dec2, name):
533 # check first if register is activated for write
534 op = dec2.dec.op
535 out_sel = yield op.out_sel
536 out = yield dec2.e.write_ea.data
537 o_isvec = yield dec2.o2_isvec
538 out_ok = yield dec2.e.write_ea.ok
539 log ("get_pdecode_idx_out2", name, out_sel, out, out_ok, o_isvec)
540 if not out_ok:
541 return None, False
542
543 if name == 'RA':
544 if hasattr(op, "upd"):
545 # update mode LD/ST uses read-reg A also as an output
546 upd = yield op.upd
547 log ("get_pdecode_idx_out2", upd, LDSTMode.update.value,
548 out_sel, OutSel.RA.value,
549 out, o_isvec)
550 if upd == LDSTMode.update.value:
551 return out, o_isvec
552 if name == 'FRS':
553 int_op = yield dec2.dec.op.internal_op
554 fft_en = yield dec2.use_svp64_fft
555 #if int_op == MicrOp.OP_FP_MADD.value and fft_en:
556 if fft_en:
557 log ("get_pdecode_idx_out2", out_sel, OutSel.FRS.value,
558 out, o_isvec)
559 return out, o_isvec
560 return None, False
561
562
563 class ISACaller(ISACallerHelper, ISAFPHelpers):
564 # decoder2 - an instance of power_decoder2
565 # regfile - a list of initial values for the registers
566 # initial_{etc} - initial values for SPRs, Condition Register, Mem, MSR
567 # respect_pc - tracks the program counter. requires initial_insns
568 def __init__(self, decoder2, regfile, initial_sprs=None, initial_cr=0,
569 initial_mem=None, initial_msr=0,
570 initial_svstate=0,
571 initial_insns=None,
572 fpregfile=None,
573 respect_pc=False,
574 disassembly=None,
575 initial_pc=0,
576 bigendian=False,
577 mmu=False,
578 icachemmu=False):
579
580 self.bigendian = bigendian
581 self.halted = False
582 self.is_svp64_mode = False
583 self.respect_pc = respect_pc
584 if initial_sprs is None:
585 initial_sprs = {}
586 if initial_mem is None:
587 initial_mem = {}
588 if fpregfile is None:
589 fpregfile = [0] * 32
590 if initial_insns is None:
591 initial_insns = {}
592 assert self.respect_pc == False, "instructions required to honor pc"
593
594 log("ISACaller insns", respect_pc, initial_insns, disassembly)
595 log("ISACaller initial_msr", initial_msr)
596
597 # "fake program counter" mode (for unit testing)
598 self.fake_pc = 0
599 disasm_start = 0
600 if not respect_pc:
601 if isinstance(initial_mem, tuple):
602 self.fake_pc = initial_mem[0]
603 disasm_start = self.fake_pc
604 else:
605 disasm_start = initial_pc
606
607 # disassembly: we need this for now (not given from the decoder)
608 self.disassembly = {}
609 if disassembly:
610 for i, code in enumerate(disassembly):
611 self.disassembly[i*4 + disasm_start] = code
612
613 # set up registers, instruction memory, data memory, PC, SPRs, MSR, CR
614 self.svp64rm = SVP64RM()
615 if initial_svstate is None:
616 initial_svstate = 0
617 if isinstance(initial_svstate, int):
618 initial_svstate = SVP64State(initial_svstate)
619 # SVSTATE, MSR and PC
620 self.svstate = initial_svstate
621 self.msr = SelectableInt(initial_msr, 64) # underlying reg
622 self.pc = PC()
623 # GPR FPR SPR registers
624 initial_sprs = deepcopy(initial_sprs) # so as not to get modified
625 self.gpr = GPR(decoder2, self, self.svstate, regfile)
626 self.fpr = GPR(decoder2, self, self.svstate, fpregfile)
627 self.spr = SPR(decoder2, initial_sprs) # initialise SPRs before MMU
628
629 # set up 4 dummy SVSHAPEs if they aren't already set up
630 for i in range(4):
631 sname = 'SVSHAPE%d' % i
632 if sname not in self.spr:
633 self.spr[sname] = SVSHAPE(0)
634 else:
635 # make sure it's an SVSHAPE
636 val = self.spr[sname].value
637 self.spr[sname] = SVSHAPE(val)
638 self.last_op_svshape = False
639
640 # "raw" memory
641 self.mem = Mem(row_bytes=8, initial_mem=initial_mem)
642 self.imem = Mem(row_bytes=4, initial_mem=initial_insns)
643 # MMU mode, redirect underlying Mem through RADIX
644 if mmu:
645 self.mem = RADIX(self.mem, self)
646 if icachemmu:
647 self.imem = RADIX(self.imem, self)
648
649 # TODO, needed here:
650 # FPR (same as GPR except for FP nums)
651 # 4.2.2 p124 FPSCR (definitely "separate" - not in SPR)
652 # note that mffs, mcrfs, mtfsf "manage" this FPSCR
653 # 2.3.1 CR (and sub-fields CR0..CR6 - CR0 SO comes from XER.SO)
654 # note that mfocrf, mfcr, mtcr, mtocrf, mcrxrx "manage" CRs
655 # -- Done
656 # 2.3.2 LR (actually SPR #8) -- Done
657 # 2.3.3 CTR (actually SPR #9) -- Done
658 # 2.3.4 TAR (actually SPR #815)
659 # 3.2.2 p45 XER (actually SPR #1) -- Done
660 # 3.2.3 p46 p232 VRSAVE (actually SPR #256)
661
662 # create CR then allow portions of it to be "selectable" (below)
663 self.cr_fields = CRFields(initial_cr)
664 self.cr = self.cr_fields.cr
665
666 # "undefined", just set to variable-bit-width int (use exts "max")
667 #self.undefined = SelectableInt(0, 256) # TODO, not hard-code 256!
668
669 self.namespace = {}
670 self.namespace.update(self.spr)
671 self.namespace.update({'GPR': self.gpr,
672 'FPR': self.fpr,
673 'MEM': self.mem,
674 'SPR': self.spr,
675 'memassign': self.memassign,
676 'NIA': self.pc.NIA,
677 'CIA': self.pc.CIA,
678 'SVSTATE': self.svstate,
679 'SVSHAPE0': self.spr['SVSHAPE0'],
680 'SVSHAPE1': self.spr['SVSHAPE1'],
681 'SVSHAPE2': self.spr['SVSHAPE2'],
682 'SVSHAPE3': self.spr['SVSHAPE3'],
683 'CR': self.cr,
684 'MSR': self.msr,
685 'undefined': undefined,
686 'mode_is_64bit': True,
687 'SO': XER_bits['SO'],
688 'XLEN': 64 # elwidth overrides, later
689 })
690
691 # update pc to requested start point
692 self.set_pc(initial_pc)
693
694 # field-selectable versions of Condition Register
695 self.crl = self.cr_fields.crl
696 for i in range(8):
697 self.namespace["CR%d" % i] = self.crl[i]
698
699 self.decoder = decoder2.dec
700 self.dec2 = decoder2
701
702 super().__init__(XLEN=self.namespace["XLEN"])
703
704 @property
705 def XLEN(self):
706 return self.namespace["XLEN"]
707
708 def call_trap(self, trap_addr, trap_bit):
709 """calls TRAP and sets up NIA to the new execution location.
710 next instruction will begin at trap_addr.
711 """
712 self.TRAP(trap_addr, trap_bit)
713 self.namespace['NIA'] = self.trap_nia
714 self.pc.update(self.namespace, self.is_svp64_mode)
715
716 def TRAP(self, trap_addr=0x700, trap_bit=PIb.TRAP):
717 """TRAP> saves PC, MSR (and TODO SVSTATE), and updates MSR
718
719 TRAP function is callable from inside the pseudocode itself,
720 hence the default arguments. when calling from inside ISACaller
721 it is best to use call_trap()
722 """
723 log("TRAP:", hex(trap_addr), hex(self.namespace['MSR'].value))
724 # store CIA(+4?) in SRR0, set NIA to 0x700
725 # store MSR in SRR1, set MSR to um errr something, have to check spec
726 # store SVSTATE (if enabled) in SVSRR0
727 self.spr['SRR0'].value = self.pc.CIA.value
728 self.spr['SRR1'].value = self.namespace['MSR'].value
729 if self.is_svp64_mode:
730 self.spr['SVSRR0'] = self.namespace['SVSTATE'].value
731 self.trap_nia = SelectableInt(trap_addr, 64)
732 self.spr['SRR1'][trap_bit] = 1 # change *copy* of MSR in SRR1
733
734 # set exception bits. TODO: this should, based on the address
735 # in figure 66 p1065 V3.0B and the table figure 65 p1063 set these
736 # bits appropriately. however it turns out that *for now* in all
737 # cases (all trap_addrs) the exact same thing is needed.
738 self.msr[MSRb.IR] = 0
739 self.msr[MSRb.DR] = 0
740 self.msr[MSRb.FE0] = 0
741 self.msr[MSRb.FE1] = 0
742 self.msr[MSRb.EE] = 0
743 self.msr[MSRb.RI] = 0
744 self.msr[MSRb.SF] = 1
745 self.msr[MSRb.TM] = 0
746 self.msr[MSRb.VEC] = 0
747 self.msr[MSRb.VSX] = 0
748 self.msr[MSRb.PR] = 0
749 self.msr[MSRb.FP] = 0
750 self.msr[MSRb.PMM] = 0
751 self.msr[MSRb.TEs] = 0
752 self.msr[MSRb.TEe] = 0
753 self.msr[MSRb.UND] = 0
754 self.msr[MSRb.LE] = 1
755
756 def memassign(self, ea, sz, val):
757 self.mem.memassign(ea, sz, val)
758
759 def prep_namespace(self, insn_name, formname, op_fields):
760 # TODO: get field names from form in decoder*1* (not decoder2)
761 # decoder2 is hand-created, and decoder1.sigform is auto-generated
762 # from spec
763 # then "yield" fields only from op_fields rather than hard-coded
764 # list, here.
765 fields = self.decoder.sigforms[formname]
766 log("prep_namespace", formname, op_fields)
767 for name in op_fields:
768 # CR immediates. deal with separately. needs modifying
769 # pseudocode
770 if self.is_svp64_mode and name in ['BI']: # TODO, more CRs
771 # BI is a 5-bit, must reconstruct the value
772 regnum, is_vec = yield from get_pdecode_cr_in(self.dec2, name)
773 sig = getattr(fields, name)
774 val = yield sig
775 # low 2 LSBs (CR field selector) remain same, CR num extended
776 assert regnum <= 7, "sigh, TODO, 128 CR fields"
777 val = (val & 0b11) | (regnum<<2)
778 else:
779 if name == 'spr':
780 sig = getattr(fields, name.upper())
781 else:
782 sig = getattr(fields, name)
783 val = yield sig
784 # these are all opcode fields involved in index-selection of CR,
785 # and need to do "standard" arithmetic. CR[BA+32] for example
786 # would, if using SelectableInt, only be 5-bit.
787 if name in ['BF', 'BFA', 'BC', 'BA', 'BB', 'BT', 'BI']:
788 self.namespace[name] = val
789 else:
790 self.namespace[name] = SelectableInt(val, sig.width)
791
792 self.namespace['XER'] = self.spr['XER']
793 self.namespace['CA'] = self.spr['XER'][XER_bits['CA']].value
794 self.namespace['CA32'] = self.spr['XER'][XER_bits['CA32']].value
795
796 # add some SVSTATE convenience variables
797 vl = self.svstate.vl
798 srcstep = self.svstate.srcstep
799 self.namespace['VL'] = vl
800 self.namespace['srcstep'] = srcstep
801
802 # sv.bc* need some extra fields
803 if self.is_svp64_mode and insn_name.startswith("sv.bc"):
804 # blegh grab bits manually
805 mode = yield self.dec2.rm_dec.rm_in.mode
806 bc_vlset = (mode & SVP64MODE.BC_VLSET) != 0
807 bc_vli = (mode & SVP64MODE.BC_VLI) != 0
808 bc_snz = (mode & SVP64MODE.BC_SNZ) != 0
809 bc_vsb = yield self.dec2.rm_dec.bc_vsb
810 bc_lru = yield self.dec2.rm_dec.bc_lru
811 bc_gate = yield self.dec2.rm_dec.bc_gate
812 sz = yield self.dec2.rm_dec.pred_sz
813 self.namespace['ALL'] = SelectableInt(bc_gate, 1)
814 self.namespace['VSb'] = SelectableInt(bc_vsb, 1)
815 self.namespace['LRu'] = SelectableInt(bc_lru, 1)
816 self.namespace['VLSET'] = SelectableInt(bc_vlset, 1)
817 self.namespace['VLI'] = SelectableInt(bc_vli, 1)
818 self.namespace['sz'] = SelectableInt(sz, 1)
819 self.namespace['SNZ'] = SelectableInt(bc_snz, 1)
820
821 def handle_carry_(self, inputs, outputs, already_done):
822 inv_a = yield self.dec2.e.do.invert_in
823 if inv_a:
824 inputs[0] = ~inputs[0]
825
826 imm_ok = yield self.dec2.e.do.imm_data.ok
827 if imm_ok:
828 imm = yield self.dec2.e.do.imm_data.data
829 inputs.append(SelectableInt(imm, 64))
830 assert len(outputs) >= 1
831 log("outputs", repr(outputs))
832 if isinstance(outputs, list) or isinstance(outputs, tuple):
833 output = outputs[0]
834 else:
835 output = outputs
836 gts = []
837 for x in inputs:
838 log("gt input", x, output)
839 gt = (gtu(x, output))
840 gts.append(gt)
841 log(gts)
842 cy = 1 if any(gts) else 0
843 log("CA", cy, gts)
844 if not (1 & already_done):
845 self.spr['XER'][XER_bits['CA']] = cy
846
847 log("inputs", already_done, inputs)
848 # 32 bit carry
849 # ARGH... different for OP_ADD... *sigh*...
850 op = yield self.dec2.e.do.insn_type
851 if op == MicrOp.OP_ADD.value:
852 res32 = (output.value & (1 << 32)) != 0
853 a32 = (inputs[0].value & (1 << 32)) != 0
854 if len(inputs) >= 2:
855 b32 = (inputs[1].value & (1 << 32)) != 0
856 else:
857 b32 = False
858 cy32 = res32 ^ a32 ^ b32
859 log("CA32 ADD", cy32)
860 else:
861 gts = []
862 for x in inputs:
863 log("input", x, output)
864 log(" x[32:64]", x, x[32:64])
865 log(" o[32:64]", output, output[32:64])
866 gt = (gtu(x[32:64], output[32:64])) == SelectableInt(1, 1)
867 gts.append(gt)
868 cy32 = 1 if any(gts) else 0
869 log("CA32", cy32, gts)
870 if not (2 & already_done):
871 self.spr['XER'][XER_bits['CA32']] = cy32
872
873 def handle_overflow(self, inputs, outputs, div_overflow):
874 if hasattr(self.dec2.e.do, "invert_in"):
875 inv_a = yield self.dec2.e.do.invert_in
876 if inv_a:
877 inputs[0] = ~inputs[0]
878
879 imm_ok = yield self.dec2.e.do.imm_data.ok
880 if imm_ok:
881 imm = yield self.dec2.e.do.imm_data.data
882 inputs.append(SelectableInt(imm, 64))
883 assert len(outputs) >= 1
884 log("handle_overflow", inputs, outputs, div_overflow)
885 if len(inputs) < 2 and div_overflow is None:
886 return
887
888 # div overflow is different: it's returned by the pseudo-code
889 # because it's more complex than can be done by analysing the output
890 if div_overflow is not None:
891 ov, ov32 = div_overflow, div_overflow
892 # arithmetic overflow can be done by analysing the input and output
893 elif len(inputs) >= 2:
894 output = outputs[0]
895
896 # OV (64-bit)
897 input_sgn = [exts(x.value, x.bits) < 0 for x in inputs]
898 output_sgn = exts(output.value, output.bits) < 0
899 ov = 1 if input_sgn[0] == input_sgn[1] and \
900 output_sgn != input_sgn[0] else 0
901
902 # OV (32-bit)
903 input32_sgn = [exts(x.value, 32) < 0 for x in inputs]
904 output32_sgn = exts(output.value, 32) < 0
905 ov32 = 1 if input32_sgn[0] == input32_sgn[1] and \
906 output32_sgn != input32_sgn[0] else 0
907
908 self.spr['XER'][XER_bits['OV']] = ov
909 self.spr['XER'][XER_bits['OV32']] = ov32
910 so = self.spr['XER'][XER_bits['SO']]
911 so = so | ov
912 self.spr['XER'][XER_bits['SO']] = so
913
914 def handle_comparison(self, outputs, cr_idx=0):
915 out = outputs[0]
916 assert isinstance(out, SelectableInt), \
917 "out zero not a SelectableInt %s" % repr(outputs)
918 log("handle_comparison", out.bits, hex(out.value))
919 # TODO - XXX *processor* in 32-bit mode
920 # https://bugs.libre-soc.org/show_bug.cgi?id=424
921 # if is_32bit:
922 # o32 = exts(out.value, 32)
923 # print ("handle_comparison exts 32 bit", hex(o32))
924 out = exts(out.value, out.bits)
925 log("handle_comparison exts", hex(out))
926 zero = SelectableInt(out == 0, 1)
927 positive = SelectableInt(out > 0, 1)
928 negative = SelectableInt(out < 0, 1)
929 SO = self.spr['XER'][XER_bits['SO']]
930 log("handle_comparison SO", SO)
931 cr_field = selectconcat(negative, positive, zero, SO)
932 log("handle_comparison cr_field", self.cr, cr_idx, cr_field)
933 self.crl[cr_idx].eq(cr_field)
934
935 def set_pc(self, pc_val):
936 self.namespace['NIA'] = SelectableInt(pc_val, 64)
937 self.pc.update(self.namespace, self.is_svp64_mode)
938
939 def get_next_insn(self):
940 """check instruction
941 """
942 if self.respect_pc:
943 pc = self.pc.CIA.value
944 else:
945 pc = self.fake_pc
946 ins = self.imem.ld(pc, 4, False, True, instr_fetch=True)
947 if ins is None:
948 raise KeyError("no instruction at 0x%x" % pc)
949 return pc, ins
950
951 def setup_one(self):
952 """set up one instruction
953 """
954 pc, insn = self.get_next_insn()
955 yield from self.setup_next_insn(pc, insn)
956
957 def setup_next_insn(self, pc, ins):
958 """set up next instruction
959 """
960 self._pc = pc
961 log("setup: 0x%x 0x%x %s" % (pc, ins & 0xffffffff, bin(ins)))
962 log("CIA NIA", self.respect_pc, self.pc.CIA.value, self.pc.NIA.value)
963
964 yield self.dec2.sv_rm.eq(0)
965 yield self.dec2.dec.raw_opcode_in.eq(ins & 0xffffffff)
966 yield self.dec2.dec.bigendian.eq(self.bigendian)
967 yield self.dec2.state.msr.eq(self.msr.value)
968 yield self.dec2.state.pc.eq(pc)
969 if self.svstate is not None:
970 yield self.dec2.state.svstate.eq(self.svstate.value)
971
972 # SVP64. first, check if the opcode is EXT001, and SVP64 id bits set
973 yield Settle()
974 opcode = yield self.dec2.dec.opcode_in
975 pfx = SVP64PrefixFields() # TODO should probably use SVP64PrefixDecoder
976 pfx.insn.value = opcode
977 major = pfx.major.asint(msb0=True) # MSB0 inversion
978 log ("prefix test: opcode:", major, bin(major),
979 pfx.insn[7] == 0b1, pfx.insn[9] == 0b1)
980 self.is_svp64_mode = ((major == 0b000001) and
981 pfx.insn[7].value == 0b1 and
982 pfx.insn[9].value == 0b1)
983 self.pc.update_nia(self.is_svp64_mode)
984 yield self.dec2.is_svp64_mode.eq(self.is_svp64_mode) # set SVP64 decode
985 self.namespace['NIA'] = self.pc.NIA
986 self.namespace['SVSTATE'] = self.svstate
987 if not self.is_svp64_mode:
988 return
989
990 # in SVP64 mode. decode/print out svp64 prefix, get v3.0B instruction
991 log ("svp64.rm", bin(pfx.rm.asint(msb0=True)))
992 log (" svstate.vl", self.svstate.vl)
993 log (" svstate.mvl", self.svstate.maxvl)
994 sv_rm = pfx.rm.asint(msb0=True)
995 ins = self.imem.ld(pc+4, 4, False, True, instr_fetch=True)
996 log(" svsetup: 0x%x 0x%x %s" % (pc+4, ins & 0xffffffff, bin(ins)))
997 yield self.dec2.dec.raw_opcode_in.eq(ins & 0xffffffff) # v3.0B suffix
998 yield self.dec2.sv_rm.eq(sv_rm) # svp64 prefix
999 yield Settle()
1000
1001 def execute_one(self):
1002 """execute one instruction
1003 """
1004 # get the disassembly code for this instruction
1005 if self.is_svp64_mode:
1006 if not self.disassembly:
1007 code = yield from self.get_assembly_name()
1008 else:
1009 code = self.disassembly[self._pc+4]
1010 log(" svp64 sim-execute", hex(self._pc), code)
1011 else:
1012 if not self.disassembly:
1013 code = yield from self.get_assembly_name()
1014 else:
1015 code = self.disassembly[self._pc]
1016 log("sim-execute", hex(self._pc), code)
1017 opname = code.split(' ')[0]
1018 try:
1019 yield from self.call(opname) # execute the instruction
1020 except MemException as e: # check for memory errors
1021 if e.args[0] != 'unaligned': # only doing aligned at the mo
1022 raise e # ... re-raise
1023 # run a Trap but set DAR first
1024 print ("memory unaligned exception, DAR", e.dar)
1025 self.spr['DAR'] = SelectableInt(e.dar, 64)
1026 self.call_trap(0x600, PIb.PRIV) # 0x600, privileged
1027 return
1028
1029 # don't use this except in special circumstances
1030 if not self.respect_pc:
1031 self.fake_pc += 4
1032
1033 log("execute one, CIA NIA", hex(self.pc.CIA.value),
1034 hex(self.pc.NIA.value))
1035
1036 def get_assembly_name(self):
1037 # TODO, asmregs is from the spec, e.g. add RT,RA,RB
1038 # see http://bugs.libre-riscv.org/show_bug.cgi?id=282
1039 dec_insn = yield self.dec2.e.do.insn
1040 insn_1_11 = yield self.dec2.e.do.insn[1:11]
1041 asmcode = yield self.dec2.dec.op.asmcode
1042 int_op = yield self.dec2.dec.op.internal_op
1043 log("get assembly name asmcode", asmcode, int_op,
1044 hex(dec_insn), bin(insn_1_11))
1045 asmop = insns.get(asmcode, None)
1046
1047 # sigh reconstruct the assembly instruction name
1048 if hasattr(self.dec2.e.do, "oe"):
1049 ov_en = yield self.dec2.e.do.oe.oe
1050 ov_ok = yield self.dec2.e.do.oe.ok
1051 else:
1052 ov_en = False
1053 ov_ok = False
1054 if hasattr(self.dec2.e.do, "rc"):
1055 rc_en = yield self.dec2.e.do.rc.rc
1056 rc_ok = yield self.dec2.e.do.rc.ok
1057 else:
1058 rc_en = False
1059 rc_ok = False
1060 # grrrr have to special-case MUL op (see DecodeOE)
1061 log("ov %d en %d rc %d en %d op %d" %
1062 (ov_ok, ov_en, rc_ok, rc_en, int_op))
1063 if int_op in [MicrOp.OP_MUL_H64.value, MicrOp.OP_MUL_H32.value]:
1064 log("mul op")
1065 if rc_en & rc_ok:
1066 asmop += "."
1067 else:
1068 if not asmop.endswith("."): # don't add "." to "andis."
1069 if rc_en & rc_ok:
1070 asmop += "."
1071 if hasattr(self.dec2.e.do, "lk"):
1072 lk = yield self.dec2.e.do.lk
1073 if lk:
1074 asmop += "l"
1075 log("int_op", int_op)
1076 if int_op in [MicrOp.OP_B.value, MicrOp.OP_BC.value]:
1077 AA = yield self.dec2.dec.fields.FormI.AA[0:-1]
1078 log("AA", AA)
1079 if AA:
1080 asmop += "a"
1081 spr_msb = yield from self.get_spr_msb()
1082 if int_op == MicrOp.OP_MFCR.value:
1083 if spr_msb:
1084 asmop = 'mfocrf'
1085 else:
1086 asmop = 'mfcr'
1087 # XXX TODO: for whatever weird reason this doesn't work
1088 # https://bugs.libre-soc.org/show_bug.cgi?id=390
1089 if int_op == MicrOp.OP_MTCRF.value:
1090 if spr_msb:
1091 asmop = 'mtocrf'
1092 else:
1093 asmop = 'mtcrf'
1094 return asmop
1095
1096 def get_remap_indices(self):
1097 """WARNING, this function stores remap_idxs and remap_loopends
1098 in the class for later use. this to avoid problems with yield
1099 """
1100 # go through all iterators in lock-step, advance to next remap_idx
1101 srcstep, dststep = self.get_src_dststeps()
1102 # get four SVSHAPEs. here we are hard-coding
1103 SVSHAPE0 = self.spr['SVSHAPE0']
1104 SVSHAPE1 = self.spr['SVSHAPE1']
1105 SVSHAPE2 = self.spr['SVSHAPE2']
1106 SVSHAPE3 = self.spr['SVSHAPE3']
1107 # set up the iterators
1108 remaps = [(SVSHAPE0, SVSHAPE0.get_iterator()),
1109 (SVSHAPE1, SVSHAPE1.get_iterator()),
1110 (SVSHAPE2, SVSHAPE2.get_iterator()),
1111 (SVSHAPE3, SVSHAPE3.get_iterator()),
1112 ]
1113
1114 self.remap_loopends = [0] * 4
1115 self.remap_idxs = [0, 1, 2, 3]
1116 dbg = []
1117 for i, (shape, remap) in enumerate(remaps):
1118 # zero is "disabled"
1119 if shape.value == 0x0:
1120 self.remap_idxs[i] = 0
1121 # pick src or dststep depending on reg num (0-2=in, 3-4=out)
1122 step = dststep if (i in [3, 4]) else srcstep
1123 # this is terrible. O(N^2) looking for the match. but hey.
1124 for idx, (remap_idx, loopends) in enumerate(remap):
1125 if idx == step:
1126 break
1127 self.remap_idxs[i] = remap_idx
1128 self.remap_loopends[i] = loopends
1129 dbg.append((i, step, remap_idx, loopends))
1130 for (i, step, remap_idx, loopends) in dbg:
1131 log ("SVSHAPE %d idx, end" % i, step, remap_idx, bin(loopends))
1132 return remaps
1133
1134 def get_spr_msb(self):
1135 dec_insn = yield self.dec2.e.do.insn
1136 return dec_insn & (1 << 20) != 0 # sigh - XFF.spr[-1]?
1137
1138 def call(self, name):
1139 """call(opcode) - the primary execution point for instructions
1140 """
1141 self.last_st_addr = None # reset the last known store address
1142 self.last_ld_addr = None # etc.
1143
1144 ins_name = name.strip() # remove spaces if not already done so
1145 if self.halted:
1146 log("halted - not executing", ins_name)
1147 return
1148
1149 # TODO, asmregs is from the spec, e.g. add RT,RA,RB
1150 # see http://bugs.libre-riscv.org/show_bug.cgi?id=282
1151 asmop = yield from self.get_assembly_name()
1152 log("call", ins_name, asmop)
1153
1154 # check privileged
1155 int_op = yield self.dec2.dec.op.internal_op
1156 spr_msb = yield from self.get_spr_msb()
1157
1158 instr_is_privileged = False
1159 if int_op in [MicrOp.OP_ATTN.value,
1160 MicrOp.OP_MFMSR.value,
1161 MicrOp.OP_MTMSR.value,
1162 MicrOp.OP_MTMSRD.value,
1163 # TODO: OP_TLBIE
1164 MicrOp.OP_RFID.value]:
1165 instr_is_privileged = True
1166 if int_op in [MicrOp.OP_MFSPR.value,
1167 MicrOp.OP_MTSPR.value] and spr_msb:
1168 instr_is_privileged = True
1169
1170 log("is priv", instr_is_privileged, hex(self.msr.value),
1171 self.msr[MSRb.PR])
1172 # check MSR priv bit and whether op is privileged: if so, throw trap
1173 if instr_is_privileged and self.msr[MSRb.PR] == 1:
1174 self.call_trap(0x700, PIb.PRIV)
1175 return
1176
1177 # check halted condition
1178 if ins_name == 'attn':
1179 self.halted = True
1180 return
1181
1182 # check illegal instruction
1183 illegal = False
1184 if ins_name not in ['mtcrf', 'mtocrf']:
1185 illegal = ins_name != asmop
1186
1187 # sigh deal with setvl not being supported by binutils (.long)
1188 if asmop.startswith('setvl'):
1189 illegal = False
1190 ins_name = 'setvl'
1191
1192 # and svstep not being supported by binutils (.long)
1193 if asmop.startswith('svstep'):
1194 illegal = False
1195 ins_name = 'svstep'
1196
1197 # and svremap not being supported by binutils (.long)
1198 if asmop.startswith('svremap'):
1199 illegal = False
1200 ins_name = 'svremap'
1201
1202 # and svshape not being supported by binutils (.long)
1203 if asmop.startswith('svshape'):
1204 illegal = False
1205 ins_name = 'svshape'
1206
1207 # and fsin and fcos
1208 if asmop == 'fsins':
1209 illegal = False
1210 ins_name = 'fsins'
1211 if asmop == 'fcoss':
1212 illegal = False
1213 ins_name = 'fcoss'
1214
1215 # sigh also deal with ffmadds not being supported by binutils (.long)
1216 if asmop == 'ffmadds':
1217 illegal = False
1218 ins_name = 'ffmadds'
1219
1220 # and fdmadds not being supported by binutils (.long)
1221 if asmop == 'fdmadds':
1222 illegal = False
1223 ins_name = 'fdmadds'
1224
1225 # and ffadds not being supported by binutils (.long)
1226 if asmop == 'ffadds':
1227 illegal = False
1228 ins_name = 'ffadds'
1229
1230 # branch-conditional redirects to sv.bc
1231 if asmop.startswith('bc') and self.is_svp64_mode:
1232 ins_name = 'sv.%s' % ins_name
1233
1234 log(" post-processed name", ins_name, asmop)
1235
1236 # illegal instructions call TRAP at 0x700
1237 if illegal:
1238 print("illegal", ins_name, asmop)
1239 self.call_trap(0x700, PIb.ILLEG)
1240 print("name %s != %s - calling ILLEGAL trap, PC: %x" %
1241 (ins_name, asmop, self.pc.CIA.value))
1242 return
1243
1244 # this is for setvl "Vertical" mode: if set true,
1245 # srcstep/dststep is explicitly advanced. mode says which SVSTATE to
1246 # test for Rc=1 end condition. 3 bits of all 3 loops are put into CR0
1247 self.allow_next_step_inc = False
1248 self.svstate_next_mode = 0
1249
1250 # nop has to be supported, we could let the actual op calculate
1251 # but PowerDecoder has a pattern for nop
1252 if ins_name is 'nop':
1253 self.update_pc_next()
1254 return
1255
1256 # look up instruction in ISA.instrs, prepare namespace
1257 info = self.instrs[ins_name]
1258 yield from self.prep_namespace(ins_name, info.form, info.op_fields)
1259
1260 # preserve order of register names
1261 input_names = create_args(list(info.read_regs) +
1262 list(info.uninit_regs))
1263 log("input names", input_names)
1264
1265 # get SVP64 entry for the current instruction
1266 sv_rm = self.svp64rm.instrs.get(ins_name)
1267 if sv_rm is not None:
1268 dest_cr, src_cr, src_byname, dest_byname = decode_extra(sv_rm)
1269 else:
1270 dest_cr, src_cr, src_byname, dest_byname = False, False, {}, {}
1271 log ("sv rm", sv_rm, dest_cr, src_cr, src_byname, dest_byname)
1272
1273 # see if srcstep/dststep need skipping over masked-out predicate bits
1274 if (self.is_svp64_mode or ins_name == 'setvl' or
1275 ins_name in ['svremap', 'svstate']):
1276 yield from self.svstate_pre_inc()
1277 if self.is_svp64_mode:
1278 pre = yield from self.update_new_svstate_steps()
1279 if pre:
1280 self.svp64_reset_loop()
1281 self.update_nia()
1282 self.update_pc_next()
1283 return
1284 srcstep, dststep = self.get_src_dststeps()
1285 pred_dst_zero = self.pred_dst_zero
1286 pred_src_zero = self.pred_src_zero
1287 vl = self.svstate.vl
1288
1289 # VL=0 in SVP64 mode means "do nothing: skip instruction"
1290 if self.is_svp64_mode and vl == 0:
1291 self.pc.update(self.namespace, self.is_svp64_mode)
1292 log("SVP64: VL=0, end of call", self.namespace['CIA'],
1293 self.namespace['NIA'])
1294 return
1295
1296 # for when SVREMAP is active, using pre-arranged schedule.
1297 # note: modifying PowerDecoder2 needs to "settle"
1298 remap_en = self.svstate.SVme
1299 persist = self.svstate.RMpst
1300 active = (persist or self.last_op_svshape) and remap_en != 0
1301 yield self.dec2.remap_active.eq(remap_en if active else 0)
1302 yield Settle()
1303 if persist or self.last_op_svshape:
1304 remaps = self.get_remap_indices()
1305 if self.is_svp64_mode and (persist or self.last_op_svshape):
1306 # just some convenient debug info
1307 for i in range(4):
1308 sname = 'SVSHAPE%d' % i
1309 shape = self.spr[sname]
1310 log (sname, bin(shape.value))
1311 log (" lims", shape.lims)
1312 log (" mode", shape.mode)
1313 log (" skip", shape.skip)
1314
1315 # set up the list of steps to remap
1316 mi0 = self.svstate.mi0
1317 mi1 = self.svstate.mi1
1318 mi2 = self.svstate.mi2
1319 mo0 = self.svstate.mo0
1320 mo1 = self.svstate.mo1
1321 steps = [(self.dec2.in1_step, mi0), # RA
1322 (self.dec2.in2_step, mi1), # RB
1323 (self.dec2.in3_step, mi2), # RC
1324 (self.dec2.o_step, mo0), # RT
1325 (self.dec2.o2_step, mo1), # EA
1326 ]
1327 remap_idxs = self.remap_idxs
1328 rremaps = []
1329 # now cross-index the required SHAPE for each of 3-in 2-out regs
1330 rnames = ['RA', 'RB', 'RC', 'RT', 'EA']
1331 for i, (dstep, shape_idx) in enumerate(steps):
1332 (shape, remap) = remaps[shape_idx]
1333 remap_idx = remap_idxs[shape_idx]
1334 # zero is "disabled"
1335 if shape.value == 0x0:
1336 continue
1337 # now set the actual requested step to the current index
1338 yield dstep.eq(remap_idx)
1339
1340 # debug printout info
1341 rremaps.append((shape.mode, i, rnames[i], shape_idx,
1342 remap_idx))
1343 for x in rremaps:
1344 log ("shape remap", x)
1345 # after that, settle down (combinatorial) to let Vector reg numbers
1346 # work themselves out
1347 yield Settle()
1348 remap_active = yield self.dec2.remap_active
1349 log ("remap active", bin(remap_active))
1350
1351 # main input registers (RT, RA ...)
1352 inputs = []
1353 for name in input_names:
1354 # using PowerDecoder2, first, find the decoder index.
1355 # (mapping name RA RB RC RS to in1, in2, in3)
1356 regnum, is_vec = yield from get_pdecode_idx_in(self.dec2, name)
1357 if regnum is None:
1358 # doing this is not part of svp64, it's because output
1359 # registers, to be modified, need to be in the namespace.
1360 regnum, is_vec = yield from get_pdecode_idx_out(self.dec2, name)
1361 if regnum is None:
1362 regnum, is_vec = yield from get_pdecode_idx_out2(self.dec2,
1363 name)
1364
1365 # in case getting the register number is needed, _RA, _RB
1366 regname = "_" + name
1367 self.namespace[regname] = regnum
1368 if not self.is_svp64_mode or not pred_src_zero:
1369 log('reading reg %s %s' % (name, str(regnum)), is_vec)
1370 if name in fregs:
1371 reg_val = SelectableInt(self.fpr(regnum))
1372 elif name is not None:
1373 reg_val = SelectableInt(self.gpr(regnum))
1374 else:
1375 log('zero input reg %s %s' % (name, str(regnum)), is_vec)
1376 reg_val = 0
1377 inputs.append(reg_val)
1378 # arrrrgh, awful hack, to get _RT into namespace
1379 if ins_name in ['setvl', 'svstep']:
1380 regname = "_RT"
1381 RT = yield self.dec2.dec.RT
1382 self.namespace[regname] = SelectableInt(RT, 5)
1383 if RT == 0:
1384 self.namespace["RT"] = SelectableInt(0, 5)
1385 regnum, is_vec = yield from get_pdecode_idx_out(self.dec2, "RT")
1386 log('hack input reg %s %s' % (name, str(regnum)), is_vec)
1387
1388 # in SVP64 mode for LD/ST work out immediate
1389 # XXX TODO: replace_ds for DS-Form rather than D-Form.
1390 # use info.form to detect
1391 replace_d = False # update / replace constant in pseudocode
1392 if self.is_svp64_mode:
1393 ldstmode = yield self.dec2.rm_dec.ldstmode
1394 # shift mode reads SVD (or SVDS - TODO)
1395 # *BUT*... because this is "overloading" of LD operations,
1396 # it gets *STORED* into D (or DS, TODO)
1397 if ldstmode == SVP64LDSTmode.SHIFT.value:
1398 imm = yield self.dec2.dec.fields.FormSVD.SVD[0:11]
1399 imm = exts(imm, 11) # sign-extend to integer
1400 log ("shift SVD", imm)
1401 replace_d = True
1402 else:
1403 if info.form == 'DS':
1404 # DS-Form, multiply by 4 then knock 2 bits off after
1405 imm = yield self.dec2.dec.fields.FormDS.DS[0:14] * 4
1406 else:
1407 imm = yield self.dec2.dec.fields.FormD.D[0:16]
1408 imm = exts(imm, 16) # sign-extend to integer
1409 # get the right step. LD is from srcstep, ST is dststep
1410 op = yield self.dec2.e.do.insn_type
1411 offsmul = 0
1412 if op == MicrOp.OP_LOAD.value:
1413 if remap_active:
1414 offsmul = yield self.dec2.in1_step
1415 log("D-field REMAP src", imm, offsmul)
1416 else:
1417 offsmul = srcstep
1418 log("D-field src", imm, offsmul)
1419 elif op == MicrOp.OP_STORE.value:
1420 # XXX NOTE! no bit-reversed STORE! this should not ever be used
1421 offsmul = dststep
1422 log("D-field dst", imm, offsmul)
1423 # bit-reverse mode, rev already done through get_src_dst_steps()
1424 if ldstmode == SVP64LDSTmode.SHIFT.value:
1425 # manually look up RC, sigh
1426 RC = yield self.dec2.dec.RC[0:5]
1427 RC = self.gpr(RC)
1428 log ("LD-SHIFT:", "VL", vl,
1429 "RC", RC.value, "imm", imm,
1430 "offs", bin(offsmul),
1431 )
1432 imm = SelectableInt((imm * offsmul) << RC.value, 32)
1433 # Unit-Strided LD/ST adds offset*width to immediate
1434 elif ldstmode == SVP64LDSTmode.UNITSTRIDE.value:
1435 ldst_len = yield self.dec2.e.do.data_len
1436 imm = SelectableInt(imm + offsmul * ldst_len, 32)
1437 replace_d = True
1438 # Element-strided multiplies the immediate by element step
1439 elif ldstmode == SVP64LDSTmode.ELSTRIDE.value:
1440 imm = SelectableInt(imm * offsmul, 32)
1441 replace_d = True
1442 if replace_d:
1443 ldst_ra_vec = yield self.dec2.rm_dec.ldst_ra_vec
1444 ldst_imz_in = yield self.dec2.rm_dec.ldst_imz_in
1445 log("LDSTmode", SVP64LDSTmode(ldstmode),
1446 offsmul, imm, ldst_ra_vec, ldst_imz_in)
1447 # new replacement D... errr.. DS
1448 if replace_d:
1449 if info.form == 'DS':
1450 # TODO: assert 2 LSBs are zero?
1451 log("DS-Form, TODO, assert 2 LSBs zero?", bin(imm.value))
1452 imm.value = imm.value >> 2
1453 self.namespace['DS'] = imm
1454 else:
1455 self.namespace['D'] = imm
1456
1457 # "special" registers
1458 for special in info.special_regs:
1459 if special in special_sprs:
1460 inputs.append(self.spr[special])
1461 else:
1462 inputs.append(self.namespace[special])
1463
1464 # clear trap (trap) NIA
1465 self.trap_nia = None
1466
1467 # check if this was an sv.bc* and create an indicator that
1468 # this is the last check to be made as a loop. combined with
1469 # the ALL/ANY mode we can early-exit
1470 if self.is_svp64_mode and ins_name.startswith("sv.bc"):
1471 no_in_vec = yield self.dec2.no_in_vec # BI is scalar
1472 end_loop = no_in_vec or srcstep == vl-1 or dststep == vl-1
1473 self.namespace['end_loop'] = SelectableInt(end_loop, 1)
1474
1475 # execute actual instruction here (finally)
1476 log("inputs", inputs)
1477 results = info.func(self, *inputs)
1478 log("results", results)
1479
1480 # "inject" decorator takes namespace from function locals: we need to
1481 # overwrite NIA being overwritten (sigh)
1482 if self.trap_nia is not None:
1483 self.namespace['NIA'] = self.trap_nia
1484
1485 log("after func", self.namespace['CIA'], self.namespace['NIA'])
1486
1487 # check if op was a LD/ST so that debugging can check the
1488 # address
1489 if int_op in [MicrOp.OP_STORE.value,
1490 ]:
1491 self.last_st_addr = self.mem.last_st_addr
1492 if int_op in [MicrOp.OP_LOAD.value,
1493 ]:
1494 self.last_ld_addr = self.mem.last_ld_addr
1495 log ("op", int_op, MicrOp.OP_STORE.value, MicrOp.OP_LOAD.value,
1496 self.last_st_addr, self.last_ld_addr)
1497
1498 # detect if CA/CA32 already in outputs (sra*, basically)
1499 already_done = 0
1500 if info.write_regs:
1501 output_names = create_args(info.write_regs)
1502 for name in output_names:
1503 if name == 'CA':
1504 already_done |= 1
1505 if name == 'CA32':
1506 already_done |= 2
1507
1508 log("carry already done?", bin(already_done))
1509 if hasattr(self.dec2.e.do, "output_carry"):
1510 carry_en = yield self.dec2.e.do.output_carry
1511 else:
1512 carry_en = False
1513 if carry_en:
1514 yield from self.handle_carry_(inputs, results, already_done)
1515
1516 if not self.is_svp64_mode: # yeah just no. not in parallel processing
1517 # detect if overflow was in return result
1518 overflow = None
1519 if info.write_regs:
1520 for name, output in zip(output_names, results):
1521 if name == 'overflow':
1522 overflow = output
1523
1524 if hasattr(self.dec2.e.do, "oe"):
1525 ov_en = yield self.dec2.e.do.oe.oe
1526 ov_ok = yield self.dec2.e.do.oe.ok
1527 else:
1528 ov_en = False
1529 ov_ok = False
1530 log("internal overflow", overflow, ov_en, ov_ok)
1531 if ov_en & ov_ok:
1532 yield from self.handle_overflow(inputs, results, overflow)
1533
1534 # only do SVP64 dest predicated Rc=1 if dest-pred is not enabled
1535 rc_en = False
1536 if not self.is_svp64_mode or not pred_dst_zero:
1537 if hasattr(self.dec2.e.do, "rc"):
1538 rc_en = yield self.dec2.e.do.rc.rc
1539 if rc_en and ins_name not in ['svstep']:
1540 regnum, is_vec = yield from get_pdecode_cr_out(self.dec2, "CR0")
1541 self.handle_comparison(results, regnum)
1542
1543 # any modified return results?
1544 if info.write_regs:
1545 for name, output in zip(output_names, results):
1546 if name == 'overflow': # ignore, done already (above)
1547 continue
1548 if isinstance(output, int):
1549 output = SelectableInt(output, 256)
1550 if name in ['CA', 'CA32']:
1551 if carry_en:
1552 log("writing %s to XER" % name, output)
1553 self.spr['XER'][XER_bits[name]] = output.value
1554 else:
1555 log("NOT writing %s to XER" % name, output)
1556 elif name in info.special_regs:
1557 log('writing special %s' % name, output, special_sprs)
1558 if name in special_sprs:
1559 self.spr[name] = output
1560 else:
1561 self.namespace[name].eq(output)
1562 if name == 'MSR':
1563 log('msr written', hex(self.msr.value))
1564 else:
1565 regnum, is_vec = yield from get_pdecode_idx_out(self.dec2,
1566 name)
1567 if regnum is None:
1568 regnum, is_vec = yield from get_pdecode_idx_out2(
1569 self.dec2, name)
1570 if regnum is None:
1571 # temporary hack for not having 2nd output
1572 regnum = yield getattr(self.decoder, name)
1573 is_vec = False
1574 if self.is_svp64_mode and pred_dst_zero:
1575 log('zeroing reg %d %s' % (regnum, str(output)),
1576 is_vec)
1577 output = SelectableInt(0, 256)
1578 else:
1579 if name in fregs:
1580 ftype = 'fpr'
1581 else:
1582 ftype = 'gpr'
1583 log('writing %s %s %s' % (ftype, regnum, str(output)),
1584 is_vec)
1585 if output.bits > 64:
1586 output = SelectableInt(output.value, 64)
1587 if name in fregs:
1588 self.fpr[regnum] = output
1589 else:
1590 self.gpr[regnum] = output
1591
1592 # check if it is the SVSTATE.src/dest step that needs incrementing
1593 # this is our Sub-Program-Counter loop from 0 to VL-1
1594 pre = False
1595 post = False
1596 nia_update = True
1597 if self.allow_next_step_inc:
1598 log("SVSTATE_NEXT: inc requested, mode",
1599 self.svstate_next_mode, self.allow_next_step_inc)
1600 yield from self.svstate_pre_inc()
1601 pre = yield from self.update_new_svstate_steps()
1602 if pre:
1603 # reset at end of loop including exit Vertical Mode
1604 log ("SVSTATE_NEXT: end of loop, reset")
1605 self.svp64_reset_loop()
1606 self.svstate.vfirst = 0
1607 self.update_nia()
1608 if rc_en:
1609 results = [SelectableInt(0, 64)]
1610 self.handle_comparison(results) # CR0
1611 else:
1612 if self.allow_next_step_inc == 2:
1613 log ("SVSTATE_NEXT: read")
1614 nia_update = (yield from self.svstate_post_inc(ins_name))
1615 else:
1616 log ("SVSTATE_NEXT: post-inc")
1617 # use actual src/dst-step here to check end, do NOT
1618 # use bit-reversed version
1619 srcstep, dststep = self.new_srcstep, self.new_dststep
1620 remaps = self.get_remap_indices()
1621 remap_idxs = self.remap_idxs
1622 vl = self.svstate.vl
1623 end_src = srcstep == vl-1
1624 end_dst = dststep == vl-1
1625 if self.allow_next_step_inc != 2:
1626 if not end_src:
1627 self.svstate.srcstep += SelectableInt(1, 7)
1628 if not end_dst:
1629 self.svstate.dststep += SelectableInt(1, 7)
1630 self.namespace['SVSTATE'] = self.svstate.spr
1631 # set CR0 (if Rc=1) based on end
1632 if rc_en:
1633 srcstep = self.svstate.srcstep
1634 dststep = self.svstate.srcstep
1635 endtest = 1 if (end_src or end_dst) else 0
1636 #results = [SelectableInt(endtest, 64)]
1637 #self.handle_comparison(results) # CR0
1638
1639 # see if svstep was requested, if so, which SVSTATE
1640 endings = 0b111
1641 if self.svstate_next_mode > 0:
1642 shape_idx = self.svstate_next_mode.value-1
1643 endings = self.remap_loopends[shape_idx]
1644 cr_field = SelectableInt((~endings)<<1 | endtest, 4)
1645 print ("svstep Rc=1, CR0", cr_field)
1646 self.crl[0].eq(cr_field) # CR0
1647 if end_src or end_dst:
1648 # reset at end of loop including exit Vertical Mode
1649 log ("SVSTATE_NEXT: after increments, reset")
1650 self.svp64_reset_loop()
1651 self.svstate.vfirst = 0
1652
1653 elif self.is_svp64_mode:
1654 nia_update = (yield from self.svstate_post_inc(ins_name))
1655 else:
1656 # XXX only in non-SVP64 mode!
1657 # record state of whether the current operation was an svshape,
1658 # to be able to know if it should apply in the next instruction.
1659 # also (if going to use this instruction) should disable ability
1660 # to interrupt in between. sigh.
1661 self.last_op_svshape = asmop == 'svremap'
1662
1663 if nia_update:
1664 self.update_pc_next()
1665
1666 def SVSTATE_NEXT(self, mode, submode):
1667 """explicitly moves srcstep/dststep on to next element, for
1668 "Vertical-First" mode. this function is called from
1669 setvl pseudo-code, as a pseudo-op "svstep"
1670
1671 WARNING: this function uses information that was created EARLIER
1672 due to it being in the middle of a yield, but this function is
1673 *NOT* called from yield (it's called from compiled pseudocode).
1674 """
1675 self.allow_next_step_inc = submode.value + 1
1676 log("SVSTATE_NEXT mode", mode, submode, self.allow_next_step_inc)
1677 self.svstate_next_mode = mode
1678 if self.svstate_next_mode > 0:
1679 shape_idx = self.svstate_next_mode.value-1
1680 return SelectableInt(self.remap_idxs[shape_idx], 7)
1681 return SelectableInt(0, 7)
1682
1683 def svstate_pre_inc(self):
1684 """check if srcstep/dststep need to skip over masked-out predicate bits
1685 """
1686 # get SVSTATE VL (oh and print out some debug stuff)
1687 vl = self.svstate.vl
1688 srcstep = self.svstate.srcstep
1689 dststep = self.svstate.dststep
1690 sv_a_nz = yield self.dec2.sv_a_nz
1691 fft_mode = yield self.dec2.use_svp64_fft
1692 in1 = yield self.dec2.e.read_reg1.data
1693 log ("SVP64: VL, srcstep, dststep, sv_a_nz, in1 fft, svp64",
1694 vl, srcstep, dststep, sv_a_nz, in1, fft_mode,
1695 self.is_svp64_mode)
1696
1697 # get predicate mask
1698 srcmask = dstmask = 0xffff_ffff_ffff_ffff
1699
1700 pmode = yield self.dec2.rm_dec.predmode
1701 reverse_gear = yield self.dec2.rm_dec.reverse_gear
1702 sv_ptype = yield self.dec2.dec.op.SV_Ptype
1703 srcpred = yield self.dec2.rm_dec.srcpred
1704 dstpred = yield self.dec2.rm_dec.dstpred
1705 pred_src_zero = yield self.dec2.rm_dec.pred_sz
1706 pred_dst_zero = yield self.dec2.rm_dec.pred_dz
1707 if pmode == SVP64PredMode.INT.value:
1708 srcmask = dstmask = get_predint(self.gpr, dstpred)
1709 if sv_ptype == SVPtype.P2.value:
1710 srcmask = get_predint(self.gpr, srcpred)
1711 elif pmode == SVP64PredMode.CR.value:
1712 srcmask = dstmask = get_predcr(self.crl, dstpred, vl)
1713 if sv_ptype == SVPtype.P2.value:
1714 srcmask = get_predcr(self.crl, srcpred, vl)
1715 log (" pmode", pmode)
1716 log (" reverse", reverse_gear)
1717 log (" ptype", sv_ptype)
1718 log (" srcpred", bin(srcpred))
1719 log (" dstpred", bin(dstpred))
1720 log (" srcmask", bin(srcmask))
1721 log (" dstmask", bin(dstmask))
1722 log (" pred_sz", bin(pred_src_zero))
1723 log (" pred_dz", bin(pred_dst_zero))
1724
1725 # okaaay, so here we simply advance srcstep (TODO dststep)
1726 # until the predicate mask has a "1" bit... or we run out of VL
1727 # let srcstep==VL be the indicator to move to next instruction
1728 if not pred_src_zero:
1729 while (((1<<srcstep) & srcmask) == 0) and (srcstep != vl):
1730 log (" skip", bin(1<<srcstep))
1731 srcstep += 1
1732 # same for dststep
1733 if not pred_dst_zero:
1734 while (((1<<dststep) & dstmask) == 0) and (dststep != vl):
1735 log (" skip", bin(1<<dststep))
1736 dststep += 1
1737
1738 # now work out if the relevant mask bits require zeroing
1739 if pred_dst_zero:
1740 pred_dst_zero = ((1<<dststep) & dstmask) == 0
1741 if pred_src_zero:
1742 pred_src_zero = ((1<<srcstep) & srcmask) == 0
1743
1744 # store new srcstep / dststep
1745 self.new_srcstep, self.new_dststep = srcstep, dststep
1746 self.pred_dst_zero, self.pred_src_zero = pred_dst_zero, pred_src_zero
1747 log (" new srcstep", srcstep)
1748 log (" new dststep", dststep)
1749
1750 def get_src_dststeps(self):
1751 """gets srcstep and dststep
1752 """
1753 return self.new_srcstep, self.new_dststep
1754
1755 def update_new_svstate_steps(self):
1756 # note, do not get the bit-reversed srcstep here!
1757 srcstep, dststep = self.new_srcstep, self.new_dststep
1758
1759 # update SVSTATE with new srcstep
1760 self.svstate.srcstep = srcstep
1761 self.svstate.dststep = dststep
1762 self.namespace['SVSTATE'] = self.svstate
1763 yield self.dec2.state.svstate.eq(self.svstate.value)
1764 yield Settle() # let decoder update
1765 srcstep = self.svstate.srcstep
1766 dststep = self.svstate.dststep
1767 vl = self.svstate.vl
1768 log (" srcstep", srcstep)
1769 log (" dststep", dststep)
1770 log (" vl", vl)
1771
1772 # check if end reached (we let srcstep overrun, above)
1773 # nothing needs doing (TODO zeroing): just do next instruction
1774 return srcstep == vl or dststep == vl
1775
1776 def svstate_post_inc(self, insn_name, vf=0):
1777 # check if SV "Vertical First" mode is enabled
1778 vfirst = self.svstate.vfirst
1779 log (" SV Vertical First", vf, vfirst)
1780 if not vf and vfirst == 1:
1781 self.update_nia()
1782 return True
1783
1784 # check if it is the SVSTATE.src/dest step that needs incrementing
1785 # this is our Sub-Program-Counter loop from 0 to VL-1
1786 # XXX twin predication TODO
1787 vl = self.svstate.vl
1788 mvl = self.svstate.maxvl
1789 srcstep = self.svstate.srcstep
1790 dststep = self.svstate.dststep
1791 rm_mode = yield self.dec2.rm_dec.mode
1792 reverse_gear = yield self.dec2.rm_dec.reverse_gear
1793 sv_ptype = yield self.dec2.dec.op.SV_Ptype
1794 out_vec = not (yield self.dec2.no_out_vec)
1795 in_vec = not (yield self.dec2.no_in_vec)
1796 log (" svstate.vl", vl)
1797 log (" svstate.mvl", mvl)
1798 log (" svstate.srcstep", srcstep)
1799 log (" svstate.dststep", dststep)
1800 log (" mode", rm_mode)
1801 log (" reverse", reverse_gear)
1802 log (" out_vec", out_vec)
1803 log (" in_vec", in_vec)
1804 log (" sv_ptype", sv_ptype, sv_ptype == SVPtype.P2.value)
1805 # check if srcstep needs incrementing by one, stop PC advancing
1806 # svp64 loop can end early if the dest is scalar for single-pred
1807 # but for 2-pred both src/dest have to be checked.
1808 # XXX this might not be true! it may just be LD/ST
1809 if sv_ptype == SVPtype.P2.value:
1810 svp64_is_vector = (out_vec or in_vec)
1811 else:
1812 svp64_is_vector = out_vec
1813 # check if this was an sv.bc* and if so did it succeed
1814 if self.is_svp64_mode and insn_name.startswith("sv.bc"):
1815 end_loop = self.namespace['end_loop']
1816 log("branch %s end_loop" % insn_name, end_loop)
1817 if end_loop.value:
1818 self.svp64_reset_loop()
1819 self.update_pc_next()
1820 return False
1821 if svp64_is_vector and srcstep != vl-1 and dststep != vl-1:
1822 self.svstate.srcstep += SelectableInt(1, 7)
1823 self.svstate.dststep += SelectableInt(1, 7)
1824 self.namespace['SVSTATE'] = self.svstate
1825 # not an SVP64 branch, so fix PC (NIA==CIA) for next loop
1826 # (by default, NIA is CIA+4 if v3.0B or CIA+8 if SVP64)
1827 # this way we keep repeating the same instruction (with new steps)
1828 self.pc.NIA.value = self.pc.CIA.value
1829 self.namespace['NIA'] = self.pc.NIA
1830 log("end of sub-pc call", self.namespace['CIA'],
1831 self.namespace['NIA'])
1832 return False # DO NOT allow PC update whilst Sub-PC loop running
1833
1834 # reset loop to zero and update NIA
1835 self.svp64_reset_loop()
1836 self.update_nia()
1837
1838 return True
1839
1840 def update_pc_next(self):
1841 # UPDATE program counter
1842 self.pc.update(self.namespace, self.is_svp64_mode)
1843 self.svstate.spr = self.namespace['SVSTATE']
1844 log("end of call", self.namespace['CIA'],
1845 self.namespace['NIA'],
1846 self.namespace['SVSTATE'])
1847
1848 def svp64_reset_loop(self):
1849 self.svstate.srcstep = 0
1850 self.svstate.dststep = 0
1851 log (" svstate.srcstep loop end (PC to update)")
1852 self.namespace['SVSTATE'] = self.svstate
1853
1854 def update_nia(self):
1855 self.pc.update_nia(self.is_svp64_mode)
1856 self.namespace['NIA'] = self.pc.NIA
1857
1858
1859 def inject():
1860 """Decorator factory.
1861
1862 this decorator will "inject" variables into the function's namespace,
1863 from the *dictionary* in self.namespace. it therefore becomes possible
1864 to make it look like a whole stack of variables which would otherwise
1865 need "self." inserted in front of them (*and* for those variables to be
1866 added to the instance) "appear" in the function.
1867
1868 "self.namespace['SI']" for example becomes accessible as just "SI" but
1869 *only* inside the function, when decorated.
1870 """
1871 def variable_injector(func):
1872 @wraps(func)
1873 def decorator(*args, **kwargs):
1874 try:
1875 func_globals = func.__globals__ # Python 2.6+
1876 except AttributeError:
1877 func_globals = func.func_globals # Earlier versions.
1878
1879 context = args[0].namespace # variables to be injected
1880 saved_values = func_globals.copy() # Shallow copy of dict.
1881 log("globals before", context.keys())
1882 func_globals.update(context)
1883 result = func(*args, **kwargs)
1884 log("globals after", func_globals['CIA'], func_globals['NIA'])
1885 log("args[0]", args[0].namespace['CIA'],
1886 args[0].namespace['NIA'],
1887 args[0].namespace['SVSTATE'])
1888 if 'end_loop' in func_globals:
1889 log("args[0] end_loop", func_globals['end_loop'])
1890 args[0].namespace = func_globals
1891 #exec (func.__code__, func_globals)
1892
1893 # finally:
1894 # func_globals = saved_values # Undo changes.
1895
1896 return result
1897
1898 return decorator
1899
1900 return variable_injector
1901
1902