61a4074bca43c043853be311282c4a80a2d49d67
[openpower-isa.git] / src / openpower / decoder / isa / test_caller_svp64_maxloc.py
1 """Implementation of FORTRAN MAXLOC SVP64
2 Copyright (C) 2022,2023 Luke Kenneth Casson Leighton <lkcl@lkcl.net>
3 Licensed under the LGPLv3+
4 Funded by NLnet NGI-ASSURE under EU grant agreement No 957073.
5 * https://nlnet.nl/project/Libre-SOC-OpenPOWER-ISA
6 * https://bugs.libre-soc.org/show_bug.cgi?id=676
7 * https://libre-soc.org/openpower/sv/cookbook/fortran_maxloc/
8 """
9
10 import unittest
11 from copy import deepcopy
12
13 from nmutil.formaltest import FHDLTestCase
14 from openpower.decoder.isa.caller import SVP64State
15 from openpower.decoder.isa.test_caller import run_tst
16 from openpower.decoder.selectable_int import SelectableInt
17 from openpower.simulator.program import Program
18 from openpower.insndb.asm import SVP64Asm
19 from openpower.util import log
20 from openpower.decoder.isa.maxloc import m2
21
22
23
def cmpd(x, y):
    """Compare *x* with *y* and return the outcome as a CR-field-like object.

    The returned object carries three attributes:

    * ``lt`` -- result of ``x < y``
    * ``gt`` -- result of ``x > y``
    * ``eq`` -- result of ``x == y``

    ``int()`` of the object packs them as ``lt<<3 | gt<<2 | eq<<1`` (bit 0
    is never set) and ``repr()`` renders them as ``<lt N gt N eq N>``.
    """
    class CRfield:
        def __repr__(self):
            return "<lt %d gt %d eq %d>" % (self.lt, self.gt, self.eq)

        def __int__(self):
            # Read the flags from self rather than from the enclosing
            # function's local variable, so the conversion is correct for
            # whichever instance it is called on.
            return (self.lt << 3) | (self.gt << 2) | (self.eq << 1)

    CRf = CRfield()
    CRf.lt = x < y
    CRf.gt = x > y
    CRf.eq = x == y
    return CRf
35
36
37 # example sv.minmax/ff=lt 0, 1, *10, 5
38 # see https://bugs.libre-soc.org/show_bug.cgi?id=1183#c3
def sv_maxu(gpr, vl, ra, rb, rt):
    """Python model of a fail-first compare-and-select over a register vector.

    Walks the elements ``gpr[ra]``, ``gpr[ra+1]``, ... for at most *vl*
    steps.  Each element is compared against ``gpr[rb]`` with ``cmpd`` and
    ``gpr[rt]`` is overwritten with the element when it is less than
    ``gpr[rb]``, otherwise with ``gpr[rb]``.  The walk stops at the first
    element that is not greater than ``gpr[rb]``.

    Returns a ``(step, flags)`` tuple: *step* is the index at which the walk
    stopped (the truncated vector length) and *flags* is the last comparison
    result, or ``None`` when no comparison was made.
    """
    # NOTE(review): the selection below stores the smaller of the two
    # operands although the function is named "maxu" -- confirm intended.
    step = 0
    flags = None
    while step < vl:
        element = gpr[ra + step]
        reference = gpr[rb]
        flags = cmpd(element, reference)
        log("sv_maxss test", step, element, reference, flags, int(flags))
        if flags.lt:
            gpr[rt] = element
        else:
            gpr[rt] = reference
        if not flags.gt:
            # fail-first: this element ends the walk without being counted
            break
        step += 1
    return step, flags  # step is the new VL
49
50
class DDFFirstTestCase(FHDLTestCase):
    """Simulator test cases for the SVP64 MAXLOC assembly listing.

    Only ``test_sv_maxloc_1`` carries the ``test`` prefix that unittest's
    default loader looks for; the ``tst_``-prefixed cases are therefore
    not collected automatically.
    """

    def _check_regs(self, sim, expected):
        """Assert that GPRs 0-31 of *sim* equal *expected* as 64-bit values."""
        for regnum in range(32):
            actual = sim.gpr(regnum)
            wanted = SelectableInt(expected[regnum], 64)
            self.assertEqual(actual, wanted)

    def test_sv_maxloc_1(self):
        """Run the listing on a vector with a repeated maximum."""
        self.sv_maxloc([1,3,3,3])

    def tst_sv_maxloc_2(self):
        """Disabled case: maximum in the last element."""
        self.sv_maxloc([3,4,1,5])

    def tst_sv_maxloc_3(self):
        """Disabled case: maximum in the second element."""
        self.sv_maxloc([2,9,8,0])

    def tst_sv_maxloc_4(self):
        """Disabled case: maximum in the third element."""
        self.sv_maxloc([2,1,3,0])

    def sv_maxloc(self, ra):
        """Run the MAXLOC listing over the vector *ra* and log the outcome.

        *ra* is a list of integers; its elements are placed in r10 onwards,
        its length goes into r3 and is used for both VL and MAXVL, and r4
        is preset to 2.  After the program has run, the first ``len(ra)``
        GPRs and CR fields are logged.  The method then returns before any
        assertion is made.

        Reference algorithm that the listing is modelled on:

            m, nm, i, n = 0, 0, 0, len(a)
            while (i<n):
                while (i<n and a[i]<=m) : i += 1
                while (i<n and a[i] > m): m, nm, i = a[i], i, i+1
            return nm
        """
        insns = list(SVP64Asm([
            "mtspr 9, 3", # move r3 to CTR
            "addi 0, 0, 0", # r0=0
            #"addi 5, 4, 0", # copy m(r4) to r5
            # VL = MIN(CTR,MAXVL=4)
            "mtcrf 255,0", # clear CR entirely
            "setvl 2,0,4,0,1,1", # set MVL=4, VL=MIN(MVL,CTR)
            # load VL bytes (update r4 addr) but compressed (dw=8)
            #"addi 6, 0, 0", # initialise r6 to zero
            #"sv.lbzu/pi/dw=8 *6, 1(4)", # should be /lf here as well
            # while (i<n and a[i]<=m) : i += 1
            "sv.cmp/ff=gt/m=ge *0,0,*10,4", # truncates VL to min
            "sv.creqv *16,*16,*16", # set mask on already-tested
            "setvl 2,0,4,0,1,1", # set MVL=4, VL=MIN(MVL,CTR)
            #"sv.addi/mr/sm=ge/dm=ns 4, *4, 0", # r4 = last non-masked value
            "mtcrf 128, 0", # clear CR0 (in case VL=0?)
            "sv.minmax./ff=le/m=ge 4, *10, 4, 1", # uses r4 as accumulator
            "cror 0,1,0", # test for greater or equal, or VL=0
            "cror 0,2,0", # test for greater or equal, or VL=0
            "sv.creqv *19,*16,*16", # set mask on already-tested
            "sv.crand *19,*19,0", # clear if CR0=0
            "sv.svstep/mr/m=so 1, 0, 6, 1", # svstep: get vector dststep
            "sv.creqv *16,*16,*16", # set mask on already-tested
            #"sv.addi/dm=1<<r3 *5, 4, 0", # put r4 into vector at r5
            "bc 12,0, -0x4c", # CR0 lt bit clear, branch back
            #"setvl 3,0,4,0,1,1", # set MVL=4, VL=MIN(MVL,CTR)
            #"sv.bc/m=ge 16, 19, -0x3c", # until r10[i]>r4 (and dec CTR)
        ]))

        # SVSTATE: both VL and MAXVL are the length of the input vector
        vl = len(ra)
        svstate = SVP64State()
        svstate.vl = vl
        svstate.maxvl = vl
        print("SVSTATE", bin(svstate.asint()))

        # initial register file
        gprs = [0] * 32
        gprs[3] = vl  # variable n: to go into CTR
        gprs[4] = 2   # variable m: max current number found
        for idx, element in enumerate(ra):  # vector starts at r10
            gprs[10 + idx] = element
            log("maxu ddff", idx, gprs[10 + idx])

        cr_res = [0] * 8
        res = deepcopy(gprs)

        #expected_vl, expected_cr = sv_maxu(res, cr_res, vl, 10, 4, 4)
        #log("sv_maxu", expected_vl, cr_res)

        with Program(insns, bigendian=False) as program:
            sim = self.run_tst_program(program, initial_regs=gprs,
                                       svstate=svstate)

            # record and log the first vl GPRs
            for idx in range(vl):
                regval = sim.gpr(idx).value
                res.append(regval)
                cr_res.append(0)
                log("i", idx, regval)

            # log the first vl CR fields
            for idx in range(vl):
                crfield = sim.crl[idx].get_range().value
                log("crf", idx, bin(crfield))

            # confirm that the results are as expected
            return

            # Everything below is unreachable because of the return above.
            for idx, want in enumerate(cr_res[:vl]):
                crfield = sim.crl[idx].get_range().value
                log("crf", idx, res[idx], bin(crfield), bin(int(want)))
                self.assertEqual(crfield, int(want))

            # NOTE(review): this compares each element of res with itself
            for idx, want in enumerate(res):
                self.assertEqual(want, res[idx])

            #self.assertEqual(sim.svstate.vl, expected_vl)
            #self.assertEqual(sim.svstate.maxvl, 4)
            #self.assertEqual(sim.svstate.srcstep, 0)
            #self.assertEqual(sim.svstate.dststep, 0)

    def run_tst_program(self, prog, initial_regs=None,
                        svstate=None,
                        initial_mem=None,
                        initial_fprs=None):
        """Run *prog* through ``run_tst`` and return the resulting simulator.

        *initial_regs* defaults to 32 zeroed registers.  *svstate*,
        *initial_mem* and *initial_fprs* are handed to ``run_tst``
        unchanged.  The GPR and FPR files are dumped after the run.
        """
        regs = [0] * 32 if initial_regs is None else initial_regs
        simulator = run_tst(prog, regs,
                            mem=initial_mem,
                            initial_fprs=initial_fprs,
                            svstate=svstate)

        for title, regfile in (("GPRs", simulator.gpr),
                               ("FPRs", simulator.fpr)):
            print(title)
            regfile.dump()

        return simulator
173
174
# Run this module's test cases through unittest when executed as a script.
if __name__ == "__main__":
    unittest.main()