e5d231894d3f1bd53b33f99147e89fa9985d6dc2
[openpower-isa.git] / src / openpower / decoder / isa / test_caller_svp64_maxloc.py
1 """Implementation of FORTRAN MAXLOC SVP64
2 Copyright (C) 2022,2023 Luke Kenneth Casson Leighton <lkcl@lkcl.net>
3 Licensed under the LGPLv3+
4 Funded by NLnet NGI-ASSURE under EU grant agreement No 957073.
5 * https://nlnet.nl/project/Libre-SOC-OpenPOWER-ISA
6 * https://bugs.libre-soc.org/show_bug.cgi?id=676
7 * https://libre-soc.org/openpower/sv/cookbook/fortran_maxloc/
8 """
9
10 import unittest
11 from copy import deepcopy
12
13 from nmutil.formaltest import FHDLTestCase
14 from openpower.decoder.isa.caller import SVP64State
15 from openpower.decoder.isa.test_caller import run_tst
16 from openpower.decoder.selectable_int import SelectableInt
17 from openpower.simulator.program import Program
18 from openpower.insndb.asm import SVP64Asm
19 from openpower.util import log
20 from openpower.decoder.isa.maxloc import m2
21
22
23
24 def cmpd(x, y):
25 class CRfield:
26 def __repr__(self):
27 return "<lt %d gt %d eq %d>" % (self.lt, self.gt, self.eq)
28 def __int__(self):
29 return (CRf.lt<<3) | (CRf.gt<<2) | (CRf.eq<<1)
30 CRf = CRfield()
31 CRf.lt = x < y
32 CRf.gt = x > y
33 CRf.eq = x == y
34 return CRf
35
36
37 # example sv.minmax/ff=lt 0, 1, *10, 5
38 # see https://bugs.libre-soc.org/show_bug.cgi?id=1183#c3
39 def sv_maxu(gpr, vl, ra, rb, rt):
40 CR0, i = None, 0
41 while i < vl:
42 CR0 = cmpd(gpr[ra+i], gpr[rb])
43 log("sv_maxss test", i, gpr[ra + i], gpr[rb], CR0, int(CR0))
44 gpr[rt] = gpr[ra+i] if CR0.lt else gpr[rb]
45 if not CR0.gt:
46 break
47 i += 1
48 return i, CR0 # new VL
49
50
51 class DDFFirstTestCase(FHDLTestCase):
52
53 def _check_regs(self, sim, expected):
54 for i in range(32):
55 self.assertEqual(sim.gpr(i), SelectableInt(expected[i], 64))
56
57 def test_sv_maxloc_1(self):
58 self.sv_maxloc([0,6,1,2])
59
60 def tst_sv_maxloc_2(self):
61 self.sv_maxloc([3,4,1,5])
62
63 def tst_sv_maxloc_3(self):
64 self.sv_maxloc([2,9,8,0])
65
66 def tst_sv_maxloc_4(self):
67 self.sv_maxloc([2,1,3,0])
68
69 def sv_maxloc(self, ra):
70 """
71 m, nm, i, n = 0, 0, 0, len(a)
72 while (i<n):
73 while (i<n and a[i]<=m) : i += 1
74 while (i<n and a[i] > m): m, nm, i = a[i], i, i+1
75 return nm
76 """
77
78 lst = SVP64Asm([
79 "mtspr 9, 3", # move r3 to CTR
80 "addi 0, 0, 0", # r0=0
81 #"addi 5, 4, 0", # copy m(r4) to r5
82 # VL = MIN(CTR,MAXVL=4)
83 "mtcrf 255,0", # clear CR entirely
84 "setvl 2,0,4,0,1,1", # set MVL=4, VL=MIN(MVL,CTR)
85 # load VL bytes (update r4 addr) but compressed (dw=8)
86 #"addi 6, 0, 0", # initialise r6 to zero
87 #"sv.lbzu/pi/dw=8 *6, 1(4)", # should be /lf here as well
88 # while (i<n and a[i]<=m) : i += 1
89 "sv.minmax./ff=ge/m=ge *5, *10, *4, 1",
90 "sv.mcrf/m=ge *4,*0", # masked-copy CR0-CR3 to CR4-CR7
91 "setvl 2,0,4,0,1,1", # set MVL=4, VL=MIN(MVL,CTR)
92 "sv.addi/mr/m=lt 4, *5, 0", # r4 = last non-masked value
93 "mtcrf 128, 0", # clear CR0
94 "sv.minmax./ff=lt/m=ge 4, *10, 4, 1", # uses r4 as accumulator
95 "sv.svstep/mr 3, 0, 6, 1", # svstep: get vector dststep
96 "sv.addi/m=1<<r3 *10, 4, 0", # put r4 into vector at r10
97 "sv.creqv *16,*16,*16", # set mask on already-tested
98 "bc 12,0, -0x44" # CR0 lt bit clear, branch back
99 #"setvl 3,0,4,0,1,1", # set MVL=4, VL=MIN(MVL,CTR)
100 #"sv.bc/all/m=ge 16, 19, -0x3c", # until r10[i]>r4 (and dec CTR)
101 ])
102 lst = list(lst)
103
104 # SVSTATE
105 svstate = SVP64State()
106 vl = len(ra) # VL is length of array ra
107 svstate.vl = vl # VL
108 svstate.maxvl = vl # MAXVL
109 print("SVSTATE", bin(svstate.asint()))
110
111 gprs = [0] * 32
112 gprs[3] = vl # variable n: to go into CTR
113 gprs[4] = 2 # variable m: max current number found
114 for i, ra in enumerate(ra): # vector in ra starts at r10
115 gprs[10+i] = ra
116 log("maxu ddff", i, gprs[10+i])
117
118 cr_res = [0]*8
119 res = deepcopy(gprs)
120
121 #expected_vl, expected_cr = sv_maxu(res, cr_res, vl, 10, 4, 4)
122 #log("sv_maxu", expected_vl, cr_res)
123
124 with Program(lst, bigendian=False) as program:
125 sim = self.run_tst_program(program, initial_regs=gprs,
126 svstate=svstate)
127 for i in range(vl):
128 val = sim.gpr(i).value
129 res.append(val)
130 cr_res.append(0)
131 log("i", i, val)
132
133 for i in range(vl):
134 crf = sim.crl[i].get_range().value
135 log("crf", i, bin(crf))
136
137 # confirm that the results are as expected
138 return
139
140 for i, v in enumerate(cr_res[:vl]):
141 crf = sim.crl[i].get_range().value
142 log("crf", i, res[i], bin(crf), bin(int(v)))
143 self.assertEqual(crf, int(v))
144
145 for i, v in enumerate(res):
146 self.assertEqual(v, res[i])
147
148 #self.assertEqual(sim.svstate.vl, expected_vl)
149 #self.assertEqual(sim.svstate.maxvl, 4)
150 #self.assertEqual(sim.svstate.srcstep, 0)
151 #self.assertEqual(sim.svstate.dststep, 0)
152
153 def run_tst_program(self, prog, initial_regs=None,
154 svstate=None,
155 initial_mem=None,
156 initial_fprs=None):
157 if initial_regs is None:
158 initial_regs = [0] * 32
159 simulator = run_tst(prog, initial_regs, mem=initial_mem,
160 initial_fprs=initial_fprs,
161 svstate=svstate)
162
163 print("GPRs")
164 simulator.gpr.dump()
165 print("FPRs")
166 simulator.fpr.dump()
167
168 return simulator
169
170
171 if __name__ == "__main__":
172 unittest.main()