add priv and mode to RADIXMMU
[soc.git] / src / soc / decoder / isa / radixmmu.py
1 # SPDX-License-Identifier: LGPLv3+
2 # Copyright (C) 2020, 2021 Luke Kenneth Casson Leighton <lkcl@lkcl.net>
3 # Copyright (C) 2021 Tobias Platen
4 # Funded by NLnet http://nlnet.nl
5 """core of the python-based POWER9 simulator
6
7 this is part of a cycle-accurate POWER9 simulator. its primary purpose is
8 not speed, it is for both learning and educational purposes, as well as
9 a method of verifying the HDL.
10
11 related bugs:
12
13 * https://bugs.libre-soc.org/show_bug.cgi?id=604
14 """
15
16 from nmigen.back.pysim import Settle
17 from copy import copy
18 from soc.decoder.selectable_int import (FieldSelectableInt, SelectableInt,
19 selectconcat)
20 from soc.decoder.helpers import exts, gtu, ltu, undefined
21 from soc.decoder.isa.mem import Mem
22
23 import math
24 import sys
25
26 # very quick, TODO move to SelectableInt utils later
27 def genmask(shift, size):
28 res = SelectableInt(0, size)
29 for i in range(size):
30 if i < shift:
31 res[size-1-i] = SelectableInt(1, 1)
32 return res
33
34 # NOTE: POWER 3.0B annotation order! see p4 1.3.2
35 # MSB is indexed **LOWEST** (sigh)
36 # from gem5 radixwalk.hh
37 # Bitfield<63> valid; 64 - (63 + 1) = 0
38 # Bitfield<62> leaf; 64 - (62 + 1) = 1
39
40 def rpte_valid(r):
41 return bool(r[0])
42
43 def rpte_leaf(r):
44 return bool(r[1])
45
46 def NLB(x):
47 """
48 Next Level Base
49 right shifted by 8
50 """
51 return x[4:55]
52
53 def NLS(x):
54 """
55 Next Level Size
56 NLS >= 5
57 """
58 return x[59:63]
59
60 """
61 Get Root Page
62
63 //Accessing 2nd double word of partition table (pate1)
64 //Ref: Power ISA Manual v3.0B, Book-III, section 5.7.6.1
65 // PTCR Layout
66 // ====================================================
67 // -----------------------------------------------
68 // | /// | PATB | /// | PATS |
69 // -----------------------------------------------
70 // 0 4 51 52 58 59 63
71 // PATB[4:51] holds the base address of the Partition Table,
72 // right shifted by 12 bits.
73 // This is because the address of the Partition base is
74 // 4k aligned. Hence, the lower 12bits, which are always
75 // 0 are ommitted from the PTCR.
76 //
77 // Thus, The Partition Table Base is obtained by (PATB << 12)
78 //
79 // PATS represents the partition table size right-shifted by 12 bits.
80 // The minimal size of the partition table is 4k.
81 // Thus partition table size = (1 << PATS + 12).
82 //
83 // Partition Table
84 // ====================================================
85 // 0 PATE0 63 PATE1 127
86 // |----------------------|----------------------|
87 // | | |
88 // |----------------------|----------------------|
89 // | | |
90 // |----------------------|----------------------|
91 // | | | <-- effLPID
92 // |----------------------|----------------------|
93 // .
94 // .
95 // .
96 // |----------------------|----------------------|
97 // | | |
98 // |----------------------|----------------------|
99 //
100 // The effective LPID forms the index into the Partition Table.
101 //
102 // Each entry in the partition table contains 2 double words, PATE0, PATE1,
103 // corresponding to that partition.
104 //
105 // In case of Radix, The structure of PATE0 and PATE1 is as follows.
106 //
107 // PATE0 Layout
108 // -----------------------------------------------
109 // |1|RTS1|/| RPDB | RTS2 | RPDS |
110 // -----------------------------------------------
111 // 0 1 2 3 4 55 56 58 59 63
112 //
113 // HR[0] : For Radix Page table, first bit should be 1.
114 // RTS1[1:2] : Gives one fragment of the Radix treesize
115 // RTS2[56:58] : Gives the second fragment of the Radix Tree size.
116 // RTS = (RTS1 << 3 + RTS2) + 31.
117 //
118 // RPDB[4:55] = Root Page Directory Base.
119 // RPDS = Logarithm of Root Page Directory Size right shifted by 3.
120 // Thus, Root page directory size = 1 << (RPDS + 3).
121 // Note: RPDS >= 5.
122 //
123 // PATE1 Layout
124 // -----------------------------------------------
125 // |///| PRTB | // | PRTS |
126 // -----------------------------------------------
127 // 0 3 4 51 52 58 59 63
128 //
129 // PRTB[4:51] = Process Table Base. This is aligned to size.
130 // PRTS[59: 63] = Process Table Size right shifted by 12.
131 // Minimal size of the process table is 4k.
132 // Process Table Size = (1 << PRTS + 12).
133 // Note: PRTS <= 24.
134 //
135 // Computing the size aligned Process Table Base:
136 // table_base = (PRTB & ~((1 << PRTS) - 1)) << 12
137 // Thus, the lower 12+PRTS bits of table_base will
138 // be zero.
139
140
141 //Ref: Power ISA Manual v3.0B, Book-III, section 5.7.6.2
142 //
143 // Process Table
144 // ==========================
145 // 0 PRTE0 63 PRTE1 127
146 // |----------------------|----------------------|
147 // | | |
148 // |----------------------|----------------------|
149 // | | |
150 // |----------------------|----------------------|
151 // | | | <-- effPID
152 // |----------------------|----------------------|
153 // .
154 // .
155 // .
156 // |----------------------|----------------------|
157 // | | |
158 // |----------------------|----------------------|
159 //
160 // The effective Process id (PID) forms the index into the Process Table.
161 //
162 // Each entry in the partition table contains 2 double words, PRTE0, PRTE1,
163 // corresponding to that process
164 //
165 // In case of Radix, The structure of PRTE0 and PRTE1 is as follows.
166 //
167 // PRTE0 Layout
168 // -----------------------------------------------
169 // |/|RTS1|/| RPDB | RTS2 | RPDS |
170 // -----------------------------------------------
171 // 0 1 2 3 4 55 56 58 59 63
172 //
173 // RTS1[1:2] : Gives one fragment of the Radix treesize
174 // RTS2[56:58] : Gives the second fragment of the Radix Tree size.
175 // RTS = (RTS1 << 3 + RTS2) << 31,
176 // since minimal Radix Tree size is 4G.
177 //
178 // RPDB = Root Page Directory Base.
179 // RPDS = Root Page Directory Size right shifted by 3.
180 // Thus, Root page directory size = RPDS << 3.
181 // Note: RPDS >= 5.
182 //
183 // PRTE1 Layout
184 // -----------------------------------------------
185 // | /// |
186 // -----------------------------------------------
187 // 0 63
188 // All bits are reserved.
189
190
191 """
192
193 # see qemu/target/ppc/mmu-radix64.c for reference
194 class RADIX:
195 def __init__(self, mem, caller):
196 self.mem = mem
197 self.caller = caller
198 #TODO move to lookup
199 self.dsisr = self.caller.spr["DSISR"]
200 self.dar = self.caller.spr["DAR"]
201 self.pidr = self.caller.spr["PIDR"]
202 self.prtbl = self.caller.spr["PRTBL"]
203
204 # cached page table stuff
205 self.pgtbl0 = 0
206 self.pt0_valid = False
207 self.pgtbl3 = 0
208 self.pt3_valid = False
209
210 def __call__(self, addr, sz):
211 val = self.ld(addr.value, sz, swap=False)
212 print("RADIX memread", addr, sz, val)
213 return SelectableInt(val, sz*8)
214
215 def ld(self, address, width=8, swap=True, check_in_mem=False,
216 instr_fetch=False):
217 print("RADIX: ld from addr 0x%x width %d" % (address, width))
218
219 priv = 1 # XXX TODO: read MSR PR bit here priv = not ctrl.msr(MSR_PR);
220 if instr_fetch:
221 mode = 'EXECUTE'
222 else:
223 mode = 'LOAD'
224 addr = SelectableInt(address, 64)
225 (shift, mbits, pgbase) = self._decode_prte(addr)
226 #shift = SelectableInt(0, 32)
227
228 pte = self._walk_tree(addr, pgbase, mode, mbits, shift, priv)
229 # use pte to caclculate phys address
230 return self.mem.ld(address, width, swap, check_in_mem)
231
232 # XXX set SPRs on error
233
234 # TODO implement
235 def st(self, address, v, width=8, swap=True):
236 print("RADIX: st to addr 0x%x width %d data %x" % (address, width, v))
237
238 priv = 1 # XXX TODO: read MSR PR bit here priv = not ctrl.msr(MSR_PR);
239 mode = 'STORE'
240 addr = SelectableInt(address, 64)
241 (shift, mbits, pgbase) = self._decode_prte(addr)
242 pte = self._walk_tree(addr, pgbase, mode, mbits, shift, priv)
243
244 # use pte to caclculate phys address (addr)
245 return self.mem.st(addr.value, v, width, swap)
246
247 # XXX set SPRs on error
248
249 def memassign(self, addr, sz, val):
250 print("memassign", addr, sz, val)
251 self.st(addr.value, val.value, sz, swap=False)
252
253 def _next_level(self,r):
254 return rpte_valid(r), rpte_leaf(r)
255 ## DSISR_R_BADCONFIG
256 ## read_entry
257 ## DSISR_NOPTE
258 ## Prepare for next iteration
259
260 def _walk_tree(self, addr, pgbase, mode, mbits, shift, priv=1):
261 """walk tree
262
263 // vaddr 64 Bit
264 // vaddr |-----------------------------------------------------|
265 // | Unused | Used |
266 // |-----------|-----------------------------------------|
267 // | 0000000 | usefulBits = X bits (typically 52) |
268 // |-----------|-----------------------------------------|
269 // | |<--Cursize---->| |
270 // | | Index | |
271 // | | into Page | |
272 // | | Directory | |
273 // |-----------------------------------------------------|
274 // | |
275 // V |
276 // PDE |---------------------------| |
277 // |V|L|//| NLB |///|NLS| |
278 // |---------------------------| |
279 // PDE = Page Directory Entry |
280 // [0] = V = Valid Bit |
281 // [1] = L = Leaf bit. If 0, then |
282 // [4:55] = NLB = Next Level Base |
283 // right shifted by 8 |
284 // [59:63] = NLS = Next Level Size |
285 // | NLS >= 5 |
286 // | V
287 // | |--------------------------|
288 // | | usfulBits = X-Cursize |
289 // | |--------------------------|
290 // |---------------------><--NLS-->| |
291 // | Index | |
292 // | into | |
293 // | PDE | |
294 // |--------------------------|
295 // |
296 // If the next PDE obtained by |
297 // (NLB << 8 + 8 * index) is a |
298 // nonleaf, then repeat the above. |
299 // |
300 // If the next PDE is a leaf, |
301 // then Leaf PDE structure is as |
302 // follows |
303 // |
304 // |
305 // Leaf PDE |
306 // |------------------------------| |----------------|
307 // |V|L|sw|//|RPN|sw|R|C|/|ATT|EAA| | usefulBits |
308 // |------------------------------| |----------------|
309 // [0] = V = Valid Bit |
310 // [1] = L = Leaf Bit = 1 if leaf |
311 // PDE |
312 // [2] = Sw = Sw bit 0. |
313 // [7:51] = RPN = Real Page Number, V
314 // real_page = RPN << 12 -------------> Logical OR
315 // [52:54] = Sw Bits 1:3 |
316 // [55] = R = Reference |
317 // [56] = C = Change V
318 // [58:59] = Att = Physical Address
319 // 0b00 = Normal Memory
320 // 0b01 = SAO
321 // 0b10 = Non Idenmpotent
322 // 0b11 = Tolerant I/O
323 // [60:63] = Encoded Access
324 // Authority
325 //
326 """
327 # get sprs
328 print("_walk_tree")
329 pidr = self.caller.spr["PIDR"]
330 prtbl = self.caller.spr["PRTBL"]
331 print(pidr)
332 print(prtbl)
333 p = addr[55:63]
334 print("last 8 bits ----------")
335 print
336
337 # get address of root entry
338 prtable_addr = self._get_prtable_addr(shift, prtbl, addr, pidr)
339 print("prtable_addr",prtable_addr)
340
341 # read root entry - imcomplete
342 swap = False
343 check_in_mem = False
344 entry_width = 8
345 value = self.mem.ld(prtable_addr.value, entry_width, swap, check_in_mem)
346 print("value",value)
347
348 test_input = [
349 SelectableInt(0x8000000000000007, 64), #valid
350 SelectableInt(0xc000000000000000, 64) #exit
351 ]
352 index = 0
353
354 # walk tree starts on prtbl
355 while True:
356 print("nextlevel----------------------------")
357 l = test_input[index]
358 index += 1
359 valid,leaf = self._next_level(l)
360 if leaf:
361 data = SelectableInt(value, 64) # convert to SelectableInt
362 ok = self._check_perms(data, priv, mode)
363 else:
364 mbits = l[59:64]
365 print("mbits=")
366 print(mbits)
367 if mbits < 5 or mbits > 16:
368 print("badtree")
369 return None
370 """
371 mbits := unsigned('0' & data(4 downto 0));
372 if mbits < 5 or mbits > 16 or mbits > r.shift then
373 v.state := RADIX_FINISH;
374 v.badtree := '1'; -- throw error
375 else
376 v.shift := v.shift - mbits;
377 v.mask_size := mbits(4 downto 0);
378 v.pgbase := data(55 downto 8) & x"00"; NLB?
379 v.state := RADIX_LOOKUP; --> next level
380 end if;
381 """
382 print(valid)
383 print(leaf)
384 if not valid: return None
385 if leaf: return None
386
387 def _decode_prte(self, data):
388 """PRTE0 Layout
389 -----------------------------------------------
390 |/|RTS1|/| RPDB | RTS2 | RPDS |
391 -----------------------------------------------
392 0 1 2 3 4 55 56 58 59 63
393 """
394 # note that SelectableInt does big-endian! so the indices
395 # below *directly* match the spec, unlike microwatt which
396 # has to turn them around (to LE)
397 zero = SelectableInt(0, 1)
398 rts = selectconcat(zero,
399 data[56:59], # RTS2
400 data[1:3], # RTS1
401 )
402 masksize = data[59:64] # RPDS
403 mbits = selectconcat(zero, masksize)
404 pgbase = selectconcat(data[8:56], # part of RPDB
405 SelectableInt(0, 16),)
406
407 return (rts, mbits, pgbase)
408
409 def _segment_check(self, addr, mbits, shift):
410 """checks segment valid
411 mbits := '0' & r.mask_size;
412 v.shift := r.shift + (31 - 12) - mbits;
413 nonzero := or(r.addr(61 downto 31) and not finalmask(30 downto 0));
414 if r.addr(63) /= r.addr(62) or nonzero = '1' then
415 v.state := RADIX_FINISH;
416 v.segerror := '1';
417 elsif mbits < 5 or mbits > 16 or mbits > (r.shift + (31 - 12)) then
418 v.state := RADIX_FINISH;
419 v.badtree := '1';
420 else
421 v.state := RADIX_LOOKUP;
422 """
423 # note that SelectableInt does big-endian! so the indices
424 # below *directly* match the spec, unlike microwatt which
425 # has to turn them around (to LE)
426 mask = genmask(shift, 44)
427 nonzero = addr[1:32] & mask[13:44] # mask 31 LSBs (BE numbered 13:44)
428 print ("RADIX _segment_check nonzero", bin(nonzero.value))
429 print ("RADIX _segment_check addr[0-1]", addr[0].value, addr[1].value)
430 if addr[0] != addr[1] or nonzero == 1:
431 return "segerror"
432 limit = shift + (31 - 12)
433 if mbits < 5 or mbits > 16 or mbits > limit:
434 return "badtree"
435 new_shift = shift + (31 - 12) - mbits
436 return new_shift
437
438 def _check_perms(self, data, priv, mode):
439 """check page permissions
440 // Leaf PDE |
441 // |------------------------------| |----------------|
442 // |V|L|sw|//|RPN|sw|R|C|/|ATT|EAA| | usefulBits |
443 // |------------------------------| |----------------|
444 // [0] = V = Valid Bit |
445 // [1] = L = Leaf Bit = 1 if leaf |
446 // PDE |
447 // [2] = Sw = Sw bit 0. |
448 // [7:51] = RPN = Real Page Number, V
449 // real_page = RPN << 12 -------------> Logical OR
450 // [52:54] = Sw Bits 1:3 |
451 // [55] = R = Reference |
452 // [56] = C = Change V
453 // [58:59] = Att = Physical Address
454 // 0b00 = Normal Memory
455 // 0b01 = SAO
456 // 0b10 = Non Idenmpotent
457 // 0b11 = Tolerant I/O
458 // [60:63] = Encoded Access
459 // Authority
460 //
461 -- test leaf bit
462 -- check permissions and RC bits
463 perm_ok := '0';
464 if r.priv = '1' or data(3) = '0' then
465 if r.iside = '0' then
466 perm_ok := data(1) or (data(2) and not r.store);
467 else
468 -- no IAMR, so no KUEP support for now
469 -- deny execute permission if cache inhibited
470 perm_ok := data(0) and not data(5);
471 end if;
472 end if;
473 rc_ok := data(8) and (data(7) or not r.store);
474 if perm_ok = '1' and rc_ok = '1' then
475 v.state := RADIX_LOAD_TLB;
476 else
477 v.state := RADIX_FINISH;
478 v.perm_err := not perm_ok;
479 -- permission error takes precedence over RC error
480 v.rc_error := perm_ok;
481 end if;
482 """
483 # decode mode into something that matches microwatt equivalent code
484 instr_fetch, store = 0, 0
485 if mode == 'STORE':
486 store = 1
487 if mode == 'EXECUTE':
488 inst_fetch = 1
489
490 # check permissions and RC bits
491 perm_ok = 0
492 if priv == 1 or data[60] == 0:
493 if instr_fetch == 0:
494 perm_ok = data[62] | (data[61] & (store == 0))
495 # no IAMR, so no KUEP support for now
496 # deny execute permission if cache inhibited
497 perm_ok = data[63] & ~data[58]
498 rc_ok = data[55] & (data[56] | (store == 0))
499 if perm_ok == 1 and rc_ok == 1:
500 return True
501
502 return "perm_err" if perm_ok == 0 else "rc_err"
503
504 def _get_prtable_addr(self, shift, prtbl, addr, pid):
505 """
506 if r.addr(63) = '1' then
507 effpid := x"00000000";
508 else
509 effpid := r.pid;
510 end if;
511 x"00" & r.prtbl(55 downto 36) &
512 ((r.prtbl(35 downto 12) and not finalmask(23 downto 0)) or
513 (effpid(31 downto 8) and finalmask(23 downto 0))) &
514 effpid(7 downto 0) & "0000";
515 """
516 print ("_get_prtable_addr_", shift, prtbl, addr, pid)
517 finalmask = genmask(shift, 44)
518 finalmask24 = finalmask[20:44]
519 if addr[0].value == 1:
520 effpid = SelectableInt(0, 32)
521 else:
522 effpid = pid #self.pid # TODO, check on this
523 zero16 = SelectableInt(0, 16)
524 zero4 = SelectableInt(0, 4)
525 res = selectconcat(zero16,
526 prtbl[8:28], #
527 (prtbl[28:52] & ~finalmask24) | #
528 (effpid[0:24] & finalmask24), #
529 effpid[24:32],
530 zero4
531 )
532 return res
533
534 def _get_pgtable_addr(self, mask_size, pgbase, addrsh):
535 """
536 x"00" & r.pgbase(55 downto 19) &
537 ((r.pgbase(18 downto 3) and not mask) or (addrsh and mask)) &
538 "000";
539 """
540 mask16 = genmask(mask_size+5, 16)
541 zero8 = SelectableInt(0, 8)
542 zero3 = SelectableInt(0, 3)
543 res = selectconcat(zero8,
544 pgbase[8:45], #
545 (prtbl[45:61] & ~mask16) | #
546 (addrsh & mask16), #
547 zero3
548 )
549 return res
550
551 def _get_pte(self, shift, addr, pde):
552 """
553 x"00" &
554 ((r.pde(55 downto 12) and not finalmask) or
555 (r.addr(55 downto 12) and finalmask))
556 & r.pde(11 downto 0);
557 """
558 finalmask = genmask(shift, 44)
559 zero8 = SelectableInt(0, 8)
560 res = selectconcat(zero8,
561 (pde[8:52] & ~finalmask) | #
562 (addr[8:52] & finalmask), #
563 pde[52:64],
564 )
565 return res
566
567
568 # very quick test of maskgen function (TODO, move to util later)
569 if __name__ == '__main__':
570 # set up dummy minimal ISACaller
571 spr = {'DSISR': SelectableInt(0, 64),
572 'DAR': SelectableInt(0, 64),
573 'PIDR': SelectableInt(0, 64),
574 'PRTBL': SelectableInt(0, 64)
575 }
576 class ISACaller: pass
577 caller = ISACaller()
578 caller.spr = spr
579
580 shift = SelectableInt(5, 6)
581 mask = genmask(shift, 43)
582 print (" mask", bin(mask.value))
583
584 mem = Mem(row_bytes=8)
585 mem = RADIX(mem, caller)
586 # -----------------------------------------------
587 # |/|RTS1|/| RPDB | RTS2 | RPDS |
588 # -----------------------------------------------
589 # |0|1 2|3|4 55|56 58|59 63|
590 data = SelectableInt(0, 64)
591 data[1:3] = 0b01
592 data[56:59] = 0b11
593 data[59:64] = 0b01101 # mask
594 data[55] = 1
595 (rts, mbits, pgbase) = mem._decode_prte(data)
596 print (" rts", bin(rts.value), rts.bits)
597 print (" mbits", bin(mbits.value), mbits.bits)
598 print (" pgbase", hex(pgbase.value), pgbase.bits)
599 addr = SelectableInt(0x1000, 64)
600 check = mem._segment_check(addr, mbits, shift)
601 print (" segment check", check)
602
603 print("walking tree")
604 # addr = unchanged
605 # pgbase = None
606 mode = None
607 #mbits = None
608 shift = rts
609 result = mem._walk_tree(addr, pgbase, mode, mbits, shift)
610 print(result)