fa03fa125b2d927fa30f03af1fa489b211322175
1 # SPDX-License-Identifier: LGPLv3+
2 # Copyright (C) 2020, 2021 Luke Kenneth Casson Leighton <lkcl@lkcl.net>
3 # Copyright (C) 2021 Tobias Platen
4 # Funded by NLnet http://nlnet.nl
5 """core of the python-based POWER9 simulator
7 this is part of a cycle-accurate POWER9 simulator. its primary purpose is
8 not speed, it is for both learning and educational purposes, as well as
9 a method of verifying the HDL.
13 * https://bugs.libre-soc.org/show_bug.cgi?id=604
16 from nmigen
.back
.pysim
import Settle
18 from soc
.decoder
.selectable_int
import (FieldSelectableInt
, SelectableInt
,
20 from soc
.decoder
.helpers
import exts
, gtu
, ltu
, undefined
21 from soc
.decoder
.isa
.mem
import Mem
26 # very quick, TODO move to SelectableInt utils later
27 def genmask(shift
, size
):
28 res
= SelectableInt(0, size
)
31 res
[size
-1-i
] = SelectableInt(1, 1)
34 # NOTE: POWER 3.0B annotation order! see p4 1.3.2
35 # MSB is indexed **LOWEST** (sigh)
36 # from gem5 radixwalk.hh
37 # Bitfield<63> valid; 64 - (63 + 1) = 0
38 # Bitfield<62> leaf; 64 - (62 + 1) = 1
63 //Accessing 2nd double word of partition table (pate1)
64 //Ref: Power ISA Manual v3.0B, Book-III, section 5.7.6.1
66 // ====================================================
67 // -----------------------------------------------
68 // | /// | PATB | /// | PATS |
69 // -----------------------------------------------
71 // PATB[4:51] holds the base address of the Partition Table,
72 // right shifted by 12 bits.
73 // This is because the address of the Partition base is
74 // 4k aligned. Hence, the lower 12bits, which are always
75 // 0 are omitted from the PTCR.
77 // Thus, The Partition Table Base is obtained by (PATB << 12)
79 // PATS represents the partition table size right-shifted by 12 bits.
80 // The minimal size of the partition table is 4k.
81 // Thus partition table size = (1 << PATS + 12).
84 // ====================================================
85 // 0 PATE0 63 PATE1 127
86 // |----------------------|----------------------|
88 // |----------------------|----------------------|
90 // |----------------------|----------------------|
92 // |----------------------|----------------------|
96 // |----------------------|----------------------|
98 // |----------------------|----------------------|
100 // The effective LPID forms the index into the Partition Table.
102 // Each entry in the partition table contains 2 double words, PATE0, PATE1,
103 // corresponding to that partition.
105 // In case of Radix, The structure of PATE0 and PATE1 is as follows.
108 // -----------------------------------------------
109 // |1|RTS1|/| RPDB | RTS2 | RPDS |
110 // -----------------------------------------------
111 // 0 1 2 3 4 55 56 58 59 63
113 // HR[0] : For Radix Page table, first bit should be 1.
114 // RTS1[1:2] : Gives one fragment of the Radix treesize
115 // RTS2[56:58] : Gives the second fragment of the Radix Tree size.
116 // RTS = (RTS1 << 3 + RTS2) + 31.
118 // RPDB[4:55] = Root Page Directory Base.
119 // RPDS = Logarithm of Root Page Directory Size right shifted by 3.
120 // Thus, Root page directory size = 1 << (RPDS + 3).
124 // -----------------------------------------------
125 // |///| PRTB | // | PRTS |
126 // -----------------------------------------------
127 // 0 3 4 51 52 58 59 63
129 // PRTB[4:51] = Process Table Base. This is aligned to size.
130 // PRTS[59: 63] = Process Table Size right shifted by 12.
131 // Minimal size of the process table is 4k.
132 // Process Table Size = (1 << PRTS + 12).
135 // Computing the size aligned Process Table Base:
136 // table_base = (PRTB & ~((1 << PRTS) - 1)) << 12
137 // Thus, the lower 12+PRTS bits of table_base will
141 //Ref: Power ISA Manual v3.0B, Book-III, section 5.7.6.2
144 // ==========================
145 // 0 PRTE0 63 PRTE1 127
146 // |----------------------|----------------------|
148 // |----------------------|----------------------|
150 // |----------------------|----------------------|
152 // |----------------------|----------------------|
156 // |----------------------|----------------------|
158 // |----------------------|----------------------|
160 // The effective Process id (PID) forms the index into the Process Table.
162 // Each entry in the process table contains 2 double words, PRTE0, PRTE1,
163 // corresponding to that process
165 // In case of Radix, The structure of PRTE0 and PRTE1 is as follows.
168 // -----------------------------------------------
169 // |/|RTS1|/| RPDB | RTS2 | RPDS |
170 // -----------------------------------------------
171 // 0 1 2 3 4 55 56 58 59 63
173 // RTS1[1:2] : Gives one fragment of the Radix treesize
174 // RTS2[56:58] : Gives the second fragment of the Radix Tree size.
175 // RTS = (RTS1 << 3 + RTS2) << 31,
176 // since minimal Radix Tree size is 4G.
178 // RPDB = Root Page Directory Base.
179 // RPDS = Logarithm of Root Page Directory Size right shifted by 3.
180 // Thus, Root page directory size = 1 << (RPDS + 3).
184 // -----------------------------------------------
186 // -----------------------------------------------
188 // All bits are reserved.
193 # see qemu/target/ppc/mmu-radix64.c for reference
195 def __init__(self
, mem
, caller
):
199 self
.dsisr
= self
.caller
.spr
["DSISR"]
200 self
.dar
= self
.caller
.spr
["DAR"]
201 self
.pidr
= self
.caller
.spr
["PIDR"]
202 self
.prtbl
= self
.caller
.spr
["PRTBL"]
204 # cached page table stuff
206 self
.pt0_valid
= False
208 self
.pt3_valid
= False
def __call__(self, addr, sz):
    """Read `sz` bytes at `addr` and return them as a SelectableInt.

    The raw value is fetched through self.ld() using addr.value with
    swap=False, reported on stdout, and then wrapped in a SelectableInt
    that is sz*8 bits wide.
    """
    raw = self.ld(addr.value, sz, swap=False)
    print("RADIX memread", addr, sz, raw)
    nbits = sz*8
    return SelectableInt(raw, nbits)
215 def ld(self
, address
, width
=8, swap
=True, check_in_mem
=False,
217 print("RADIX: ld from addr 0x%x width %d" % (address
, width
))
219 priv
= 1 # XXX TODO: read MSR PR bit here priv = not ctrl.msr(MSR_PR);
224 addr
= SelectableInt(address
, 64)
225 (shift
, mbits
, pgbase
) = self
._decode
_prte
(addr
)
226 #shift = SelectableInt(0, 32)
228 pte
= self
._walk
_tree
(addr
, pgbase
, mode
, mbits
, shift
, priv
)
229 # use pte to calculate phys address
230 return self
.mem
.ld(address
, width
, swap
, check_in_mem
)
232 # XXX set SPRs on error
235 def st(self
, address
, v
, width
=8, swap
=True):
236 print("RADIX: st to addr 0x%x width %d data %x" % (address
, width
, v
))
238 priv
= 1 # XXX TODO: read MSR PR bit here priv = not ctrl.msr(MSR_PR);
240 addr
= SelectableInt(address
, 64)
241 (shift
, mbits
, pgbase
) = self
._decode
_prte
(addr
)
242 pte
= self
._walk
_tree
(addr
, pgbase
, mode
, mbits
, shift
, priv
)
244 # use pte to calculate phys address (addr)
245 return self
.mem
.st(addr
.value
, v
, width
, swap
)
247 # XXX set SPRs on error
def memassign(self, addr, sz, val):
    """Store `val` at `addr` as `sz` bytes through self.st(), unswapped.

    Both addr and val are unwrapped via their .value attribute before
    being passed on. Nothing is returned.
    """
    print("memassign", addr, sz, val)
    target, payload = addr.value, val.value
    self.st(target, payload, sz, swap=False)
def _next_level(self, r):
    """Return the (valid, leaf) pair for entry `r`.

    The two flags are obtained from rpte_valid() and rpte_leaf().
    """
    valid = rpte_valid(r)
    leaf = rpte_leaf(r)
    return valid, leaf
258 ## Prepare for next iteration
260 def _walk_tree(self
, addr
, pgbase
, mode
, mbits
, shift
, priv
=1):
264 // vaddr |-----------------------------------------------------|
266 // |-----------|-----------------------------------------|
267 // | 0000000 | usefulBits = X bits (typically 52) |
268 // |-----------|-----------------------------------------|
269 // | |<--Cursize---->| |
273 // |-----------------------------------------------------|
276 // PDE |---------------------------| |
277 // |V|L|//| NLB |///|NLS| |
278 // |---------------------------| |
279 // PDE = Page Directory Entry |
280 // [0] = V = Valid Bit |
281 // [1] = L = Leaf bit. If 0, then |
282 // [4:55] = NLB = Next Level Base |
283 // right shifted by 8 |
284 // [59:63] = NLS = Next Level Size |
287 // | |--------------------------|
288 // | | usefulBits = X-Cursize |
289 // | |--------------------------|
290 // |---------------------><--NLS-->| |
294 // |--------------------------|
296 // If the next PDE obtained by |
297 // (NLB << 8 + 8 * index) is a |
298 // nonleaf, then repeat the above. |
300 // If the next PDE is a leaf, |
301 // then Leaf PDE structure is as |
306 // |------------------------------| |----------------|
307 // |V|L|sw|//|RPN|sw|R|C|/|ATT|EAA| | usefulBits |
308 // |------------------------------| |----------------|
309 // [0] = V = Valid Bit |
310 // [1] = L = Leaf Bit = 1 if leaf |
312 // [2] = Sw = Sw bit 0. |
313 // [7:51] = RPN = Real Page Number, V
314 // real_page = RPN << 12 -------------> Logical OR
315 // [52:54] = Sw Bits 1:3 |
316 // [55] = R = Reference |
317 // [56] = C = Change V
318 // [58:59] = Att = Physical Address
319 // 0b00 = Normal Memory
321 // 0b10 = Non Idempotent
322 // 0b11 = Tolerant I/O
323 // [60:63] = Encoded Access
329 pidr
= self
.caller
.spr
["PIDR"]
330 prtbl
= self
.caller
.spr
["PRTBL"]
334 print("last 8 bits ----------")
337 # get address of root entry
338 prtable_addr
= self
._get
_prtable
_addr
(shift
, prtbl
, addr
, pidr
)
339 print("prtable_addr",prtable_addr
)
341 # read root entry - incomplete
345 value
= self
.mem
.ld(prtable_addr
.value
, entry_width
, swap
, check_in_mem
)
346 data
= SelectableInt(value
, 64) # convert to SelectableInt
350 SelectableInt(0x8000000000000007, 64), #valid
351 SelectableInt(0xc000000000000000, 64) #exit
355 # walk tree starts on prtbl
357 print("nextlevel----------------------------")
358 l
= test_input
[index
]
360 valid
, leaf
= self
._next
_level
(l
)
361 print(" valid, leaf", valid
, leaf
)
363 ok
= self
._check
_perms
(data
, priv
, mode
)
364 # TODO: check permissions
366 data
= l
# TODO put actual data here
367 newlookup
= self
._new
_lookup
(data
, mbits
, shift
)
368 if newlookup
== 'badtree':
370 shift
, mask
, pgbase
= newlookup
371 print (" next level", shift
, mask
, pgbase
)
373 return None # TODO: return error
375 return None # TODO return something
377 def _new_lookup(self
, data
, mbits
, shift
):
379 mbits := unsigned('0' & data(4 downto 0));
380 if mbits < 5 or mbits > 16 or mbits > r.shift then
381 v.state := RADIX_FINISH;
382 v.badtree := '1'; -- throw error
384 v.shift := v.shift - mbits;
385 v.mask_size := mbits(4 downto 0);
386 v.pgbase := data(55 downto 8) & x"00"; NLB?
387 v.state := RADIX_LOOKUP; --> next level
391 print("mbits=", mbits
)
392 if mbits
< 5 or mbits
> 16:
395 shift
= shift
- mbits
396 mask_size
= mbits
[1:5] # get 4 LSBs
397 pgbase
= selectconcat(data
[8:56], SelectableInt(0, 8)) # shift up 8
398 return shift
, mask_size
, pgbase
400 def _decode_prte(self
, data
):
402 -----------------------------------------------
403 |/|RTS1|/| RPDB | RTS2 | RPDS |
404 -----------------------------------------------
405 0 1 2 3 4 55 56 58 59 63
407 # note that SelectableInt does big-endian! so the indices
408 # below *directly* match the spec, unlike microwatt which
409 # has to turn them around (to LE)
410 zero
= SelectableInt(0, 1)
411 rts
= selectconcat(zero
,
415 masksize
= data
[59:64] # RPDS
416 mbits
= selectconcat(zero
, masksize
)
417 pgbase
= selectconcat(data
[8:56], # part of RPDB
418 SelectableInt(0, 16),)
420 return (rts
, mbits
, pgbase
)
422 def _segment_check(self
, addr
, mbits
, shift
):
423 """checks segment valid
424 mbits := '0' & r.mask_size;
425 v.shift := r.shift + (31 - 12) - mbits;
426 nonzero := or(r.addr(61 downto 31) and not finalmask(30 downto 0));
427 if r.addr(63) /= r.addr(62) or nonzero = '1' then
428 v.state := RADIX_FINISH;
430 elsif mbits < 5 or mbits > 16 or mbits > (r.shift + (31 - 12)) then
431 v.state := RADIX_FINISH;
434 v.state := RADIX_LOOKUP;
436 # note that SelectableInt does big-endian! so the indices
437 # below *directly* match the spec, unlike microwatt which
438 # has to turn them around (to LE)
# builds a 44-bit mask from `shift` with genmask() and ANDs its slice
# [13:44] with addr[1:32]
439 mask
= genmask(shift
, 44)
440 nonzero
= addr
[1:32] & mask
[13:44] # mask 31 LSBs (BE numbered 13:44)
441 print ("RADIX _segment_check nonzero", bin(nonzero
.value
))
442 print ("RADIX _segment_check addr[0-1]", addr
[0].value
, addr
[1].value
)
# NOTE(review): the VHDL excerpt above reduces with or(...) (any bit set),
# applies `not finalmask`, and reads r.addr(61 downto 31).  Here the
# multi-bit result is compared against 1, the mask is used un-inverted,
# and addr[1:32] in BE numbering would be LE bits 62 downto 32 -- confirm
# whether `!= 0`, `~mask[13:44]` and addr[2:33] were intended.
443 if addr
[0] != addr
[1] or nonzero
== 1:
# upper bound for mbits, mirroring (r.shift + (31 - 12)) in the excerpt
445 limit
= shift
+ (31 - 12)
446 if mbits
< 5 or mbits
> 16 or mbits
> limit
:
448 new_shift
= shift
+ (31 - 12) - mbits
451 def _check_perms(self
, data
, priv
, mode
):
452 """check page permissions
454 // |------------------------------| |----------------|
455 // |V|L|sw|//|RPN|sw|R|C|/|ATT|EAA| | usefulBits |
456 // |------------------------------| |----------------|
457 // [0] = V = Valid Bit |
458 // [1] = L = Leaf Bit = 1 if leaf |
460 // [2] = Sw = Sw bit 0. |
461 // [7:51] = RPN = Real Page Number, V
462 // real_page = RPN << 12 -------------> Logical OR
463 // [52:54] = Sw Bits 1:3 |
464 // [55] = R = Reference |
465 // [56] = C = Change V
466 // [58:59] = Att = Physical Address
467 // 0b00 = Normal Memory
469 // 0b10 = Non Idempotent
470 // 0b11 = Tolerant I/O
471 // [60:63] = Encoded Access
475 -- check permissions and RC bits
477 if r.priv = '1' or data(3) = '0' then
478 if r.iside = '0' then
479 perm_ok := data(1) or (data(2) and not r.store);
481 -- no IAMR, so no KUEP support for now
482 -- deny execute permission if cache inhibited
483 perm_ok := data(0) and not data(5);
486 rc_ok := data(8) and (data(7) or not r.store);
487 if perm_ok = '1' and rc_ok = '1' then
488 v.state := RADIX_LOAD_TLB;
490 v.state := RADIX_FINISH;
491 v.perm_err := not perm_ok;
492 -- permission error takes precedence over RC error
493 v.rc_error := perm_ok;
496 # decode mode into something that matches microwatt equivalent code
497 instr_fetch
, store
= 0, 0
500 if mode
== 'EXECUTE':
503 # check permissions and RC bits
505 if priv
== 1 or data
[60] == 0:
507 perm_ok
= data
[62] |
(data
[61] & (store
== 0))
508 # no IAMR, so no KUEP support for now
509 # deny execute permission if cache inhibited
510 perm_ok
= data
[63] & ~data
[58]
511 rc_ok
= data
[55] & (data
[56] |
(store
== 0))
512 if perm_ok
== 1 and rc_ok
== 1:
515 return "perm_err" if perm_ok
== 0 else "rc_err"
517 def _get_prtable_addr(self
, shift
, prtbl
, addr
, pid
):
519 if r.addr(63) = '1' then
520 effpid := x"00000000";
524 x"00" & r.prtbl(55 downto 36) &
525 ((r.prtbl(35 downto 12) and not finalmask(23 downto 0)) or
526 (effpid(31 downto 8) and finalmask(23 downto 0))) &
527 effpid(7 downto 0) & "0000";
529 print ("_get_prtable_addr_", shift
, prtbl
, addr
, pid
)
530 finalmask
= genmask(shift
, 44)
531 finalmask24
= finalmask
[20:44]
532 if addr
[0].value
== 1:
533 effpid
= SelectableInt(0, 32)
535 effpid
= pid
#self.pid # TODO, check on this
536 zero16
= SelectableInt(0, 16)
537 zero4
= SelectableInt(0, 4)
538 res
= selectconcat(zero16
,
540 (prtbl
[28:52] & ~finalmask24
) |
#
541 (effpid
[0:24] & finalmask24
), #
547 def _get_pgtable_addr(self
, mask_size
, pgbase
, addrsh
):
# assembles a value with selectconcat(), starting from 8 zero bits, using a
# 16-bit mask from genmask(mask_size+5, 16); the two lines below are the
# hardware-description excerpt this is modelled on (presumably microwatt
# -- TODO confirm)
549 x"00" & r.pgbase(55 downto 19) &
550 ((r.pgbase(18 downto 3) and not mask) or (addrsh and mask)) &
553 mask16
= genmask(mask_size
+5, 16)
554 zero8
= SelectableInt(0, 8)
555 zero3
= SelectableInt(0, 3)
556 res
= selectconcat(zero8
,
# NOTE(review): `prtbl` is neither a parameter of this method nor assigned
# in the lines visible here, while the excerpt above uses
# r.pgbase(18 downto 3) for this field -- confirm whether pgbase[45:61]
# was intended.
558 (prtbl
[45:61] & ~mask16
) |
#
564 def _get_pte(self
, shift
, addr
, pde
):
567 ((r.pde(55 downto 12) and not finalmask) or
568 (r.addr(55 downto 12) and finalmask))
569 & r.pde(11 downto 0);
571 finalmask
= genmask(shift
, 44)
572 zero8
= SelectableInt(0, 8)
573 res
= selectconcat(zero8
,
574 (pde
[8:52] & ~finalmask
) |
#
575 (addr
[8:52] & finalmask
), #
581 # very quick test of genmask function (TODO, move to util later)
582 if __name__
== '__main__':
583 # set up dummy minimal ISACaller
584 spr
= {'DSISR': SelectableInt(0, 64),
585 'DAR': SelectableInt(0, 64),
586 'PIDR': SelectableInt(0, 64),
587 'PRTBL': SelectableInt(0, 64)
589 class ISACaller
: pass
593 shift
= SelectableInt(5, 6)
594 mask
= genmask(shift
, 43)
595 print (" mask", bin(mask
.value
))
597 mem
= Mem(row_bytes
=8)
598 mem
= RADIX(mem
, caller
)
599 # -----------------------------------------------
600 # |/|RTS1|/| RPDB | RTS2 | RPDS |
601 # -----------------------------------------------
602 # |0|1 2|3|4 55|56 58|59 63|
603 data
= SelectableInt(0, 64)
606 data
[59:64] = 0b01101 # mask
608 (rts
, mbits
, pgbase
) = mem
._decode
_prte
(data
)
609 print (" rts", bin(rts
.value
), rts
.bits
)
610 print (" mbits", bin(mbits
.value
), mbits
.bits
)
611 print (" pgbase", hex(pgbase
.value
), pgbase
.bits
)
612 addr
= SelectableInt(0x1000, 64)
613 check
= mem
._segment
_check
(addr
, mbits
, shift
)
614 print (" segment check", check
)
616 print("walking tree")
622 result
= mem
._walk
_tree
(addr
, pgbase
, mode
, mbits
, shift
)