power_insn: support PPC multi-records
[openpower-isa.git] / src / openpower / decoder / power_insn.py
index e0af08d2db600a0175e77971437b2bc4f528abec..d4baa44715b4902e8369567dd056cf14971ae4a5 100644 (file)
@@ -1,11 +1,9 @@
 import collections as _collections
-import copy as _copy
 import csv as _csv
 import dataclasses as _dataclasses
 import enum as _enum
 import functools as _functools
 import os as _os
-import operator as _operator
 import pathlib as _pathlib
 import re as _re
 
@@ -25,16 +23,28 @@ from openpower.decoder.power_enums import (
     CROutSel as _CROutSel,
     LDSTLen as _LDSTLen,
     LDSTMode as _LDSTMode,
-    RC as _RC,
+    RCOE as _RCOE,
     CryIn as _CryIn,
     Form as _Form,
     SVEtype as _SVEtype,
     SVMode as _SVMode,
     SVPtype as _SVPtype,
     SVExtra as _SVExtra,
+    RegType as _RegType,
     SVExtraRegType as _SVExtraRegType,
     SVExtraReg as _SVExtraReg,
 )
+from openpower.decoder.selectable_int import (
+    SelectableInt as _SelectableInt,
+    selectconcat as _selectconcat,
+)
+from openpower.decoder.power_fields import (
+    Field as _Field,
+    Array as _Array,
+    Mapping as _Mapping,
+    DecodeFields as _DecodeFields,
+)
+from openpower.decoder.pseudo.pagereader import ISA as _ISA
 
 
 def dataclass(cls, record, keymap=None, typemap=None):
@@ -179,7 +189,7 @@ class PPCRecord:
     comment: str
     flags: Flags = Flags()
     comment2: str = ""
-    unit: _Function = _Function.NONE
+    function: _Function = _Function.NONE
     intop: _MicrOp = _MicrOp.OP_ILLEGAL
     in1: _In1Sel = _In1Sel.RA
     in2: _In2Sel = _In2Sel.NONE
@@ -190,17 +200,19 @@ class PPCRecord:
     cry_in: _CryIn = _CryIn.ZERO
     ldst_len: _LDSTLen = _LDSTLen.NONE
     upd: _LDSTMode = _LDSTMode.NONE
-    rc: _RC = _RC.NONE
+    Rc: _RCOE = _RCOE.NONE
     form: _Form = _Form.NONE
     conditions: str = ""
     unofficial: bool = False
 
     __KEYMAP = {
+        "unit": "function",
         "internal op": "intop",
         "CR in": "cr_in",
         "CR out": "cr_out",
         "cry in": "cry_in",
         "ldst len": "ldst_len",
+        "rc": "Rc",
         "CONDITIONS": "conditions",
     }
 
@@ -217,15 +229,43 @@ class PPCRecord:
 
         return dataclass(cls, record, keymap=PPCRecord.__KEYMAP, typemap=typemap)
 
-    @property
-    def identifier(self):
-        return self.comment
-
     @cached_property
     def names(self):
         return frozenset(self.comment.split("=")[-1].split("/"))
 
 
+class PPCMultiRecord(tuple):
+    @cached_property
+    def unified(self):
+        def merge(lhs, rhs):
+            value = 0
+            mask = 0
+            lvalue = lhs.opcode.value
+            rvalue = rhs.opcode.value
+            lmask = lhs.opcode.mask
+            rmask = rhs.opcode.mask
+            bits = max(lmask.bit_length(), rmask.bit_length())
+            for bit in range(bits):
+                lvstate = ((lvalue & (1 << bit)) != 0)
+                rvstate = ((rvalue & (1 << bit)) != 0)
+                lmstate = ((lmask & (1 << bit)) != 0)
+                rmstate = ((rmask & (1 << bit)) != 0)
+                vstate = lvstate
+                mstate = True
+                if (not lmstate or not rmstate) or (lvstate != rvstate):
+                    vstate = 0
+                    mstate = 0
+                value |= (vstate << bit)
+                mask |= (mstate << bit)
+
+            return _dataclasses.replace(lhs, opcode=Opcode(value=value, mask=mask))
+
+        return _functools.reduce(merge, self)
+
+    def __getattr__(self, attr):
+        return getattr(self.unified, attr)
+
+
 @_dataclasses.dataclass(eq=True, frozen=True)
 class SVP64Record:
     class ExtraMap(tuple):
@@ -265,7 +305,7 @@ class SVP64Record:
         def __repr__(self):
             return repr({index:self[index] for index in range(0, 4)})
 
-    identifier: str
+    name: str
     ptype: _SVPtype = _SVPtype.NONE
     etype: _SVEtype = _SVEtype.NONE
     in1: _In1Sel = _In1Sel.NONE
@@ -276,18 +316,16 @@ class SVP64Record:
     cr_in: _CRInSel = _CRInSel.NONE
     cr_out: _CROutSel = _CROutSel.NONE
     extra: ExtraMap = ExtraMap()
-    pu: bool = False
     conditions: str = ""
     mode: _SVMode = _SVMode.NORMAL
 
     __KEYMAP = {
-        "insn": "identifier",
+        "insn": "name",
         "CONDITIONS": "conditions",
         "Ptype": "ptype",
         "Etype": "etype",
         "CR in": "cr_in",
         "CR out": "cr_out",
-        "PU": "pu",
     }
 
     @classmethod
@@ -379,7 +417,7 @@ class Fields:
 
         def transform(item):
             (name, bitrange) = item
-            return (name, tuple(bitrange.values()))
+            return (name, list(bitrange.values()))
 
         self.__mapping = dict(map(transform, items))
 
@@ -388,24 +426,179 @@ class Fields:
     def __repr__(self):
         return repr(self.__mapping)
 
+    def __iter__(self):
+        yield from self.__mapping.items()
+
     def __contains__(self, key):
         return self.__mapping.__contains__(key)
 
     def __getitem__(self, key):
-        return self.__mapping.__getitem__(key)
+        return self.__mapping.get(key, None)
+
+
+class Operands:
+    @_dataclasses.dataclass(eq=True, frozen=True)
+    class Operand:
+        name: str
+
+        def disassemble(self, value, record, verbose=False):
+            raise NotImplementedError
+
+    @_dataclasses.dataclass(eq=True, frozen=True)
+    class DynamicOperand(Operand):
+        def disassemble(self, value, record, verbose=False):
+            span = record.fields[self.name]
+            value = value[span]
+            if verbose:
+                return f"{int(value):0{value.bits}b} {span}"
+            else:
+                return str(int(value))
+
+    @_dataclasses.dataclass(eq=True, frozen=True)
+    class StaticOperand(Operand):
+        value: int
+
+        def disassemble(self, value, record, verbose=False):
+            span = record.fields[self.name]
+            value = value[span]
+            if verbose:
+                return f"{int(value):0{value.bits}b} {span}"
+            else:
+                return str(int(value))
+
+    @_dataclasses.dataclass(eq=True, frozen=True)
+    class DynamicOperandIFormLI(DynamicOperand):
+        @property
+        def name(self):
+            return "LI"
+
+        @name.setter
+        def name(self, _):
+            pass
+
+        def disassemble(self, value, record, verbose=False):
+            span = record.fields["LI"]
+            value = value[span]
+            if verbose:
+                hints = "(target_addr=EXTS(LI || 0b00)))"
+                return f"{int(value):0{value.bits}b} {span} {hints}"
+            else:
+                return hex(int(_selectconcat(value,
+                    _SelectableInt(value=0b00, bits=2))))
+
+    class DynamicOperandBFormBD(DynamicOperand):
+        @property
+        def name(self):
+            return "BD"
+
+        @name.setter
+        def name(self, _):
+            pass
+
+        def disassemble(self, value, record, verbose=False):
+            span = record.fields["BD"]
+            value = value[span]
+            if verbose:
+                hints = "(target_addr=EXTS(BD || 0b00))"
+                return f"{int(value):0{value.bits}b} {span} {hints}"
+            else:
+                return hex(int(_selectconcat(value,
+                    _SelectableInt(value=0b00, bits=2))))
+
+    @_dataclasses.dataclass(eq=True, frozen=True)
+    class DynamicOperandGPR(DynamicOperand):
+        def disassemble(self, value, record, verbose=False):
+            result = super().disassemble(value=value,
+                record=record, verbose=verbose)
+            if not verbose:
+                result = f"r{result}"
+            return result
+
+    @_dataclasses.dataclass(eq=True, frozen=True)
+    class DynamicOperandFPR(DynamicOperand):
+        def disassemble(self, value, record, verbose=False):
+            result = super().disassemble(value=value,
+                record=record, verbose=verbose)
+            if not verbose:
+                result = f"f{result}"
+            return result
+
+    def __init__(self, insn, iterable):
+        branches = {
+            "b": {"LI": self.__class__.DynamicOperandIFormLI},
+            "ba": {"LI": self.__class__.DynamicOperandIFormLI},
+            "bl": {"LI": self.__class__.DynamicOperandIFormLI},
+            "bla": {"LI": self.__class__.DynamicOperandIFormLI},
+            "bc": {"BD": self.__class__.DynamicOperandBFormBD},
+            "bca": {"BD": self.__class__.DynamicOperandBFormBD},
+            "bcl": {"BD": self.__class__.DynamicOperandBFormBD},
+            "bcla": {"BD": self.__class__.DynamicOperandBFormBD},
+        }
+
+        operands = []
+        for operand in iterable:
+            dynamic_cls = self.__class__.DynamicOperand
+            static_cls = self.__class__.StaticOperand
+
+            if "=" in operand:
+                (name, value) = operand.split("=")
+                operand = static_cls(name=name, value=int(value))
+            else:
+                if insn in branches and operand in branches[insn]:
+                    dynamic_cls = branches[insn][operand]
+
+                if operand in _RegType.__members__:
+                    regtype = _RegType[operand]
+                    if regtype is _RegType.GPR:
+                        dynamic_cls = self.__class__.DynamicOperandGPR
+                    elif regtype is _RegType.FPR:
+                        dynamic_cls = self.__class__.DynamicOperandFPR
+
+                operand = dynamic_cls(name=operand)
+
+            operands.append(operand)
+
+        self.__operands = operands
+
+        return super().__init__()
+
+    def __repr__(self):
+        return self.__operands.__repr__()
+
+    def __iter__(self):
+        yield from self.__operands
+
+    def __contains__(self, key):
+        return self.__getitem__(key) is not None
+
+    def __getitem__(self, key):
+        for operand in self.__operands:
+            if operand.name == key:
+                return operand
 
-    def get(self, key, default):
-        return self.__mapping.get(key, default)
+        return None
+
+    @property
+    def dynamic(self):
+        for operand in self:
+            if isinstance(operand, self.__class__.DynamicOperand):
+                yield operand
+
+    @property
+    def static(self):
+        for operand in self:
+            if isinstance(operand, self.__class__.StaticOperand):
+                yield operand
 
 
 @_functools.total_ordering
 @_dataclasses.dataclass(eq=True, frozen=True)
-class Instruction:
+class Record:
     name: str
-    rc: bool
     section: Section
     ppc: PPCRecord
     fields: Fields
+    operands: Operands
     svp64: SVP64Record = None
 
     __EXTRA = (
@@ -416,13 +609,10 @@ class Instruction:
     )
 
     def __lt__(self, other):
-        if not isinstance(other, Instruction):
+        if not isinstance(other, Record):
             return NotImplemented
         return (self.opcode < other.opcode)
 
-    def __repr__(self):
-        return f"{self.__class__.__name__}(name={self.name!r}, opcode={self.opcode})"
-
     @cached_property
     def opcode(self):
         fields = []
@@ -432,14 +622,15 @@ class Instruction:
         else:
             fields += [(self.ppc.opcode.value, self.section.bitsel)]
 
-        # Some instructions are special regarding Rc handling.
-        # They are marked with Rc.ONE, but don't have Rc field.
-        # At least addic., andi., andis. belong to this list.
-        if self.rc and "Rc" in self.fields:
-            fields += [(1, self.fields["Rc"])]
+        for operand in self.operands.static:
+            fields += [(operand.value, self.fields[operand.name])]
 
         return FieldsOpcode(fields)
 
+    @property
+    def function(self):
+        return self.ppc.function
+
     @property
     def in1(self):
         return self.ppc.in1
@@ -490,7 +681,7 @@ class Instruction:
         }
         for index in range(0, 4):
             for entry in self.svp64.extra[index]:
-                extra_map[entry.regtype][entry.reg] = Instruction.__EXTRA[index]
+                extra_map[entry.regtype][entry.reg] = Record.__EXTRA[index]
 
         for regtype in (_SVExtraRegType.SRC, _SVExtraRegType.DST):
             extra = extra_map[regtype].get(reg, _SVExtra.NONE)
@@ -520,112 +711,654 @@ class Instruction:
         return self.svp64.etype
 
 
-class Database:
-    def __init__(self, root):
-        root = _pathlib.Path(root)
+class Instruction(_Mapping):
+    @classmethod
+    def integer(cls, value=0, bits=None, byteorder="little"):
+        if isinstance(value, (int, bytes)) and not isinstance(bits, int):
+            raise ValueError(bits)
+
+        if isinstance(value, bytes):
+            if ((len(value) * 8) != bits):
+                raise ValueError(f"bit length mismatch")
+            value = int.from_bytes(value, byteorder=byteorder)
 
-        def parse(stream, factory):
-            lines = filter(lambda line: not line.strip().startswith("#"), stream)
-            entries = _csv.DictReader(lines)
-            entries = filter(lambda entry: "TODO" not in frozenset(entry.values()), entries)
-            return tuple(map(factory, entries))
-
-        def database_ppc(root):
-            db = _collections.defaultdict(set)
-            path = (root / "insndb.csv")
-            with open(path, "r", encoding="UTF-8") as stream:
-                for section in parse(stream, Section.CSV):
-                    path = (root / section.path)
-                    opcode_cls = {
-                        section.Mode.INTEGER: IntegerOpcode,
-                        section.Mode.PATTERN: PatternOpcode,
-                    }[section.mode]
-                    factory = _functools.partial(PPCRecord.CSV, opcode_cls=opcode_cls)
-                    with open(path, "r", encoding="UTF-8") as stream:
-                        db[section].update(parse(stream, factory))
-            for (section, records) in db.items():
-                db[section] = {record.identifier:record for record in records}
-            return db
-
-        def database_svp64(root):
-            db = set()
-            pattern = _re.compile(r"^(?:LDST)?RM-(1P|2P)-.*?\.csv$")
-            for (prefix, _, names) in _os.walk(root):
-                prefix = _pathlib.Path(prefix)
-                for name in filter(lambda name: pattern.match(name), names):
-                    path = (prefix / _pathlib.Path(name))
-                    with open(path, "r", encoding="UTF-8") as stream:
-                        db.update(parse(stream, SVP64Record.CSV))
-            db = {record.identifier:record for record in db}
-            return db
-
-        def database_forms(root):
-            # This is hack. The whole code there should be moved here.
-            # The fields.text parser should take care of the validation.
-            from openpower.decoder.power_fields import DecodeFields as _DecodeFields
-            db = {}
-            df = _DecodeFields()
-            df.create_specs()
-            for (form, fields) in df.instrs.items():
-                if form in {"DQE", "TX"}:
-                    continue
-                if form == "all":
-                    form = "NONE"
-                db[_Form[form]] = Fields(fields)
-            return db
-
-        def database(ppcdb, svp64db, formsdb):
-            items = set()
-            for section in ppcdb:
-                for (identifier, ppc) in ppcdb[section].items():
-                    fields = formsdb[ppc.form]
-                    svp64 = svp64db.get(identifier)
-                    if ppc.rc is _RC.ONE:
-                        variants = {name:True for name in ppc.names}
-                    elif ppc.rc is _RC.RC:
-                        variants = {name:False for name in ppc.names}
-                        variants.update({f"{name}.":True for name in ppc.names})
+        if isinstance(value, int):
+            value = _SelectableInt(value=value, bits=bits)
+        elif isinstance(value, Instruction):
+            value = value.storage
+
+        if not isinstance(value, _SelectableInt):
+            raise ValueError(value)
+        if bits is None:
+            bits = len(cls)
+        if len(value) != bits:
+            raise ValueError(value)
+
+        value = _SelectableInt(value=value, bits=bits)
+
+        return cls(storage=value)
+
+    def __hash__(self):
+        return hash(int(self))
+
+    def disassemble(self, db, byteorder="little", verbose=False):
+        raise NotImplementedError
+
+
+class WordInstruction(Instruction):
+    _: _Field = range(0, 32)
+    po: _Field = range(0, 6)
+
+    @classmethod
+    def integer(cls, value, byteorder="little"):
+        return super().integer(bits=32, value=value, byteorder=byteorder)
+
+    def spec(self, record):
+        dynamic_operands = []
+        for operand in record.operands.dynamic:
+            dynamic_operands.append(operand.name)
+        static_operands = []
+        for operand in record.operands.static:
+            static_operands.append(f"{operand.name}={operand.value}")
+        operands = ""
+        if dynamic_operands:
+            operands += f" {','.join(dynamic_operands)}"
+        if static_operands:
+            operands += f" ({' '.join(static_operands)})"
+        return f"{record.name}{operands}"
+
+    def opcode(self, record):
+        return f"0x{record.opcode.value:08x}"
+
+    def mask(self, record):
+        return f"0x{record.opcode.mask:08x}"
+
+    def disassemble(self, db, byteorder="little", verbose=False):
+        integer = int(self)
+        blob = integer.to_bytes(length=4, byteorder=byteorder)
+        blob = " ".join(map(lambda byte: f"{byte:02x}", blob))
+
+        record = db[self]
+        if record is None:
+            yield f"{blob}    .long 0x{integer:08x}"
+            return
+
+        operands = []
+        for operand in record.operands.dynamic:
+            operand = operand.disassemble(value=self,
+                record=record, verbose=False)
+            operands.append(operand)
+        if operands:
+            operands = ",".join(operands)
+            operands = f" {operands}"
+        else:
+            operands = ""
+
+        yield f"{blob}    {record.name}{operands}"
+
+        if verbose:
+            lindent = (" " * 4)
+            rindent = (len(blob) - len(lindent))
+            spec = self.spec(record=record)
+            opcode = self.opcode(record=record)
+            mask = self.mask(record=record)
+            yield f"{lindent}{'spec':{rindent}}{spec}"
+            yield f"{lindent}{'opcode':{rindent}}{opcode}"
+            yield f"{lindent}{'mask':{rindent}}{mask}"
+            for operand in record.operands:
+                name = operand.name
+                value = operand.disassemble(value=self,
+                    record=record, verbose=True)
+                yield f"{lindent}{name:{rindent}}{value}"
+
+
+class PrefixedInstruction(Instruction):
+    class Prefix(WordInstruction.remap(range(0, 32))):
+        pass
+
+    class Suffix(WordInstruction.remap(range(32, 64))):
+        pass
+
+    _: _Field = range(64)
+    prefix: Prefix
+    suffix: Suffix
+    po: Suffix.po
+
+    @classmethod
+    def integer(cls, value, byteorder="little"):
+        return super().integer(bits=64, value=value, byteorder=byteorder)
+
+    @classmethod
+    def pair(cls, prefix=0, suffix=0, byteorder="little"):
+        def transform(value):
+            return WordInstruction.integer(value=value,
+                byteorder=byteorder)[0:32]
+
+        (prefix, suffix) = map(transform, (prefix, suffix))
+        value = _selectconcat(prefix, suffix)
+
+        return super().integer(value=value)
+
+
+class Mode(_Mapping):
+    _: _Field = range(0, 5)
+    sel: _Field = range(0, 2)
+
+
+class NormalMode(Mode):
+    class simple(Mode):
+        """simple mode"""
+        dz: Mode[3]
+        sz: Mode[4]
+
+    class smr(Mode):
+        """scalar reduce mode (mapreduce), SUBVL=1"""
+        RG: Mode[4]
+
+    class pmr(Mode):
+        """parallel reduce mode (mapreduce), SUBVL=1"""
+        pass
+
+    class svmr(Mode):
+        """subvector reduce mode, SUBVL>1"""
+        SVM: Mode[3]
+
+    class pu(Mode):
+        """Pack/Unpack mode, SUBVL>1"""
+        SVM: Mode[3]
+
+    class ffrc1(Mode):
+        """Rc=1: ffirst CR sel"""
+        inv: Mode[2]
+        CRbit: Mode[3, 4]
+
+    class ffrc0(Mode):
+        """Rc=0: ffirst z/nonz"""
+        inv: Mode[2]
+        VLi: Mode[3]
+        RC1: Mode[4]
+
+    class sat(Mode):
+        """sat mode: N=0/1 u/s, SUBVL=1"""
+        N: Mode[2]
+        dz: Mode[3]
+        sz: Mode[4]
+
+    class satx(Mode):
+        """sat mode: N=0/1 u/s, SUBVL>1"""
+        N: Mode[2]
+        zz: Mode[3]
+        dz: Mode[3]
+        sz: Mode[3]
+
+    class satpu(Mode):
+        """Pack/Unpack sat mode: N=0/1 u/s, SUBVL>1"""
+        N: Mode[2]
+        zz: Mode[3]
+        dz: Mode[3]
+        sz: Mode[3]
+
+    class prrc1(Mode):
+        """Rc=1: pred-result CR sel"""
+        inv: Mode[2]
+        CRbit: Mode[3, 4]
+
+    class prrc0(Mode):
+        """Rc=0: pred-result z/nonz"""
+        inv: Mode[2]
+        zz: Mode[3]
+        RC1: Mode[4]
+        dz: Mode[3]
+        sz: Mode[3]
+
+    simple: simple
+    smr: smr
+    pmr: pmr
+    svmr: svmr
+    pu: pu
+    ffrc1: ffrc1
+    ffrc0: ffrc0
+    sat: sat
+    satx: satx
+    satpu: satpu
+    prrc1: prrc1
+    prrc0: prrc0
+
+
+class LDSTImmMode(Mode):
+    class simple(Mode):
+        """simple mode"""
+        zz: Mode[3]
+        els: Mode[4]
+        dz: Mode[3]
+        sz: Mode[3]
+
+    class spu(Mode):
+        """Structured Pack/Unpack"""
+        zz: Mode[3]
+        els: Mode[4]
+        dz: Mode[3]
+        sz: Mode[3]
+
+    class ffrc1(Mode):
+        """Rc=1: ffirst CR sel"""
+        inv: Mode[2]
+        CRbit: Mode[3, 4]
+
+    class ffrc0(Mode):
+        """Rc=0: ffirst z/nonz"""
+        inv: Mode[2]
+        els: Mode[3]
+        RC1: Mode[4]
+
+    class sat(Mode):
+        """sat mode: N=0/1 u/s"""
+        N: Mode[2]
+        zz: Mode[3]
+        els: Mode[4]
+        dz: Mode[3]
+        sz: Mode[3]
+
+    class prrc1(Mode):
+        """Rc=1: pred-result CR sel"""
+        inv: Mode[2]
+        CRbit: Mode[3, 4]
+
+    class prrc0(Mode):
+        """Rc=0: pred-result z/nonz"""
+        inv: Mode[2]
+        els: Mode[3]
+        RC1: Mode[4]
+
+    simple: simple
+    spu: spu
+    ffrc1: ffrc1
+    ffrc0: ffrc0
+    sat: sat
+    prrc1: prrc1
+    prrc0: prrc0
+
+
+class LDSTIdxMode(Mode):
+    class simple(Mode):
+        """simple mode"""
+        SEA: Mode[2]
+        sz: Mode[3]
+        dz: Mode[3]
+
+    class stride(Mode):
+        """strided (scalar only source)"""
+        SEA: Mode[2]
+        dz: Mode[3]
+        sz: Mode[4]
+
+    class sat(Mode):
+        """sat mode: N=0/1 u/s"""
+        N: Mode[2]
+        dz: Mode[3]
+        sz: Mode[4]
+
+    class prrc1(Mode):
+        """Rc=1: pred-result CR sel"""
+        inv: Mode[2]
+        CRbit: Mode[3, 4]
+
+    class prrc0(Mode):
+        """Rc=0: pred-result z/nonz"""
+        inv: Mode[2]
+        zz: Mode[3]
+        RC1: Mode[4]
+        dz: Mode[3]
+        sz: Mode[3]
+
+    simple: simple
+    stride: stride
+    sat: sat
+    prrc1: prrc1
+    prrc0: prrc0
+
+
+class RM(_Mapping):
+    class Mode(Mode):
+        normal: NormalMode
+        ldst_imm: LDSTImmMode
+        ldst_idx: LDSTIdxMode
+
+    _: _Field = range(24)
+    mmode: _Field = (0,)
+    mask: _Field = range(1, 4)
+    elwidth: _Field = range(4, 6)
+    ewsrc: _Field = range(6, 8)
+    subvl: _Field = range(8, 10)
+    extra: _Field = range(10, 19)
+    mode: Mode.remap(range(19, 24))
+    extra2: _Array[4] = (
+        range(10, 12),
+        range(12, 14),
+        range(14, 16),
+        range(16, 18),
+    )
+    smask: _Field = range(16, 19)
+    extra3: _Array[3] = (
+        range(10, 13),
+        range(13, 16),
+        range(16, 19),
+    )
+
+
+class SVP64Instruction(PrefixedInstruction):
+    """SVP64 instruction: https://libre-soc.org/openpower/sv/svp64/"""
+    class Prefix(PrefixedInstruction.Prefix):
+        id: _Field = (7, 9)
+        rm: RM.remap((6, 8) + tuple(range(10, 32)))
+
+    prefix: Prefix
+
+    def disassemble(self, db, byteorder="little", verbose=False):
+        integer_prefix = int(self.prefix)
+        blob_prefix = integer_prefix.to_bytes(length=4, byteorder=byteorder)
+        blob_prefix = " ".join(map(lambda byte: f"{byte:02x}", blob_prefix))
+
+        integer_suffix = int(self.suffix)
+        blob_suffix = integer_suffix.to_bytes(length=4, byteorder=byteorder)
+        blob_suffix = " ".join(map(lambda byte: f"{byte:02x}", blob_suffix))
+
+        record = db[self.suffix]
+        if record is None or record.svp64 is None:
+            yield f"{blob_prefix}    .long 0x{int(self.prefix):08x}"
+            yield f"{blob_suffix}    .long 0x{int(self.suffix):08x}"
+            return
+
+        Rc = False
+        if record.operands["Rc"] is not None:
+            Rc = bool(self[record.fields["Rc"]])
+
+        subvl = self.prefix.rm.subvl
+        mode = self.prefix.rm.mode
+        sel = mode.sel
+
+        if record.svp64.mode is _SVMode.NORMAL:
+            mode = mode.normal
+            if sel == 0b00:
+                if mode[2] == 0b0:
+                    mode = mode.simple
+                else:
+                    if subvl == 0b00:
+                        if mode[3] == 0b0:
+                            mode = mode.smr
+                        else:
+                            mode = mode.pmr
                     else:
-                        variants = {name:False for name in ppc.names}
-                    for (name, rc) in variants.items():
-                        items.add(Instruction(name=name, rc=rc,
-                            section=section, ppc=ppc, fields=fields, svp64=svp64))
+                        if mode[4] == 0b0:
+                            mode = mode.svmr
+                        else:
+                            mode = mode.pu
+            elif sel == 0b01:
+                if Rc:
+                    mode = mode.ffrc1
+                else:
+                    mode = mode.ffrc0
+            elif sel == 0b10:
+                if subvl == 0b00:
+                    mode = mode.sat
+                else:
+                    if mode[4]:
+                        mode = mode.satx
+                    else:
+                        mode = mode.satpu
+            elif sel == 0b11:
+                if Rc:
+                    mode = mode.prrc1
+                else:
+                    mode = mode.prrc0
+        elif record.svp64.mode is _SVMode.LDST_IMM:
+            mode = mode.ldst_imm
+            if sel == 0b00:
+                if mode[2] == 0b0:
+                    mode = mode.simple
+                else:
+                    mode = mode.spu
+            elif sel == 0b01:
+                if Rc:
+                    mode = mode.ffrc1
+                else:
+                    mode = mode.ffrc0
+            elif sel == 0b10:
+                mode = mode.sat
+            elif sel == 0b11:
+                if Rc:
+                    mode = mode.prrc1
+                else:
+                    mode = mode.prrc0
+        elif record.svp64.mode is _SVMode.LDST_IMM:
+            mode = mode.ldst_idx
+            if mode.sel == 0b00:
+                mode = mode.simple
+            elif mode.sel == 0b01:
+                mode = mode.stride
+            elif mode.sel == 0b10:
+                mode = mode.sat
+            elif mode.sel == 0b11:
+                if Rc:
+                    mode = mode.prrc1
+                else:
+                    mode = mode.prrc0
 
-            items = tuple(sorted(items, key=_operator.attrgetter("opcode")))
-            opcodes = {item.opcode:item for item in items}
-            names = {item.name:item for item in sorted(items, key=_operator.attrgetter("name"))}
+        if type(mode) is Mode:
+            raise NotImplementedError
 
-            return (items, opcodes, names)
+        yield f"{blob_prefix}    sv.{record.name}"
+        yield f"{blob_suffix}"
 
-        ppcdb = database_ppc(root)
-        svp64db = database_svp64(root)
-        formsdb = database_forms(root)
 
-        (items, opcodes, names) = database(ppcdb, svp64db, formsdb)
-        self.__items = items
-        self.__opcodes = opcodes
-        self.__names = names
+def parse(stream, factory):
+    lines = filter(lambda line: not line.strip().startswith("#"), stream)
+    entries = _csv.DictReader(lines)
+    entries = filter(lambda entry: "TODO" not in frozenset(entry.values()), entries)
+    return tuple(map(factory, entries))
+
+
+class MarkdownDatabase:
+    def __init__(self):
+        db = {}
+        for (name, desc) in _ISA():
+            operands = []
+            if desc.regs:
+                (dynamic, *static) = desc.regs
+                operands.extend(dynamic)
+                operands.extend(static)
+            db[name] = Operands(insn=name, iterable=operands)
+        self.__db = db
+        return super().__init__()
+
+    def __iter__(self):
+        yield from self.__db.items()
+
+    def __getitem__(self, key):
+        return self.__db.__getitem__(key)
+
+
+class FieldsDatabase:
+    def __init__(self):
+        db = {}
+        df = _DecodeFields()
+        df.create_specs()
+        for (form, fields) in df.instrs.items():
+            if form in {"DQE", "TX"}:
+                continue
+            if form == "all":
+                form = "NONE"
+            db[_Form[form]] = Fields(fields)
+
+        self.__db = db
+
+        return super().__init__()
+
+    def __getitem__(self, key):
+        return self.__db.__getitem__(key)
+
+
+class PPCDatabase:
+    def __init__(self, root, mdwndb, fieldsdb):
+        # The code below groups the instructions by section:identifier.
+        # We use the comment as an identifier, there's nothing better.
+        # The point is to capture different opcodes for the same instruction.
+        dd = _collections.defaultdict
+        records = dd(lambda: dd(set))
+        path = (root / "insndb.csv")
+        with open(path, "r", encoding="UTF-8") as stream:
+            for section in parse(stream, Section.CSV):
+                path = (root / section.path)
+                opcode_cls = {
+                    section.Mode.INTEGER: IntegerOpcode,
+                    section.Mode.PATTERN: PatternOpcode,
+                }[section.mode]
+                factory = _functools.partial(PPCRecord.CSV, opcode_cls=opcode_cls)
+                with open(path, "r", encoding="UTF-8") as stream:
+                    for insn in parse(stream, factory):
+                        records[section][insn.comment].add(insn)
+
+        db = dd(set)
+        for (section, group) in records.items():
+            for records in group.values():
+                db[section].add(PPCMultiRecord(records))
+
+        self.__db = db
+        self.__mdwndb = mdwndb
+        self.__fieldsdb = fieldsdb
+
+        return super().__init__()
+
+    def __getitem__(self, key):
+        def exact_match(key, record):
+            for name in record.names:
+                if name == key:
+                    return True
+
+            return False
+
+        def Rc_match(key, record):
+            if not key.endswith("."):
+                return False
+
+            if not record.Rc is _RCOE.RC:
+                return False
+
+            return exact_match(key[:-1], record)
+
+        def LK_match(key, record):
+            if not key.endswith("l"):
+                return False
+
+            if "lk" not in record.flags:
+                return False
+
+            return exact_match(key[:-1], record)
+
+        def AA_match(key, record):
+            if not key.endswith("a"):
+                return False
+
+            if record.intop not in {_MicrOp.OP_B, _MicrOp.OP_BC}:
+                return False
+
+            if self.__mdwndb[key]["AA"] is None:
+                return False
+
+            return (exact_match(key[:-1], record) or
+                LK_match(key[:-1], record))
+
+        for (section, records) in self.__db.items():
+            for record in records:
+                if (exact_match(key, record) or
+                        Rc_match(key, record) or
+                        LK_match(key, record) or
+                        AA_match(key, record)):
+                    return (section, record)
+
+        return (None, None)
+
+
+class SVP64Database:
+    def __init__(self, root, ppcdb):
+        db = set()
+        pattern = _re.compile(r"^(?:LDST)?RM-(1P|2P)-.*?\.csv$")
+        for (prefix, _, names) in _os.walk(root):
+            prefix = _pathlib.Path(prefix)
+            for name in filter(lambda name: pattern.match(name), names):
+                path = (prefix / _pathlib.Path(name))
+                with open(path, "r", encoding="UTF-8") as stream:
+                    db.update(parse(stream, SVP64Record.CSV))
+
+        self.__db = {record.name:record for record in db}
+        self.__ppcdb = ppcdb
+
+        return super().__init__()
+
+    def __getitem__(self, key):
+        (_, record) = self.__ppcdb[key]
+        if record is None:
+            return None
+
+        for name in record.names:
+            record = self.__db.get(name, None)
+            if record is not None:
+                return record
+
+        return None
+
+
+class Database:
+    def __init__(self, root):
+        root = _pathlib.Path(root)
+
+        mdwndb = MarkdownDatabase()
+        fieldsdb = FieldsDatabase()
+        ppcdb = PPCDatabase(root=root, mdwndb=mdwndb, fieldsdb=fieldsdb)
+        svp64db = SVP64Database(root=root, ppcdb=ppcdb)
+
+        db = set()
+        for (name, operands) in mdwndb:
+            (section, ppc) = ppcdb[name]
+            if ppc is None:
+                continue
+            svp64 = svp64db[name]
+            fields = fieldsdb[ppc.form]
+            record = Record(name=name,
+                section=section, ppc=ppc, svp64=svp64,
+                operands=operands, fields=fields)
+            db.add(record)
+
+        self.__db = tuple(sorted(db))
 
         return super().__init__()
 
     def __repr__(self):
-        return repr(self.__items)
+        return repr(self.__db)
 
     def __iter__(self):
-        yield from self.__items
+        yield from self.__db
 
+    @_functools.lru_cache(maxsize=None)
     def __contains__(self, key):
-        if isinstance(key, int):
-            return self.__opcodes.__contains__(key)
-        elif isinstance(key, str):
-            return self.__names.__contains__(key)
-        else:
-            raise KeyError(key)
+        return self.__getitem__(key) is not None
 
+    @_functools.lru_cache(maxsize=None)
     def __getitem__(self, key):
-        if isinstance(key, int):
-            return self.__opcodes.__getitem__(key)
+        if isinstance(key, (int, Instruction)):
+            key = int(key)
+            for record in self:
+                opcode = record.opcode
+                if ((opcode.value & opcode.mask) ==
+                        (key & opcode.mask)):
+                    return record
+            return None
+        elif isinstance(key, Opcode):
+            for record in self:
+                if record.opcode == key:
+                    return record
         elif isinstance(key, str):
-            return self.__names.__getitem__(key)
-        else:
-            raise KeyError(key)
+            for record in self:
+                if record.name == key:
+                    return record
+        return None