rename InternalOp to MicrOp

[soc.git] / src / soc / fu / alu / main_stage.py
diff --git a/src/soc/fu/alu/main_stage.py b/src/soc/fu/alu/main_stage.py

index 28c6b4d3c1edf14e22309c1dac49bac6e3d1bd05..719a9a731e4c9c5f637f574fbf01203fea36df28 100644 (file)
--- a/src/soc/fu/alu/main_stage.py
+++ b/src/soc/fu/alu/main_stage.py
@@ -8,7 +8,12 @@ from nmutil.pipemodbase import PipeModBase
  from nmutil.extend import exts
  from soc.fu.alu.pipe_data import ALUInputData, ALUOutputData
  from ieee754.part.partsig import PartitionedSignal
-from soc.decoder.power_enums import InternalOp
+from soc.decoder.power_enums import MicrOp
+
+
+# overflow flag, as in microwatt's calc_ov: operand MSBs equal, carry != result MSB.
+def calc_ov(msb_a, msb_b, ca, msb_r):
+    return (ca ^ msb_r) & ~(msb_a ^ msb_b)
  
  
  class ALUMainStage(PipeModBase):
@@ -41,63 +46,68 @@ class ALUMainStage(PipeModBase):
          add_a = Signal(a.width + 2, reset_less=True)
          add_b = Signal(a.width + 2, reset_less=True)
          add_o = Signal(a.width + 2, reset_less=True)
-        with m.If((op.insn_type == InternalOp.OP_ADD) |
-                  (op.insn_type == InternalOp.OP_CMP)):
+        with m.If((op.insn_type == MicrOp.OP_ADD) |
+                  (op.insn_type == MicrOp.OP_CMP)):
              # in bit 0, 1+carry_in creates carry into bit 1 and above
              comb += add_a.eq(Cat(cry_i[0], a, Const(0, 1)))
              comb += add_b.eq(Cat(Const(1, 1), b, Const(0, 1)))
              comb += add_o.eq(add_a + add_b)
  
-        comb += o.ok.eq(1) # overridden to 0 if op not handled
-
          ##########################
          # main switch-statement for handling arithmetic operations
  
          with m.Switch(op.insn_type):
              #### CMP, CMPL ####
-            with m.Case(InternalOp.OP_CMP):
+            with m.Case(MicrOp.OP_CMP):
                  # this is supposed to be inverted (b-a, not a-b)
                  # however we have a trick: instead of adding either 2x 64-bit
                  # MUXes to invert a and b, or messing with a 64-bit output,
                  # swap +ve and -ve test in the *output* stage using an XOR gate
                  comb += o.data.eq(add_o[1:-1])
+                comb += o.ok.eq(0) # use o.data but do *not* actually output
  
              #### add ####
-            with m.Case(InternalOp.OP_ADD):
+            with m.Case(MicrOp.OP_ADD):
                  # bit 0 is not part of the result, top bit is the carry-out
                  comb += o.data.eq(add_o[1:-1])
+                comb += o.ok.eq(1) # output register
  
                  # see microwatt OP_ADD code
                  # https://bugs.libre-soc.org/show_bug.cgi?id=319#c5
-                comb += cry_o.data[0].eq(add_o[-1]) # XER.CO
-                comb += cry_o.data[1].eq(add_o[33] ^ (a[32] ^ b[32])) # XER.CO32
+                ca = Signal(2, reset_less=True)
+                comb += ca[0].eq(add_o[-1])                   # XER.CA
+                comb += ca[1].eq(add_o[33] ^ (a[32] ^ b[32])) # XER.CA32
+                comb += cry_o.data.eq(ca)
                  comb += cry_o.ok.eq(1)
-                comb += ov_o.data[0].eq((add_o[-2] != a[-1]) & (a[-1] == b[-1]))
-                comb += ov_o.data[1].eq((add_o[32] != a[31]) & (a[31] == b[31]))
+                # 32-bit (ov[1]) and 64-bit (ov[0]) overflow
+                ov = Signal(2, reset_less=True)
+                comb += ov[0].eq(calc_ov(a[-1], b[-1], ca[0], add_o[-2]))
+                comb += ov[1].eq(calc_ov(a[31], b[31], ca[1], add_o[32]))
+                comb += ov_o.data.eq(ov)
                  comb += ov_o.ok.eq(1)
  
              #### exts (sign-extend) ####
-            with m.Case(InternalOp.OP_EXTS):
+            with m.Case(MicrOp.OP_EXTS):
                  with m.If(op.data_len == 1):
                      comb += o.data.eq(exts(a, 8, 64))
                  with m.If(op.data_len == 2):
                      comb += o.data.eq(exts(a, 16, 64))
                  with m.If(op.data_len == 4):
                      comb += o.data.eq(exts(a, 32, 64))
+                comb += o.ok.eq(1) # output register
  
              #### cmpeqb ####
-            with m.Case(InternalOp.OP_CMPEQB):
+            with m.Case(MicrOp.OP_CMPEQB):
                  eqs = Signal(8, reset_less=True)
                  src1 = Signal(8, reset_less=True)
                  comb += src1.eq(a[0:8])
                  for i in range(8):
                      comb += eqs[i].eq(src1 == b[8*i:8*(i+1)])
+                comb += o.data[0].eq(eqs.any())
+                comb += o.ok.eq(0) # use o.data but do *not* actually output
                  comb += cr0.data.eq(Cat(Const(0, 2), eqs.any(), Const(0, 1)))
                  comb += cr0.ok.eq(1)
  
-            with m.Default():
-                comb += o.ok.eq(0)
-
          ###### sticky overflow and context, both pass-through #####
  
          comb += self.o.xer_so.data.eq(self.i.xer_so)