techmap +/cmp2lcu.v for decomposing arithmetic compares to $lcu
authorEddie Hung <eddie@fpgeh.com>
Fri, 17 Jan 2020 18:51:27 +0000 (10:51 -0800)
committerEddie Hung <eddie@fpgeh.com>
Fri, 3 Apr 2020 21:28:22 +0000 (14:28 -0700)
techlibs/common/Makefile.inc
techlibs/common/cmp2lcu.v [new file with mode: 0644]
tests/techmap/cmp2lcu.ys [new file with mode: 0644]

index d5e69a241ed0a1ad5d051cc72c0053e1c523182c..7b1e4b43053db231fceec463caeb95e201232e5c 100644 (file)
@@ -30,3 +30,4 @@ $(eval $(call add_share_file,share,techlibs/common/cmp2lut.v))
 $(eval $(call add_share_file,share,techlibs/common/cells.lib))
 $(eval $(call add_share_file,share,techlibs/common/mul2dsp.v))
 $(eval $(call add_share_file,share,techlibs/common/abc9_model.v))
+$(eval $(call add_share_file,share,techlibs/common/cmp2lcu.v))
diff --git a/techlibs/common/cmp2lcu.v b/techlibs/common/cmp2lcu.v
new file mode 100644 (file)
index 0000000..433f88f
--- /dev/null
@@ -0,0 +1,83 @@
+// This pass performs an optimisation that decomposes wide arithmetic
+//   comparisons into LUT-size chunks (as guided by the `LUT_WIDTH
+//   macro) connected to a single lookahead-carry-unit $lcu cell,
+//   which is typically mapped to dedicated (and fast) FPGA
+//   carry-chains.
+(* techmap_celltype = "$lt $le $gt $ge" *)
+module _90_lcu_cmp_ (A, B, Y);
+
+parameter A_SIGNED = 0;
+parameter B_SIGNED = 0;
+parameter A_WIDTH = 0;
+parameter B_WIDTH = 0;
+parameter Y_WIDTH = 0;
+
+input [A_WIDTH-1:0] A;
+input [B_WIDTH-1:0] B;
+output [Y_WIDTH-1:0] Y;
+
+parameter _TECHMAP_CELLTYPE_ = "";
+localparam gt_width = `LUT_WIDTH/2;
+
+generate
+    if (_TECHMAP_CELLTYPE_ == "" || (A_WIDTH <= gt_width || B_WIDTH <= gt_width))
+        wire _TECHMAP_FAIL_ = 1;
+    else if (_TECHMAP_CELLTYPE_ == "$lt") begin
+        // Transform $lt into $gt by swapping A and B
+               $gt #(.A_SIGNED(B_SIGNED), .B_SIGNED(A_SIGNED), .A_WIDTH(B_WIDTH), .B_WIDTH(A_WIDTH), .Y_WIDTH(Y_WIDTH)) _TECHMAP_REPLACE_ (.A(B), .B(A), .Y(Y));
+    end
+    else if (_TECHMAP_CELLTYPE_ == "$le") begin
+        // Transform $le into $ge by swapping A and B
+               $ge #(.A_SIGNED(B_SIGNED), .B_SIGNED(A_SIGNED), .A_WIDTH(B_WIDTH), .B_WIDTH(A_WIDTH), .Y_WIDTH(Y_WIDTH)) _TECHMAP_REPLACE_ (.A(B), .B(A), .Y(Y));
+    end
+    else begin
+        // Perform sign extension on A and B
+        localparam WIDTH = A_WIDTH > B_WIDTH ? A_WIDTH : B_WIDTH;
+        wire [WIDTH-1:0] AA = {{(WIDTH-A_WIDTH){A_SIGNED ? A[A_WIDTH-1] : 1'b0}}, A};
+        wire [WIDTH-1:0] BB = {{(WIDTH-B_WIDTH){B_SIGNED ? B[B_WIDTH-1] : 1'b0}}, B};
+
+        // Compute width of $lcu/carry-chain cell
+        localparam lcu_width = (WIDTH+gt_width-1)/gt_width;
+        wire [lcu_width-1:0] P, G, CO;
+        genvar i, j;
+        integer j;
+        for (i = 0; i < WIDTH; i=i+gt_width) begin
+            wire [gt_width-1:0] PP, GG;
+            if (i < WIDTH-gt_width) begin
+                // Bit-wise equality (xnor) of sign-extended A and B
+                assign PP = AA[i +: gt_width] ^~ BB[i +: gt_width];
+                // Priority "encoder" that checks A[i] == 1'b1 && B[i] == 1'b0
+                //   from MSB down, deferring to less significant bits if the
+                //   MSBs are equal
+                assign GG[gt_width-1] = AA[i+gt_width-1] & ~BB[i+gt_width-1];
+                for (j = gt_width-2; j >= 0; j=j-1)
+                    assign GG[j] = &PP[gt_width-1:j+1] & (AA[i+j] & ~BB[i+j]);
+                // Propagate only if all bits are equal
+                //   (inconclusive evidence to say A >= B)
+                assign P[i/gt_width] = &PP;
+                // Generate if any pairs call for it
+                assign G[i/gt_width] = |GG;
+            end
+            else begin
+                assign PP = AA[WIDTH-1:i] ^~ BB[WIDTH-1:i];
+                if (A_SIGNED && B_SIGNED)
+                    assign GG[WIDTH-i-1] = ~AA[WIDTH-1] & BB[WIDTH-1];
+                else
+                    assign GG[WIDTH-i-1] = AA[WIDTH-1] & ~BB[WIDTH-1];
+                for (j = WIDTH-i-2; j >= 0; j=j-1)
+                    assign GG[j] = &PP[WIDTH-i-1:j+1] & (AA[i+j] & ~BB[i+j]);
+                assign P[i/gt_width] = &PP[WIDTH-i-1:0];
+                assign G[i/gt_width] = |GG[WIDTH-i-1:0];
+            end
+        end
+        // For $ge operation, start with the assumption that A and B are
+        //   equal (propagating this equality if A and B turn out to be so)
+        if (_TECHMAP_CELLTYPE_ == "$ge")
+            wire CI = 1'b1;
+        else
+            wire CI = 1'b0;
+        $lcu #(.WIDTH(lcu_width)) lcu (.P(P), .G(G), .CI(CI), .CO(CO));
+        assign Y = CO[lcu_width-1];
+    end
+endgenerate
+endmodule
diff --git a/tests/techmap/cmp2lcu.ys b/tests/techmap/cmp2lcu.ys
new file mode 100644 (file)
index 0000000..e7a422e
--- /dev/null
@@ -0,0 +1,24 @@
+read_verilog <<EOT
+module top(input [11:0] a, b, output gtu, gts, ltu, lts, geu, ges, leu, les);
+assign gtu = a > b;
+assign gts = $signed(a) > $signed(b);
+assign ltu = a < b;
+assign lts = $signed(a) < $signed(b);
+assign geu = a >= b;
+assign ges = $signed(a) >= $signed(b);
+assign leu = a <= b;
+assign les = $signed(a) <= $signed(b);
+endmodule
+EOT
+proc
+
+equiv_opt -assert techmap -map +/cmp2lcu.v -D LUT_WIDTH=6
+design -load postopt
+select -assert-count 8 t:$lcu
+select -assert-none t:$gt t:$ge t:$lt t:$le
+
+design -load preopt
+equiv_opt -assert techmap -map +/cmp2lcu.v -D LUT_WIDTH=4
+design -load postopt
+select -assert-count 8 t:$lcu
+select -assert-none t:$gt t:$ge t:$lt t:$le