techmap +/cmp2lcu.v for decomposing arithmetic compares to $lcu

This commit is contained in:
Eddie Hung 2020-01-17 10:51:27 -08:00
parent fffe42d4c1
commit 9b63700678
3 changed files with 108 additions and 0 deletions

View File

@ -30,3 +30,4 @@ $(eval $(call add_share_file,share,techlibs/common/cmp2lut.v))
$(eval $(call add_share_file,share,techlibs/common/cells.lib)) $(eval $(call add_share_file,share,techlibs/common/cells.lib))
$(eval $(call add_share_file,share,techlibs/common/mul2dsp.v)) $(eval $(call add_share_file,share,techlibs/common/mul2dsp.v))
$(eval $(call add_share_file,share,techlibs/common/abc9_model.v)) $(eval $(call add_share_file,share,techlibs/common/abc9_model.v))
$(eval $(call add_share_file,share,techlibs/common/cmp2lcu.v))

83
techlibs/common/cmp2lcu.v Normal file
View File

@ -0,0 +1,83 @@
// This pass performs an optimisation that decomposes wide arithmetic
// comparisons into LUT-size chunks (as guided by the `LUT_WIDTH
// macro) connected to a single lookahead-carry-unit $lcu cell,
// which is typically mapped to dedicated (and fast) FPGA
// carry-chains.
(* techmap_celltype = "$lt $le $gt $ge" *)
module _90_lcu_cmp_ (A, B, Y);
parameter A_SIGNED = 0;
parameter B_SIGNED = 0;
parameter A_WIDTH = 0;
parameter B_WIDTH = 0;
parameter Y_WIDTH = 0;
input [A_WIDTH-1:0] A;
input [B_WIDTH-1:0] B;
output [Y_WIDTH-1:0] Y;
parameter _TECHMAP_CELLTYPE_ = "";
localparam gt_width = `LUT_WIDTH/2;
generate
if (_TECHMAP_CELLTYPE_ == "" || (A_WIDTH <= gt_width || B_WIDTH <= gt_width))
wire _TECHMAP_FAIL_ = 1;
else if (_TECHMAP_CELLTYPE_ == "$lt") begin
// Transform $lt into $gt by swapping A and B
$gt #(.A_SIGNED(B_SIGNED), .B_SIGNED(A_SIGNED), .A_WIDTH(B_WIDTH), .B_WIDTH(A_WIDTH), .Y_WIDTH(Y_WIDTH)) _TECHMAP_REPLACE_ (.A(B), .B(A), .Y(Y));
end
else if (_TECHMAP_CELLTYPE_ == "$le") begin
// Transform $le into $ge by swapping A and B
$ge #(.A_SIGNED(B_SIGNED), .B_SIGNED(A_SIGNED), .A_WIDTH(B_WIDTH), .B_WIDTH(A_WIDTH), .Y_WIDTH(Y_WIDTH)) _TECHMAP_REPLACE_ (.A(B), .B(A), .Y(Y));
end
else begin
// Perform sign extension on A and B
localparam WIDTH = A_WIDTH > B_WIDTH ? A_WIDTH : B_WIDTH;
wire [WIDTH-1:0] AA = {{(WIDTH-A_WIDTH){A_SIGNED ? A[A_WIDTH-1] : 1'b0}}, A};
wire [WIDTH-1:0] BB = {{(WIDTH-B_WIDTH){B_SIGNED ? B[B_WIDTH-1] : 1'b0}}, B};
// Compute width of $lcu/carry-chain cell
localparam lcu_width = (WIDTH+gt_width-1)/gt_width;
wire [lcu_width-1:0] P, G, CO;
genvar i, j;
integer j;
for (i = 0; i < WIDTH; i=i+gt_width) begin
wire [gt_width-1:0] PP, GG;
if (i < WIDTH-gt_width) begin
// Bit-wise equality (xnor) of sign-extended A and B
assign PP = AA[i +: gt_width] ^~ BB[i +: gt_width];
// Priority "encoder" that checks A[i] == 1'b1 && B[i] == 1'b0
// from MSB down, deferring to less significant bits if the
// MSBs are equal
assign GG[gt_width-1] = AA[i+gt_width-1] & ~BB[i+gt_width-1];
for (j = gt_width-2; j >= 0; j=j-1)
assign GG[j] = &PP[gt_width-1:j+1] & (AA[i+j] & ~BB[i+j]);
// Propagate only if all bits are equal
// (inconclusive evidence to say A >= B)
assign P[i/gt_width] = &PP;
// Generate if any pairs call for it
assign G[i/gt_width] = |GG;
end
else begin
assign PP = AA[WIDTH-1:i] ^~ BB[WIDTH-1:i];
if (A_SIGNED && B_SIGNED)
assign GG[WIDTH-i-1] = ~AA[WIDTH-1] & BB[WIDTH-1];
else
assign GG[WIDTH-i-1] = AA[WIDTH-1] & ~BB[WIDTH-1];
for (j = WIDTH-i-2; j >= 0; j=j-1)
assign GG[j] = &PP[WIDTH-i-1:j+1] & (AA[i+j] & ~BB[i+j]);
assign P[i/gt_width] = &PP[WIDTH-i-1:0];
assign G[i/gt_width] = |GG[WIDTH-i-1:0];
end
end
// For $ge operation, start with the assumption that A and B are
// equal (propagating this equality if A and B turn out to be so)
if (_TECHMAP_CELLTYPE_ == "$ge")
wire CI = 1'b1;
else
wire CI = 1'b0;
$lcu #(.WIDTH(lcu_width)) lcu (.P(P), .G(G), .CI(CI), .CO(CO));
assign Y = CO[lcu_width-1];
end
endgenerate
endmodule

24
tests/techmap/cmp2lcu.ys Normal file
View File

@ -0,0 +1,24 @@
read_verilog <<EOT
module top(input [11:0] a, b, output gtu, gts, ltu, lts, geu, ges, leu, les);
assign gtu = a > b;
assign gts = $signed(a) > $signed(b);
assign ltu = a < b;
assign lts = $signed(a) < $signed(b);
assign geu = a >= b;
assign ges = $signed(a) >= $signed(b);
assign leu = a <= b;
assign les = $signed(a) <= $signed(b);
endmodule
EOT
proc
equiv_opt -assert techmap -map +/cmp2lcu.v -D LUT_WIDTH=6
design -load postopt
select -assert-count 8 t:$lcu
select -assert-none t:$gt t:$ge t:$lt t:$le
design -load preopt
equiv_opt -assert techmap -map +/cmp2lcu.v -D LUT_WIDTH=4
design -load postopt
select -assert-count 8 t:$lcu
select -assert-none t:$gt t:$ge t:$lt t:$le