mirror of https://github.com/YosysHQ/yosys.git
85 lines
2.1 KiB
Verilog
85 lines
2.1 KiB
Verilog
// Signed 40-bit streaming accumulator with 16-bit inputs
|
|
// File: HDL_Coding_Techniques/multipliers/multipliers4.v
|
|
//
|
|
// Source:
|
|
// https://www.xilinx.com/support/documentation/sw_manuals/xilinx2014_2/ug901-vivado-synthesis.pdf p.90
|
|
//
|
|
module macc # (parameter SIZEIN = 16, SIZEOUT = 40) (
|
|
input clk, ce, sload,
|
|
input signed [SIZEIN-1:0] a, b,
|
|
output signed [SIZEOUT-1:0] accum_out
|
|
);
|
|
// Declare registers for intermediate values
|
|
reg signed [SIZEIN-1:0] a_reg = 0, b_reg = 0;
|
|
reg sload_reg = 0;
|
|
reg signed [2*SIZEIN-1:0] mult_reg = 0;
|
|
reg signed [SIZEOUT-1:0] adder_out = 0, old_result;
|
|
always @* /*(adder_out or sload_reg)*/ begin // Modification necessary to fix sim/synth mismatch
|
|
if (sload_reg)
|
|
old_result <= 0;
|
|
else
|
|
// 'sload' is now active (=low) and opens the accumulation loop.
|
|
// The accumulator takes the next multiplier output in
|
|
// the same cycle.
|
|
old_result <= adder_out;
|
|
end
|
|
|
|
always @(posedge clk)
|
|
if (ce)
|
|
begin
|
|
a_reg <= a;
|
|
b_reg <= b;
|
|
mult_reg <= a_reg * b_reg;
|
|
sload_reg <= sload;
|
|
// Store accumulation result into a register
|
|
adder_out <= old_result + mult_reg;
|
|
end
|
|
|
|
// Output accumulation result
|
|
assign accum_out = adder_out;
|
|
|
|
endmodule
|
|
|
|
// Adapted variant of above
|
|
module macc2 # (parameter SIZEIN = 16, SIZEOUT = 40) (
|
|
input clk,
|
|
input ce,
|
|
input rst,
|
|
input signed [SIZEIN-1:0] a, b,
|
|
output signed [SIZEOUT-1:0] accum_out,
|
|
output overflow
|
|
);
|
|
// Declare registers for intermediate values
|
|
reg signed [SIZEIN-1:0] a_reg = 0, b_reg = 0, a_reg2 = 0, b_reg2 = 0;
|
|
reg signed [2*SIZEIN-1:0] mult_reg = 0;
|
|
reg signed [SIZEOUT:0] adder_out = 0;
|
|
reg overflow_reg = 0;
|
|
always @(posedge clk) begin
|
|
//if (ce)
|
|
begin
|
|
a_reg <= a;
|
|
b_reg <= b;
|
|
a_reg2 <= a_reg;
|
|
b_reg2 <= b_reg;
|
|
mult_reg <= a_reg2 * b_reg2;
|
|
// Store accumulation result into a register
|
|
adder_out <= adder_out + mult_reg;
|
|
overflow_reg <= overflow;
|
|
end
|
|
if (rst) begin
|
|
a_reg <= 0;
|
|
a_reg2 <= 0;
|
|
b_reg <= 0;
|
|
b_reg2 <= 0;
|
|
mult_reg <= 0;
|
|
adder_out <= 0;
|
|
overflow_reg <= 1'b0;
|
|
end
|
|
end
|
|
assign overflow = (adder_out >= 2**(SIZEOUT-1)) | overflow_reg;
|
|
|
|
// Output accumulation result
|
|
assign accum_out = overflow ? 2**(SIZEOUT-1)-1 : adder_out;
|
|
|
|
endmodule
|