From 3cd5f4ed83413cf4df695217ff85e3190ae4a8c7 Mon Sep 17 00:00:00 2001 From: Emily Schmidt Date: Wed, 17 Jul 2024 16:33:34 +0100 Subject: [PATCH] add support for RTLIL cells with multiple outputs to the functional backend, implement $fa,$lcu,$alu --- kernel/functionalir.cc | 123 ++++++++++++++++++++++------ tests/functional/rtlil_cells.py | 21 ++++- tests/functional/test_functional.py | 8 +- 3 files changed, 118 insertions(+), 34 deletions(-) diff --git a/kernel/functionalir.cc b/kernel/functionalir.cc index 4b2ad8c0b..e768be400 100644 --- a/kernel/functionalir.cc +++ b/kernel/functionalir.cc @@ -18,6 +18,7 @@ */ #include "kernel/functionalir.h" +#include YOSYS_NAMESPACE_BEGIN @@ -172,8 +173,38 @@ private: y = factory.mux(y, factory.slice(b, a.width() * i, a.width()), factory.slice(s, i, 1)); return y; } + dict handle_fa(Node a, Node b, Node c) { + Node t1 = factory.bitwise_xor(a, b); + Node t2 = factory.bitwise_and(a, b); + Node t3 = factory.bitwise_and(c, t1); + Node y = factory.bitwise_xor(c, t1); + Node x = factory.bitwise_or(t2, t3); + return {{ID(X), x}, {ID(Y), y}}; + } + Node handle_lcu(Node p, Node g, Node ci) { + Node rv = factory.bitwise_or(factory.slice(g, 0, 1), factory.bitwise_and(factory.slice(p, 0, 1), ci)); + Node c = rv; + for(int i = 1; i < p.width(); i++) { + c = factory.bitwise_or(factory.slice(g, i, 1), factory.bitwise_and(factory.slice(p, i, 1), c)); + rv = factory.concat(rv, c); + } + return rv; + } + dict handle_alu(Node a_in, Node b_in, int y_width, bool is_signed, Node ci, Node bi) { + Node a = factory.extend(a_in, y_width, is_signed); + Node b_uninverted = factory.extend(b_in, y_width, is_signed); + Node b = factory.mux(b_uninverted, factory.bitwise_not(b_uninverted), bi); + Node x = factory.bitwise_xor(a, b); + Node a_extra = factory.extend(a, y_width + 1, false); + Node b_extra = factory.extend(b, y_width + 1, false); + Node y_extra = factory.add(factory.add(a_extra, b_extra), factory.extend(ci, a.width() + 1, false)); + Node y = factory.slice(y_extra, 0, y_width); + Node carries = factory.bitwise_xor(y_extra, factory.bitwise_xor(a_extra, b_extra)); + Node co = factory.slice(carries, 1, y_width); + return {{ID(X), x}, {ID(Y), y}, {ID(CO), co}}; + } public: - Node handle(IdString cellType, dict parameters, dict inputs) + std::variant, Node> handle(IdString cellType, dict parameters, dict inputs) { int a_width = parameters.at(ID(A_WIDTH), Const(-1)).as_int(); int b_width = parameters.at(ID(B_WIDTH), Const(-1)).as_int(); @@ -360,17 +391,23 @@ public: Node s = factory.extend(inputs.at(ID(S)), b_width, false); Node b = factory.mul(s, factory.constant(Const(width, b_width))); return factory.logical_shift_left(a, b); + } else if(cellType == ID($fa)) { + return handle_fa(inputs.at(ID(A)), inputs.at(ID(B)), inputs.at(ID(C))); + } else if(cellType == ID($lcu)) { + return handle_lcu(inputs.at(ID(P)), inputs.at(ID(G)), inputs.at(ID(CI))); + } else if(cellType == ID($alu)) { + return handle_alu(inputs.at(ID(A)), inputs.at(ID(B)), y_width, a_signed && b_signed, inputs.at(ID(CI)), inputs.at(ID(BI))); } else { - log_error("unhandled cell in CellSimplifier %s\n", cellType.c_str()); + log_error("`%s' cells are not supported by the functional backend\n", cellType.c_str()); } } }; class FunctionalIRConstruction { using Node = FunctionalIR::Node; - std::deque queue; + std::deque> queue; dict graph_nodes; - idict cells; + dict, Node> cell_outputs; DriverMap driver_map; FunctionalIR::Factory& factory; CellSimplifier simplifier; @@ -388,6 +425,24 @@ class FunctionalIRConstruction { }else return it->second; } + Node enqueue_cell(Cell *cell, IdString port_name) + { + auto it = cell_outputs.find({cell, port_name}); + if(it == cell_outputs.end()) { + queue.emplace_back(cell); + std::optional rv; + for(auto const &[name, sigspec] : cell->connections()) + if(driver_map.celltypes.cell_output(cell->type, name)) { + auto node = factory.create_pending(sigspec.size()); + factory.suggest_name(node, cell->name.str() + "$" + name.str()); + cell_outputs.emplace({cell, name}, node); + if(name == port_name) + rv = node; + } + return *rv; + } else + return it->second; + } public: FunctionalIRConstruction(FunctionalIR::Factory &f) : factory(f), simplifier(f) {} void add_module(Module *module) @@ -395,7 +450,7 @@ public: driver_map.add(module); for (auto cell : module->cells()) { if (cell->type.in(ID($assert), ID($assume), ID($cover), ID($check))) - enqueue(DriveBitMarker(cells(cell), 0)); + queue.emplace_back(cell); } for (auto wire : module->wires()) { if (wire->port_output) { @@ -441,10 +496,44 @@ public: factory.declare_state_memory(node, mem->cell->name, addr_width, data_width); return concatenate_read_results(mem, read_results); } + void process_cell(Cell *cell) + { + if (cell->is_mem_cell()) { + Mem *mem = memories.at(cell, nullptr); + log_assert(mem != nullptr); + Node node = handle_memory(mem); + factory.update_pending(cell_outputs.at({cell, ID(RD_DATA)}), node); + } else { + dict connections; + IdString output_name; // for the single output case + int n_outputs = 0; + for(auto const &[name, sigspec] : cell->connections()) { + if(driver_map.celltypes.cell_input(cell->type, name)) + connections.insert({ name, enqueue(DriveChunkPort(cell, {name, sigspec})) }); + if(driver_map.celltypes.cell_output(cell->type, name)) { + output_name = name; + n_outputs++; + } + } + std::variant, Node> outputs = simplifier.handle(cell->type, cell->parameters, connections); + if(auto *nodep = std::get_if(&outputs); nodep != nullptr) { + log_assert(n_outputs == 1); + factory.update_pending(cell_outputs.at({cell, output_name}), *nodep); + } else { + for(auto [name, node] : std::get>(outputs)) + factory.update_pending(cell_outputs.at({cell, name}), node); + } + } + } void process_queue() { for (; !queue.empty(); queue.pop_front()) { - DriveSpec spec = queue.front(); + if(auto p = std::get_if(&queue.front()); p != nullptr) { + process_cell(*p); + continue; + } + + DriveSpec spec = std::get(queue.front()); Node pending = graph_nodes.at(spec); if (spec.chunks().size() > 1) { @@ -492,11 +581,7 @@ public: } else { - Node cell = enqueue(DriveChunkMarker(cells(port_chunk.cell), 0, port_chunk.width)); - factory.suggest_name(cell, port_chunk.cell->name); - //Node node = factory.cell_output(cell, port_chunk.cell->type, port_chunk.port, port_chunk.width); - Node node = cell; - factory.suggest_name(node, port_chunk.cell->name.str() + "$" + port_chunk.port.str()); + Node node = enqueue_cell(port_chunk.cell, port_chunk.port); factory.update_pending(pending, node); } } else { @@ -518,22 +603,6 @@ public: args.push_back(enqueue(driver)); Node node = factory.multiple(args, chunk.size()); factory.update_pending(pending, node); - } else if (chunk.is_marker()) { - Cell *cell = cells[chunk.marker().marker]; - if (cell->is_mem_cell()) { - Mem *mem = memories.at(cell, nullptr); - log_assert(mem != nullptr); - Node node = handle_memory(mem); - factory.update_pending(pending, node); - } else { - dict connections; - for(auto const &conn : cell->connections()) { - if(driver_map.celltypes.cell_input(cell->type, conn.first)) - connections.insert({ conn.first, enqueue(DriveChunkPort(cell, conn)) }); - } - Node node = simplifier.handle(cell->type, cell->parameters, connections); - factory.update_pending(pending, node); - } } else if (chunk.is_none()) { Node node = factory.undriven(chunk.size()); factory.update_pending(pending, node); diff --git a/tests/functional/rtlil_cells.py b/tests/functional/rtlil_cells.py index 7858e3781..4dbea6015 100644 --- a/tests/functional/rtlil_cells.py +++ b/tests/functional/rtlil_cells.py @@ -123,6 +123,21 @@ class SliceCell(BaseCell): def __init__(self, name, values): super().__init__(name, ['A_WIDTH', 'OFFSET', 'Y_WIDTH'], {'A': 'A_WIDTH'}, {'Y': 'Y_WIDTH'}, values) +class FACell(BaseCell): + def __init__(self, name, values): + super().__init__(name, ['WIDTH'], {'A': 'WIDTH', 'B': 'WIDTH', 'C': 'WIDTH'}, {'X': 'WIDTH', 'Y': 'WIDTH'}, values) + self.sim_preprocessing = "techmap" # because FA is not implemented in yosys sim + +class LCUCell(BaseCell): + def __init__(self, name, values): + super().__init__(name, ['WIDTH'], {'P': 'WIDTH', 'G': 'WIDTH', 'CI': 1}, {'CO': 'WIDTH'}, values) + self.sim_preprocessing = "techmap" # because LCU is not implemented in yosys sim + +class ALUCell(BaseCell): + def __init__(self, name, values): + super().__init__(name, ['A_WIDTH', 'B_WIDTH', 'Y_WIDTH', 'A_SIGNED', 'B_SIGNED'], {'A': 'A_WIDTH', 'B': 'B_WIDTH', 'CI': 1, 'BI': 1}, {'X': 'Y_WIDTH', 'Y': 'Y_WIDTH', 'CO': 'Y_WIDTH'}, values) + self.sim_preprocessing = "techmap" # because ALU is not implemented in yosys sim + class FailCell(BaseCell): def __init__(self, name): super().__init__(name, [], {}, {}) @@ -231,9 +246,9 @@ rtlil_cells = [ ShiftCell("sshr", shift_widths), ShiftCell("shift", shift_widths), ShiftCell("shiftx", shift_widths), -# ("fa", ["A", "B", "C", "X", "Y"]), -# ("lcu", ["P", "G", "CI", "CO"]), -# ("alu", ["A", "B", "CI", "BI", "X", "Y", "CO"]), + FACell("fa", [8, 20]), + LCUCell("lcu", [1, 10]), + ALUCell("alu", binary_widths), BinaryCell("lt", binary_widths), BinaryCell("le", binary_widths), BinaryCell("eq", binary_widths), diff --git a/tests/functional/test_functional.py b/tests/functional/test_functional.py index 86e515d90..150642a00 100644 --- a/tests/functional/test_functional.py +++ b/tests/functional/test_functional.py @@ -27,9 +27,9 @@ def yosys_synth(verilog_file, rtlil_file): yosys(f"read_verilog {quote(verilog_file)} ; prep ; clk2fflogic ; write_rtlil {quote(rtlil_file)}") # simulate an rtlil file with yosys, comparing with a given vcd file, and writing out the yosys simulation results into a second vcd file -def yosys_sim(rtlil_file, vcd_reference_file, vcd_out_file): +def yosys_sim(rtlil_file, vcd_reference_file, vcd_out_file, preprocessing = ""): try: - yosys(f"read_rtlil {quote(rtlil_file)}; sim -r {quote(vcd_reference_file)} -scope gold -vcd {quote(vcd_out_file)} -timescale 1us -sim-gold") + yosys(f"read_rtlil {quote(rtlil_file)}; {preprocessing}; sim -r {quote(vcd_reference_file)} -scope gold -vcd {quote(vcd_out_file)} -timescale 1us -sim-gold") except: # if yosys sim fails it's probably because of a simulation mismatch # since yosys sim aborts on simulation mismatch to generate vcd output @@ -53,7 +53,7 @@ def test_cxx(cell, parameters, tmp_path, num_steps, rnd): compile_cpp(vcdharness_cc_file, vcdharness_exe_file, ['-I', tmp_path, '-I', str(base_path / 'backends/functional/cxx_runtime')]) seed = str(rnd(cell.name + "-cxx").getrandbits(32)) run([str(vcdharness_exe_file.resolve()), str(vcd_functional_file), str(num_steps), str(seed)]) - yosys_sim(rtlil_file, vcd_functional_file, vcd_yosys_sim_file) + yosys_sim(rtlil_file, vcd_functional_file, vcd_yosys_sim_file, getattr(cell, 'sim_preprocessing', '')) def test_smt(cell, parameters, tmp_path, num_steps, rnd): import smt_vcd @@ -67,4 +67,4 @@ def test_smt(cell, parameters, tmp_path, num_steps, rnd): yosys(f"read_rtlil {quote(rtlil_file)} ; write_functional_smt2 {quote(smt_file)}") run(['z3', smt_file]) # check if output is valid smtlib before continuing smt_vcd.simulate_smt(smt_file, vcd_functional_file, num_steps, rnd(cell.name + "-smt")) - yosys_sim(rtlil_file, vcd_functional_file, vcd_yosys_sim_file) \ No newline at end of file + yosys_sim(rtlil_file, vcd_functional_file, vcd_yosys_sim_file, getattr(cell, 'sim_preprocessing', '')) \ No newline at end of file