yosys/passes/pmgen/microchip_dsp_cascade.pmg

236 lines
7.3 KiB
Plaintext
Raw Permalink Normal View History

2024-07-02 14:44:30 -05:00
// ISC License
//
// Copyright (C) 2024 Microchip Technology Inc. and its subsidiaries
//
// Permission to use, copy, modify, and/or distribute this software for any
// purpose with or without fee is hereby granted, provided that the above
// copyright notice and this permission notice appear in all copies.
//
// THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
// WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
// MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
// ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
// WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
// ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
// OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
// This file describes the third of three pattern matcher setups that
2024-07-04 10:53:41 -05:00
// forms the `microchip_dsp` pass described in microchip_dsp.cc
2024-07-02 14:44:30 -05:00
// At a high level, it works as follows:
// (1) Starting from a DSP cell that
// (a) CDIN_FDBK_SEL is set to default "00"
// (b) doesn't already use the 'PCOUT' port
// (2) Match another DSP cell that
// (a) does not have the CREG enabled,
// (b) 'C' port is driven by the 'P' output of the previous DSP cell
// (c) has its 'PCIN' port unused
// (3) Recursively go to (2) until no more matches possible, keeping track
// of the longest possible chain found
// (4) The longest chain is then divided into chunks of no more than
// MAX_DSP_CASCADE in length (to prevent long cascades that exceed the
// height of a DSP column) with each DSP in each chunk being rewritten
// to use [ABP]COUT -> [ABP]CIN cascading as appropriate
2024-07-04 10:53:41 -05:00
pattern microchip_dsp_cascade
2024-07-02 14:44:30 -05:00
udata <std::function<SigSpec(const SigSpec&)>> unextend
udata <vector<std::tuple<Cell*,int>>> chain longest_chain
udata <std::set<Cell*>> visited
state <Cell*> next
state <SigSpec> clock
// Variables used for subpatterns
state <SigSpec> argQ argD
state <int> ffoffset
udata <SigSpec> dffD dffQ
udata <SigBit> dffclock
udata <Cell*> dff
// Maximum of 24 cascaded blocks
code
#define MAX_DSP_CASCADE 24
endcode
// NOTE: Chain vector
// +--------+ +--------+
// | first |----> | next | ----> ...
// +--------+ +--------+
// first.COUT cascades to next.CIN, so on and so forth
// Helper function to remove unused bits
code
2024-07-02 15:47:18 -05:00
unextend = [](const SigSpec &sig) {
int i;
for (i = GetSize(sig)-1; i > 0; i--)
if (sig[i] != sig[i-1])
break;
// Do not remove non-const sign bit
if (sig[i].wire)
++i;
return sig.extract(0, i);
};
2024-07-02 14:44:30 -05:00
endcode
// (1) Starting from a DSP cell that
// (a) CDIN_FDBK_SEL is set to default "00"
// (b) doesn't already use the 'PCOUT' port
match first
select first->type.in(\MACC_PA) && port(first, \CDIN_FDBK_SEL, Const(0, 2)) == Const::from_string("00")
select nusers(port(first, \CDOUT, SigSpec())) <= 1
endmatch
// (4) The longest chain is then divided into chunks of no more than
// MAX_DSP_CASCADE in length (to prevent long cascades that exceed the
// height of a DSP column) with each DSP in each chunk being rewritten
// to use [ABP]COUT -> [ABP]CIN cascading as appropriate
code
2024-07-02 15:47:18 -05:00
visited.clear();
visited.insert(first);
2024-07-02 14:44:30 -05:00
longest_chain.clear();
chain.emplace_back(first, -1);
subpattern(tail);
finally
2024-07-02 15:47:18 -05:00
// longest cascade chain has been found with DSP "first" being the head of the chain
// do some post processing
2024-07-02 14:44:30 -05:00
chain.pop_back();
2024-07-02 15:47:18 -05:00
visited.clear();
2024-07-02 14:44:30 -05:00
log_assert(chain.empty());
if (GetSize(longest_chain) > 1) {
Cell *dsp = std::get<0>(longest_chain.front());
Cell *dsp_pcin;
2024-07-02 15:47:18 -05:00
int SHIFT = -1;
2024-07-02 14:44:30 -05:00
for (int i = 1; i < GetSize(longest_chain); i++) {
2024-07-02 15:47:18 -05:00
log_assert(dsp->type.in(\MACC_PA));
2024-07-02 14:44:30 -05:00
2024-07-02 15:47:18 -05:00
std::tie(dsp_pcin,SHIFT) = longest_chain[i];
2024-07-02 14:44:30 -05:00
2024-07-02 15:47:18 -05:00
// Chain length exceeds the maximum cascade length, must split it up
2024-07-02 14:44:30 -05:00
if (i % MAX_DSP_CASCADE > 0) {
2024-07-02 15:47:18 -05:00
Wire *cascade = module->addWire(NEW_ID, 48);
2024-07-02 14:44:30 -05:00
2024-07-02 15:47:18 -05:00
// zero port C and move wire to cascade
dsp_pcin->setPort(ID(C), Const(0, 48));
dsp_pcin->setPort(ID(CDIN), cascade);
dsp->setPort(ID(CDOUT), cascade);
2024-07-02 14:44:30 -05:00
2024-07-02 15:47:18 -05:00
// Configure wire to cascade the dsps
add_siguser(cascade, dsp_pcin);
add_siguser(cascade, dsp);
2024-07-02 14:44:30 -05:00
2024-07-02 15:47:18 -05:00
// configure mux to use cascade for signal E
SigSpec cdin_fdbk_sel = port(dsp_pcin, \CDIN_FDBK_SEL, Const(0, 2));
cdin_fdbk_sel[1] = State::S1;
dsp_pcin->setPort(\CDIN_FDBK_SEL, cdin_fdbk_sel);
2024-07-02 14:44:30 -05:00
2024-07-02 15:47:18 -05:00
// check if shifting is required for wide multiplier implmentation
if (SHIFT == 17)
{
dsp_pcin->setPort(\ARSHFT17, State::S1);
}
2024-07-02 14:44:30 -05:00
2024-07-02 15:47:18 -05:00
log_debug("PCOUT -> PCIN cascade for %s -> %s\n", log_id(dsp), log_id(dsp_pcin));
2024-07-02 14:44:30 -05:00
} else {
log_debug(" Blocking %s -> %s cascade (exceeds max: %d)\n", log_id(dsp), log_id(dsp_pcin), MAX_DSP_CASCADE);
}
dsp = dsp_pcin;
}
accept;
}
endcode
// ------------------------------------------------------------------
subpattern tail
arg first
arg next
// (2) Match another DSP cell that
// (a) does not have the CREG enabled,
// (b) 'C' port is driven by the 'P' output of the previous DSP cell
// (c) has its 'PCIN' port unused
match nextP
2024-07-02 15:47:18 -05:00
// find candidates where nextP.C port is driven (maybe partially) by chain's tail DSP.P port
// and with no registers in between (since cascade path cannot be pipelined)
2024-07-02 14:44:30 -05:00
2024-07-02 15:47:18 -05:00
// reg C must not be used
select port(nextP, \C_BYPASS, SigSpec()).is_fully_ones()
2024-07-02 14:44:30 -05:00
2024-07-02 15:47:18 -05:00
// must be same DSP type
select nextP->type.in(\MACC_PA)
2024-07-02 14:44:30 -05:00
2024-07-02 15:47:18 -05:00
// port C should be driven by something
2024-07-02 14:44:30 -05:00
select nusers(port(nextP, \C, SigSpec())) > 1
2024-07-02 15:47:18 -05:00
// CIN must be unused
2024-07-02 14:44:30 -05:00
select nusers(port(nextP, \PCIN, SigSpec())) == 0
2024-07-02 15:47:18 -05:00
// should not have internal feedback connection
select port(nextP, \CDIN_FDBK_SEL, SigSpec()).is_fully_zero()
2024-07-02 14:44:30 -05:00
2024-07-02 15:47:18 -05:00
// SHIFT should be unused
select port(nextP, \ARSHFT17_BYPASS).is_fully_ones()
select port(nextP, \ARSHFT17).is_fully_zero()
select nusers(port(nextP, \ARSHFT17, SigSpec())) == 0
// current DSP cell can be cascaded with the back of the cascade chain
2024-07-02 14:44:30 -05:00
// index <SigBit> port(nextP, \C)[0] === port(std::get<0>(chain.back()), \P)[0] || port(nextP, \C)[0] === port(std::get<0>(chain.back()), \P)[17]
2024-07-02 15:47:18 -05:00
filter port(nextP, \C)[0] == port(std::get<0>(chain.back()), \P)[0] || port(nextP, \C)[0] == port(std::get<0>(chain.back()), \P)[17]
2024-07-02 14:44:30 -05:00
// semioptional
2024-07-02 15:47:18 -05:00
optional
2024-07-02 14:44:30 -05:00
endmatch
code next
next = nextP;
2024-07-02 15:47:18 -05:00
// keep DSP type consistent in the chain
// currently since we only have one type anyways, this line is always false
2024-07-02 14:44:30 -05:00
if (next && next->type != first->type) reject;
2024-07-02 15:47:18 -05:00
// break infinite recursion when there's a combinational loop
if (visited.count(next) > 0) reject;
2024-07-02 14:44:30 -05:00
endcode
// (3) Recursively go to (2) until no more matches possible, recording the
// longest possible chain
code
if (next) {
2024-07-02 15:47:18 -05:00
SigSpec driver_sigP = port(std::get<0>(chain.back()), \P);
int shift = 0;
if (port(next, \C)[0] == port(std::get<0>(chain.back()), \P)[17]) shift = 17;
2024-07-02 14:44:30 -05:00
chain.emplace_back(next, shift);
2024-07-02 15:47:18 -05:00
visited.insert(next);
2024-07-02 14:44:30 -05:00
SigSpec sigC = unextend(port(next, \C));
2024-07-02 15:47:18 -05:00
// Make sure driverDSP.P === DSP.C
if (GetSize(sigC) + shift <= GetSize(driver_sigP) && driver_sigP.extract(shift, GetSize(sigC)) == sigC)
{
subpattern(tail);
}
2024-07-02 14:44:30 -05:00
} else {
if (GetSize(chain) > GetSize(longest_chain))
longest_chain = chain;
}
finally
if (next)
2024-07-02 15:47:18 -05:00
{
visited.erase(next);
chain.pop_back();
}
2024-07-02 14:44:30 -05:00
endcode