3
0
Fork 0
mirror of https://github.com/YosysHQ/yosys synced 2025-04-06 01:24:10 +00:00

ql_dsp_macc: Tune DSP inference code

This commit is contained in:
Martin Povišer 2023-10-02 15:55:41 +02:00
parent 7d738b07da
commit e43810e13f
2 changed files with 172 additions and 212 deletions

View file

@ -29,235 +29,169 @@ PRIVATE_NAMESPACE_BEGIN
static void create_ql_macc_dsp(ql_dsp_macc_pm &pm) static void create_ql_macc_dsp(ql_dsp_macc_pm &pm)
{ {
auto &st = pm.st_ql_dsp_macc; auto &st = pm.st_ql_dsp_macc;
// Reject if multiplier drives anything else than either $add or $add and // Get port widths
// $mux size_t a_width = GetSize(st.mul->getPort(ID(A)));
if (st.mux == nullptr && st.mul_nusers > 2) { size_t b_width = GetSize(st.mul->getPort(ID(B)));
return; size_t z_width = GetSize(st.ff->getPort(ID(Q)));
}
// Determine whether the output is taken from before or after the ff size_t min_width = std::min(a_width, b_width);
bool out_ff; size_t max_width = std::max(a_width, b_width);
if (st.ff_d_nusers == 2 && st.ff_q_nusers == 3) {
out_ff = true;
} else if (st.ff_d_nusers == 3 && st.ff_q_nusers == 2) {
out_ff = false;
} else {
// Illegal, cannot take the two outputs simulataneously
return;
}
// No mux, the adder can driver either the ff or the ff + output // Signed / unsigned
if (st.mux == nullptr) { bool ab_signed = st.mul->getParam(ID(A_SIGNED)).as_bool();
if (out_ff && st.add_nusers != 2) { log_assert(ab_signed == st.mul->getParam(ID(B_SIGNED)).as_bool());
return;
}
if (!out_ff && st.add_nusers != 3) {
return;
}
}
// Mux present, the adder cannot drive anything else
else {
if (st.add_nusers != 2) {
return;
}
}
// Mux can driver either the ff or the ff + output // Determine DSP type or discard if too narrow / wide
if (st.mux != nullptr) { RTLIL::IdString type;
if (out_ff && st.mux_nusers != 2) { size_t tgt_a_width;
return; size_t tgt_b_width;
} size_t tgt_z_width;
if (!out_ff && st.mux_nusers != 3) {
return;
}
}
// Accept only posedge clocked FFs string cell_base_name = "dsp_t1";
if (st.ff->getParam(ID(CLK_POLARITY)).as_int() != 1) { string cell_size_name = "";
return; string cell_cfg_name = "";
} string cell_full_name = "";
// Get port widths if (min_width <= 2 && max_width <= 2 && z_width <= 4) {
size_t a_width = GetSize(st.mul->getPort(ID(A))); log_debug("\trejected: too narrow (%zd %zd %zd)\n", min_width, max_width, z_width);
size_t b_width = GetSize(st.mul->getPort(ID(B))); return;
size_t z_width = GetSize(st.ff->getPort(ID(Q))); } else if (min_width <= 9 && max_width <= 10 && z_width <= 19) {
cell_size_name = "_10x9x32";
tgt_a_width = 10;
tgt_b_width = 9;
tgt_z_width = 19;
} else if (min_width <= 18 && max_width <= 20 && z_width <= 38) {
cell_size_name = "_20x18x64";
tgt_a_width = 20;
tgt_b_width = 18;
tgt_z_width = 38;
} else {
log_debug("\trejected: too wide (%zd %zd %zd)\n", min_width, max_width, z_width);
return;
}
size_t min_width = std::min(a_width, b_width); type = RTLIL::escape_id(cell_base_name + cell_size_name + "_cfg_ports");
size_t max_width = std::max(a_width, b_width); log("Inferring MACC %zux%zu->%zu as %s from:\n", a_width, b_width, z_width, log_id(type));
// Signed / unsigned for (auto cell : {st.mul, st.add, st.mux, st.ff})
bool a_signed = st.mul->getParam(ID(A_SIGNED)).as_bool(); if (cell)
bool b_signed = st.mul->getParam(ID(B_SIGNED)).as_bool(); log(" %s (%s)\n", log_id(cell), log_id(cell->type));
// Determine DSP type or discard if too narrow / wide // Add the DSP cell
RTLIL::IdString type; RTLIL::Cell *cell = pm.module->addCell(NEW_ID, type);
size_t tgt_a_width;
size_t tgt_b_width;
size_t tgt_z_width;
string cell_base_name = "dsp_t1"; // Set attributes
string cell_size_name = ""; cell->set_bool_attribute(ID(is_inferred), true);
string cell_cfg_name = "";
string cell_full_name = "";
if (min_width <= 2 && max_width <= 2 && z_width <= 4) { // Get input/output data signals
// Too narrow RTLIL::SigSpec sig_a, sig_b, sig_z;
return; sig_a = st.mul->getPort(ID(A));
} else if (min_width <= 9 && max_width <= 10 && z_width <= 19) { sig_b = st.mul->getPort(ID(B));
cell_size_name = "_10x9x32"; sig_z = st.output_registered ? st.ff->getPort(ID(Q)) : st.ff->getPort(ID(D));
tgt_a_width = 10;
tgt_b_width = 9;
tgt_z_width = 19;
} else if (min_width <= 18 && max_width <= 20 && z_width <= 38) {
cell_size_name = "_20x18x64";
tgt_a_width = 20;
tgt_b_width = 18;
tgt_z_width = 38;
} else {
// Too wide
return;
}
cell_cfg_name = "_cfg_ports"; // TODO: remove if (a_width < b_width)
cell_full_name = cell_base_name + cell_size_name + cell_cfg_name; std::swap(sig_a, sig_b);
type = RTLIL::escape_id(cell_full_name); // Connect input data ports, sign extend / pad with zeros
log("Inferring MACC %zux%zu->%zu as %s from:\n", a_width, b_width, z_width, RTLIL::unescape_id(type).c_str()); sig_a.extend_u0(tgt_a_width, ab_signed);
sig_b.extend_u0(tgt_b_width, ab_signed);
cell->setPort(ID(a_i), sig_a);
cell->setPort(ID(b_i), sig_b);
for (auto cell : {st.mul, st.add, st.mux, st.ff}) { // Connect output data port, pad if needed
if (cell != nullptr) { if ((size_t) GetSize(sig_z) < tgt_z_width) {
log(" %s (%s)\n", RTLIL::unescape_id(cell->name).c_str(), RTLIL::unescape_id(cell->type).c_str()); auto *wire = pm.module->addWire(NEW_ID, tgt_z_width - GetSize(sig_z));
} sig_z.append(wire);
} }
cell->setPort(ID(z_o), sig_z);
// Build the DSP cell name // Connect clock, reset and enable
std::string name; cell->setPort(ID(clock_i), st.ff->getPort(ID(CLK)));
name += RTLIL::unescape_id(st.mul->name) + "_";
name += RTLIL::unescape_id(st.add->name) + "_";
if (st.mux != nullptr) {
name += RTLIL::unescape_id(st.mux->name) + "_";
}
name += RTLIL::unescape_id(st.ff->name);
// Add the DSP cell RTLIL::SigSpec rst;
RTLIL::Cell *cell = pm.module->addCell(RTLIL::escape_id(name), type); RTLIL::SigSpec ena;
// Set attributes if (st.ff->hasPort(ID(ARST))) {
cell->set_bool_attribute(RTLIL::escape_id("is_inferred"), true); if (st.ff->getParam(ID(ARST_POLARITY)).as_int() != 1) {
rst = pm.module->Not(NEW_ID, st.ff->getPort(ID(ARST)));
} else {
rst = st.ff->getPort(ID(ARST));
}
} else {
rst = RTLIL::SigSpec(RTLIL::S0);
}
// Get input/output data signals if (st.ff->hasPort(ID(EN))) {
RTLIL::SigSpec sig_a; if (st.ff->getParam(ID(EN_POLARITY)).as_int() != 1) {
RTLIL::SigSpec sig_b; ena = pm.module->Not(NEW_ID, st.ff->getPort(ID(EN)));
RTLIL::SigSpec sig_z; } else {
ena = st.ff->getPort(ID(EN));
}
} else {
ena = RTLIL::SigSpec(RTLIL::S1);
}
if (a_width >= b_width) { cell->setPort(ID(reset_i), rst);
sig_a = st.mul->getPort(ID(A)); cell->setPort(ID(load_acc_i), ena);
sig_b = st.mul->getPort(ID(B));
} else {
sig_a = st.mul->getPort(ID(B));
sig_b = st.mul->getPort(ID(A));
}
sig_z = out_ff ? st.ff->getPort(ID(Q)) : st.ff->getPort(ID(D)); // Insert feedback_i control logic used for clearing / loading the accumulator
if (st.mux_in_pattern) {
RTLIL::SigSpec sig_s = st.mux->getPort(ID(S));
// Connect input data ports, sign extend / pad with zeros // Depending on the mux port ordering insert inverter if needed
sig_a.extend_u0(tgt_a_width, a_signed); log_assert(st.mux_ab.in(ID(A), ID(B)));
sig_b.extend_u0(tgt_b_width, b_signed); if (st.mux_ab == ID(A))
cell->setPort(RTLIL::escape_id("a_i"), sig_a); sig_s = pm.module->Not(NEW_ID, sig_s);
cell->setPort(RTLIL::escape_id("b_i"), sig_b);
// Connect output data port, pad if needed // Assemble the full control signal for the feedback_i port
if ((size_t)GetSize(sig_z) < tgt_z_width) { RTLIL::SigSpec sig_f;
auto *wire = pm.module->addWire(NEW_ID, tgt_z_width - GetSize(sig_z)); sig_f.append(sig_s);
sig_z.append(wire); sig_f.append(RTLIL::S0);
} sig_f.append(RTLIL::S0);
cell->setPort(RTLIL::escape_id("z_o"), sig_z); cell->setPort(ID(feedback_i), sig_f);
}
// No acc clear/load
else {
cell->setPort(ID(feedback_i), RTLIL::SigSpec(RTLIL::S0, 3));
}
// Connect clock, reset and enable // Connect control ports
cell->setPort(RTLIL::escape_id("clock_i"), st.ff->getPort(ID(CLK))); cell->setPort(ID(unsigned_a_i), RTLIL::SigSpec(ab_signed ? RTLIL::S0 : RTLIL::S1));
cell->setPort(ID(unsigned_b_i), RTLIL::SigSpec(ab_signed ? RTLIL::S0 : RTLIL::S1));
RTLIL::SigSpec rst; // Connect config bits
RTLIL::SigSpec ena; cell->setPort(ID(saturate_enable_i), RTLIL::SigSpec(RTLIL::S0));
cell->setPort(ID(shift_right_i), RTLIL::SigSpec(RTLIL::S0, 6));
cell->setPort(ID(round_i), RTLIL::SigSpec(RTLIL::S0));
cell->setPort(ID(register_inputs_i), RTLIL::SigSpec(RTLIL::S0));
// 3 - output post acc; 1 - output pre acc
cell->setPort(ID(output_select_i), RTLIL::Const(st.output_registered ? 1 : 3, 3));
if (st.ff->hasPort(ID(ARST))) { bool subtract = (st.add->type == ID($sub));
if (st.ff->getParam(ID(ARST_POLARITY)).as_int() != 1) { cell->setPort(ID(subtract_i), RTLIL::SigSpec(subtract ? RTLIL::S1 : RTLIL::S0));
rst = pm.module->Not(NEW_ID, st.ff->getPort(ID(ARST)));
} else {
rst = st.ff->getPort(ID(ARST));
}
} else {
rst = RTLIL::SigSpec(RTLIL::S0);
}
if (st.ff->hasPort(ID(EN))) { // Mark the cells for removal
if (st.ff->getParam(ID(EN_POLARITY)).as_int() != 1) { pm.autoremove(st.mul);
ena = pm.module->Not(NEW_ID, st.ff->getPort(ID(EN))); pm.autoremove(st.add);
} else { if (st.mux != nullptr) {
ena = st.ff->getPort(ID(EN)); pm.autoremove(st.mux);
} }
} else { pm.autoremove(st.ff);
ena = RTLIL::SigSpec(RTLIL::S1);
}
cell->setPort(RTLIL::escape_id("reset_i"), rst);
cell->setPort(RTLIL::escape_id("load_acc_i"), ena);
// Insert feedback_i control logic used for clearing / loading the accumulator
if (st.mux != nullptr) {
RTLIL::SigSpec sig_s = st.mux->getPort(ID(S));
// Depending on the mux port ordering insert inverter if needed
log_assert(st.mux_ab == ID(A) || st.mux_ab == ID(B));
if (st.mux_ab == ID(A)) {
sig_s = pm.module->Not(NEW_ID, sig_s);
}
// Assemble the full control signal for the feedback_i port
RTLIL::SigSpec sig_f;
sig_f.append(sig_s);
sig_f.append(RTLIL::S0);
sig_f.append(RTLIL::S0);
cell->setPort(RTLIL::escape_id("feedback_i"), sig_f);
}
// No acc clear/load
else {
cell->setPort(RTLIL::escape_id("feedback_i"), RTLIL::SigSpec(RTLIL::S0, 3));
}
// Connect control ports
cell->setPort(RTLIL::escape_id("unsigned_a_i"), RTLIL::SigSpec(a_signed ? RTLIL::S0 : RTLIL::S1));
cell->setPort(RTLIL::escape_id("unsigned_b_i"), RTLIL::SigSpec(b_signed ? RTLIL::S0 : RTLIL::S1));
// Connect config bits
cell->setPort(RTLIL::escape_id("saturate_enable_i"), RTLIL::SigSpec(RTLIL::S0));
cell->setPort(RTLIL::escape_id("shift_right_i"), RTLIL::SigSpec(RTLIL::S0, 6));
cell->setPort(RTLIL::escape_id("round_i"), RTLIL::SigSpec(RTLIL::S0));
cell->setPort(RTLIL::escape_id("register_inputs_i"), RTLIL::SigSpec(RTLIL::S0));
// 3 - output post acc; 1 - output pre acc
cell->setPort(RTLIL::escape_id("output_select_i"), out_ff ? RTLIL::Const(1, 3) : RTLIL::Const(3, 3));
bool subtract = (st.add->type == RTLIL::escape_id("$sub"));
cell->setPort(RTLIL::escape_id("subtract_i"), RTLIL::SigSpec(subtract ? RTLIL::S1 : RTLIL::S0));
// Mark the cells for removal
pm.autoremove(st.mul);
pm.autoremove(st.add);
if (st.mux != nullptr) {
pm.autoremove(st.mux);
}
pm.autoremove(st.ff);
} }
struct QlDspMacc : public Pass { struct QlDspMacc : public Pass {
QlDspMacc() : Pass("ql_dsp_macc", "infer QuickLogic multiplier-accumulator DSP cells") {}
QlDspMacc() : Pass("ql_dsp_macc", "Does something") {}
void help() override void help() override
{ {
// |---v---|---v---|---v---|---v---|---v---|---v---|---v---|---v---|---v---|---v---|
log("\n"); log("\n");
log(" ql_dsp_macc [options] [selection]\n"); log(" ql_dsp_macc [selection]\n");
log("\n");
log("This pass looks for a multiply-accumulate pattern based on which it infers a\n");
log("QuickLogic DSP cell.\n");
log("\n"); log("\n");
} }
@ -271,9 +205,8 @@ struct QlDspMacc : public Pass {
} }
extra_args(a_Args, argidx, a_Design); extra_args(a_Args, argidx, a_Design);
for (auto module : a_Design->selected_modules()) { for (auto module : a_Design->selected_modules())
ql_dsp_macc_pm(module, module->selected_cells()).run_ql_dsp_macc(create_ql_macc_dsp); ql_dsp_macc_pm(module, module->selected_cells()).run_ql_dsp_macc(create_ql_macc_dsp);
}
} }
} QlDspMacc; } QlDspMacc;

View file

@ -1,48 +1,75 @@
pattern ql_dsp_macc pattern ql_dsp_macc
// Rough sketch: (mux is optional)
//
// /-----------------------\
// | |
// \ / |
// mul ----> add -----> mux -----> ff -+---->
// | /\
// | |
// --------------
state <IdString> add_ba state <IdString> add_ba
state <IdString> mux_ab state <IdString> mux_ab
state <int> mul_nusers // Is the output taken from before or after the FF?
state <int> add_nusers state <bool> output_registered
state <int> mux_nusers
state <int> ff_d_nusers
state <int> ff_q_nusers
// Is there a mux in the pattern?
state <bool> mux_in_pattern
code mux_in_pattern
mux_in_pattern = false;
branch;
mux_in_pattern = true;
endcode
// The multiplier is at the center of our pattern
match mul match mul
select mul->type.in($mul) select mul->type.in($mul)
// It has either two or three consumers depending on whether there's a mux
// in the pattern or not
select nusers(port(mul, \Y)) <= 3 select nusers(port(mul, \Y)) <= 3
set mul_nusers nusers(port(mul, \Y)) filter nusers(port(mul, \Y)) == (mux_in_pattern ? 3 : 2)
endmatch endmatch
code output_registered
output_registered = false;
branch;
output_registered = true;
endcode
match add match add
select add->type.in($add, $sub) select add->type.in($add, $sub)
choice <IdString> AB {\A, \B} choice <IdString> AB {\A, \B}
define <IdString> BA (AB == \A ? \B : \A) define <IdString> BA (AB == \A ? \B : \A)
// One input to the adder is fed by the multiplier
index <SigSpec> port(add, AB) === port(mul, \Y) index <SigSpec> port(add, AB) === port(mul, \Y)
select nusers(port(add, \Y)) <= 3 // Save the other input port, it needs to be fed by the flip-flop
set add_nusers nusers(port(add, \Y))
set add_ba BA set add_ba BA
// Adder has either two or three consumers; it will have three consumers
// IFF there's no mux in the pattern and the multiplier-accumulator result
// is taken unregistered
filter nusers(port(add, \Y)) == (!mux_in_pattern && !output_registered ? 3 : 2)
endmatch endmatch
match mux match mux
if mux_in_pattern
select mux->type.in($mux) select mux->type.in($mux)
choice <IdString> AB {\A, \B} choice <IdString> AB {\A, \B}
define <IdString> BA (AB == \A ? \B : \A) define <IdString> BA (AB == \A ? \B : \A)
index <SigSpec> port(mux, AB) === port(mul, \Y) index <SigSpec> port(mux, AB) === port(mul, \Y)
index <SigSpec> port(mux, BA) === port(add, \Y) index <SigSpec> port(mux, BA) === port(add, \Y)
select nusers(port(mux, \Y)) <= 3 filter nusers(port(mux, \Y)) == (output_registered ? 2 : 3)
set mux_nusers nusers(port(mux, \Y))
set mux_ab AB set mux_ab AB
optional
endmatch endmatch
match ff match ff
select ff->type.in($dff, $adff, $dffe, $adffe) select ff->type.in($dff, $adff, $dffe, $adffe)
index <SigSpec> port(ff, \D) === (mux == nullptr ? port(add, \Y) : port(mux, \Y)) select param(ff, \CLK_POLARITY).as_bool()
index <SigSpec> port(ff, \D) === mux_in_pattern ? port(mux, \Y) : port(add, \Y);
index <SigSpec> port(ff, \Q) === port(add, add_ba) index <SigSpec> port(ff, \Q) === port(add, add_ba)
set ff_d_nusers nusers(port(ff, \D)) filter nusers(port(ff, \Q)) == (output_registered ? 3 : 2)
set ff_q_nusers nusers(port(ff, \Q))
endmatch endmatch
code code