2018-06-23 21:07:22 +00:00
|
|
|
// -*- mode: C++; c-file-style: "cc-mode" -*-
|
|
|
|
//*************************************************************************
|
|
|
|
// DESCRIPTION: Verilator: Recreate loops to help pack caches
|
|
|
|
//
|
2019-11-08 03:33:59 +00:00
|
|
|
// Code available from: https://verilator.org
|
2018-06-23 21:07:22 +00:00
|
|
|
//
|
|
|
|
//*************************************************************************
|
|
|
|
//
|
2020-03-21 15:24:24 +00:00
|
|
|
// Copyright 2003-2020 by Wilson Snyder. This program is free software; you
|
|
|
|
// can redistribute it and/or modify it under the terms of either the GNU
|
2018-06-23 21:07:22 +00:00
|
|
|
// Lesser General Public License Version 3 or the Perl Artistic License
|
|
|
|
// Version 2.0.
|
2020-03-21 15:24:24 +00:00
|
|
|
// SPDX-License-Identifier: LGPL-3.0-only OR Artistic-2.0
|
2018-06-23 21:07:22 +00:00
|
|
|
//
|
|
|
|
//*************************************************************************
|
|
|
|
// V3Reloop's Transformations:
|
|
|
|
//
|
|
|
|
// Each CFunc:
|
|
|
|
// Look for a series of assignments that would look better in a loop:
|
|
|
|
//
|
|
|
|
// ASSIGN(ARRAYREF(var, #), ARRAYREF(var, #))
|
|
|
|
// ASSIGN(ARRAYREF(var, #+1), ARRAYREF(var, #+1))
|
|
|
|
// ->
|
|
|
|
// Create __Vilp local variable
|
|
|
|
// FOR(__Vilp = low; __Vilp <= high; ++__Vlip)
|
|
|
|
// ASSIGN(ARRAYREF(var, __Vilp), ARRAYREF(var, __Vilp))
|
|
|
|
//
|
|
|
|
// Likewise vector assign to the same constant converted to a loop.
|
|
|
|
//
|
|
|
|
//*************************************************************************
|
2019-10-05 00:17:11 +00:00
|
|
|
|
2018-06-23 21:07:22 +00:00
|
|
|
#include "config_build.h"
|
|
|
|
#include "verilatedos.h"
|
|
|
|
|
|
|
|
#include "V3Global.h"
|
|
|
|
#include "V3Reloop.h"
|
|
|
|
#include "V3Stats.h"
|
|
|
|
#include "V3Ast.h"
|
|
|
|
|
2018-10-14 17:43:24 +00:00
|
|
|
#include <algorithm>
|
|
|
|
|
2020-08-16 18:19:12 +00:00
|
|
|
constexpr unsigned RELOOP_MIN_ITERS = 40; // Need at least this many loops to do this optimization
|
2018-06-23 21:07:22 +00:00
|
|
|
|
|
|
|
//######################################################################
|
|
|
|
|
|
|
|
class ReloopVisitor : public AstNVisitor {
|
|
|
|
private:
|
|
|
|
// TYPES
|
2020-04-14 02:51:35 +00:00
|
|
|
typedef std::vector<AstNodeAssign*> AssVec;
|
2018-06-23 21:07:22 +00:00
|
|
|
|
|
|
|
// NODE STATE
|
|
|
|
// AstCFunc::user1p -> Var* for temp var, 0=not set yet
|
2020-04-14 02:51:35 +00:00
|
|
|
AstUser1InUse m_inuser1;
|
2018-06-23 21:07:22 +00:00
|
|
|
|
|
|
|
// STATE
|
2020-04-14 02:51:35 +00:00
|
|
|
VDouble0 m_statReloops; // Statistic tracking
|
|
|
|
VDouble0 m_statReItems; // Statistic tracking
|
2020-08-16 13:55:36 +00:00
|
|
|
AstCFunc* m_cfuncp = nullptr; // Current block
|
2018-06-23 21:07:22 +00:00
|
|
|
|
2020-04-14 02:51:35 +00:00
|
|
|
AssVec m_mgAssignps; // List of assignments merging
|
2020-08-16 13:55:36 +00:00
|
|
|
AstCFunc* m_mgCfuncp = nullptr; // Parent C function
|
|
|
|
AstNode* m_mgNextp = nullptr; // Next node
|
|
|
|
AstNodeSel* m_mgSelLp = nullptr; // Parent select, nullptr = idle
|
|
|
|
AstNodeSel* m_mgSelRp = nullptr; // Parent select, nullptr = constant
|
|
|
|
AstNodeVarRef* m_mgVarrefLp = nullptr; // Parent varref
|
|
|
|
AstNodeVarRef* m_mgVarrefRp = nullptr; // Parent varref, nullptr = constant
|
|
|
|
AstConst* m_mgConstRp = nullptr; // Parent RHS constant, nullptr = sel
|
|
|
|
uint32_t m_mgIndexLo = 0; // Merge range
|
|
|
|
uint32_t m_mgIndexHi = 0; // Merge range
|
2018-06-23 21:07:22 +00:00
|
|
|
|
|
|
|
// METHODS
|
|
|
|
VL_DEBUG_FUNC; // Declare debug()
|
|
|
|
|
2018-06-24 15:22:56 +00:00
|
|
|
AstVar* findCreateVarTemp(FileLine* fl, AstCFunc* cfuncp) {
|
|
|
|
AstVar* varp = VN_CAST(cfuncp->user1p(), Var);
|
2018-06-23 21:07:22 +00:00
|
|
|
if (!varp) {
|
|
|
|
string newvarname = string("__Vilp");
|
2020-04-14 02:51:35 +00:00
|
|
|
varp = new AstVar(fl, AstVarType::STMTTEMP, newvarname, VFlagLogicPacked(), 32);
|
2019-07-06 16:57:50 +00:00
|
|
|
UASSERT_OBJ(cfuncp, fl, "Assignment not under a function");
|
2018-06-24 15:22:56 +00:00
|
|
|
cfuncp->addInitsp(varp);
|
|
|
|
cfuncp->user1p(varp);
|
2018-06-23 21:07:22 +00:00
|
|
|
}
|
|
|
|
return varp;
|
|
|
|
}
|
|
|
|
void mergeEnd() {
|
|
|
|
if (!m_mgAssignps.empty()) {
|
|
|
|
uint32_t items = m_mgIndexHi - m_mgIndexLo + 1;
|
2020-04-14 02:51:35 +00:00
|
|
|
UINFO(9, "End merge iter=" << items << " " << m_mgIndexHi << ":" << m_mgIndexLo << " "
|
|
|
|
<< m_mgAssignps[0] << endl);
|
2018-06-23 21:07:22 +00:00
|
|
|
if (items >= RELOOP_MIN_ITERS) {
|
2020-04-14 02:51:35 +00:00
|
|
|
UINFO(6, "Reloop merging items=" << items << " " << m_mgIndexHi << ":"
|
|
|
|
<< m_mgIndexLo << " " << m_mgAssignps[0] << endl);
|
2018-06-23 21:07:22 +00:00
|
|
|
++m_statReloops;
|
|
|
|
m_statReItems += items;
|
|
|
|
|
|
|
|
// Transform first assign into for loop body
|
|
|
|
AstNodeAssign* bodyp = m_mgAssignps.front();
|
2019-07-06 16:57:50 +00:00
|
|
|
UASSERT_OBJ(bodyp->lhsp() == m_mgSelLp, bodyp, "Corrupt queue/state");
|
2018-06-23 21:07:22 +00:00
|
|
|
FileLine* fl = bodyp->fileline();
|
|
|
|
AstVar* itp = findCreateVarTemp(fl, m_mgCfuncp);
|
|
|
|
|
2020-09-07 21:09:25 +00:00
|
|
|
AstNode* initp = new AstAssign(fl, new AstVarRef(fl, itp, VAccess::WRITE),
|
2018-06-23 21:07:22 +00:00
|
|
|
new AstConst(fl, m_mgIndexLo));
|
2020-09-07 21:09:25 +00:00
|
|
|
AstNode* condp = new AstLte(fl, new AstVarRef(fl, itp, VAccess::READ),
|
|
|
|
new AstConst(fl, m_mgIndexHi));
|
2020-04-14 02:51:35 +00:00
|
|
|
AstNode* incp = new AstAssign(
|
2020-09-07 21:09:25 +00:00
|
|
|
fl, new AstVarRef(fl, itp, VAccess::WRITE),
|
|
|
|
new AstAdd(fl, new AstConst(fl, 1), new AstVarRef(fl, itp, VAccess::READ)));
|
2020-08-15 14:12:55 +00:00
|
|
|
AstWhile* whilep = new AstWhile(fl, condp, nullptr, incp);
|
2018-06-23 21:07:22 +00:00
|
|
|
initp->addNext(whilep);
|
|
|
|
bodyp->replaceWith(initp);
|
|
|
|
whilep->addBodysp(bodyp);
|
|
|
|
|
|
|
|
// Replace constant index with new loop index
|
|
|
|
AstNode* lbitp = m_mgSelLp->bitp();
|
2020-09-07 21:09:25 +00:00
|
|
|
lbitp->replaceWith(new AstVarRef(fl, itp, VAccess::READ));
|
2020-01-17 01:17:11 +00:00
|
|
|
VL_DO_DANGLING(lbitp->deleteTree(), lbitp);
|
2018-08-23 09:09:12 +00:00
|
|
|
if (m_mgSelRp) { // else constant and no replace
|
2018-06-23 21:07:22 +00:00
|
|
|
AstNode* rbitp = m_mgSelRp->bitp();
|
2020-09-07 21:09:25 +00:00
|
|
|
rbitp->replaceWith(new AstVarRef(fl, itp, VAccess::READ));
|
2020-01-17 01:17:11 +00:00
|
|
|
VL_DO_DANGLING(rbitp->deleteTree(), lbitp);
|
2018-06-23 21:07:22 +00:00
|
|
|
}
|
2020-04-14 02:51:35 +00:00
|
|
|
if (debug() >= 9) initp->dumpTree(cout, "-new: ");
|
|
|
|
if (debug() >= 9) whilep->dumpTree(cout, "-new: ");
|
2018-06-23 21:07:22 +00:00
|
|
|
|
|
|
|
// Remove remaining assigns
|
2020-08-16 15:43:49 +00:00
|
|
|
for (AstNodeAssign* assp : m_mgAssignps) {
|
2018-06-23 21:07:22 +00:00
|
|
|
if (assp != bodyp) {
|
2020-01-17 01:17:11 +00:00
|
|
|
VL_DO_DANGLING(assp->unlinkFrBack()->deleteTree(), assp);
|
2018-06-23 21:07:22 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// Setup for next merge
|
|
|
|
m_mgAssignps.clear();
|
2020-08-15 14:12:55 +00:00
|
|
|
m_mgSelLp = nullptr;
|
|
|
|
m_mgSelRp = nullptr;
|
|
|
|
m_mgVarrefLp = nullptr;
|
|
|
|
m_mgVarrefRp = nullptr;
|
|
|
|
m_mgConstRp = nullptr;
|
2018-06-23 21:07:22 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// VISITORS
|
2020-08-15 14:03:34 +00:00
|
|
|
virtual void visit(AstCFunc* nodep) override {
|
2018-06-23 21:07:22 +00:00
|
|
|
m_cfuncp = nodep;
|
|
|
|
iterateChildren(nodep);
|
2020-08-15 14:12:55 +00:00
|
|
|
m_cfuncp = nullptr;
|
2018-06-23 21:07:22 +00:00
|
|
|
}
|
2020-08-15 14:03:34 +00:00
|
|
|
virtual void visit(AstNodeAssign* nodep) override {
|
2018-06-23 21:07:22 +00:00
|
|
|
if (!m_cfuncp) return;
|
|
|
|
|
|
|
|
// Left select WordSel or ArraySel
|
|
|
|
AstNodeSel* lselp = VN_CAST(nodep->lhsp(), NodeSel);
|
2020-04-14 02:51:35 +00:00
|
|
|
if (!lselp) { // Not ever merged
|
|
|
|
mergeEnd();
|
|
|
|
return;
|
|
|
|
}
|
2018-06-23 21:07:22 +00:00
|
|
|
// Of a constant index
|
|
|
|
AstConst* lbitp = VN_CAST(lselp->bitp(), Const);
|
2020-04-14 02:51:35 +00:00
|
|
|
if (!lbitp) {
|
|
|
|
mergeEnd();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (lbitp->width() > 32) { // Assoc arrays can do this
|
|
|
|
mergeEnd();
|
|
|
|
return;
|
|
|
|
}
|
2018-06-23 21:07:22 +00:00
|
|
|
uint32_t index = lbitp->toUInt();
|
|
|
|
// Of variable
|
|
|
|
AstNodeVarRef* lvarrefp = VN_CAST(lselp->fromp(), NodeVarRef);
|
2020-04-14 02:51:35 +00:00
|
|
|
if (!lvarrefp) {
|
|
|
|
mergeEnd();
|
|
|
|
return;
|
|
|
|
}
|
2018-06-23 21:07:22 +00:00
|
|
|
|
|
|
|
// RHS is a constant or a select
|
|
|
|
AstConst* rconstp = VN_CAST(nodep->rhsp(), Const);
|
|
|
|
AstNodeSel* rselp = VN_CAST(nodep->rhsp(), NodeSel);
|
2020-08-15 14:12:55 +00:00
|
|
|
AstNodeVarRef* rvarrefp = nullptr;
|
2018-06-23 21:07:22 +00:00
|
|
|
if (rconstp) { // Ok
|
|
|
|
} else {
|
2020-04-14 02:51:35 +00:00
|
|
|
if (!rselp) {
|
|
|
|
mergeEnd();
|
|
|
|
return;
|
|
|
|
}
|
2018-06-23 21:07:22 +00:00
|
|
|
AstConst* rbitp = VN_CAST(rselp->bitp(), Const);
|
|
|
|
rvarrefp = VN_CAST(rselp->fromp(), NodeVarRef);
|
2020-04-14 02:51:35 +00:00
|
|
|
if (!rbitp || rbitp->toUInt() != index || !rvarrefp
|
2018-06-23 21:07:22 +00:00
|
|
|
|| lvarrefp->varp() == rvarrefp->varp()) {
|
2020-04-14 02:51:35 +00:00
|
|
|
mergeEnd();
|
|
|
|
return;
|
2018-06-23 21:07:22 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-08-23 09:09:12 +00:00
|
|
|
if (m_mgSelLp) { // Old merge
|
2020-04-14 02:51:35 +00:00
|
|
|
if (m_mgCfuncp == m_cfuncp && m_mgNextp == nodep && m_mgSelLp->same(lselp)
|
2018-06-23 21:07:22 +00:00
|
|
|
&& m_mgVarrefLp->same(lvarrefp)
|
|
|
|
&& (m_mgConstRp
|
2020-04-14 02:51:35 +00:00
|
|
|
? (rconstp && m_mgConstRp->same(rconstp))
|
|
|
|
: (rselp && m_mgSelRp->same(rselp) && m_mgVarrefRp->same(rvarrefp)))
|
|
|
|
&& (index == m_mgIndexLo - 1 || index == m_mgIndexHi + 1)) {
|
2018-06-23 21:07:22 +00:00
|
|
|
// Sequentially next to last assign; continue merge
|
2020-04-14 02:51:35 +00:00
|
|
|
if (index == m_mgIndexLo - 1) {
|
|
|
|
m_mgIndexLo = index;
|
|
|
|
} else if (index == m_mgIndexHi + 1) {
|
|
|
|
m_mgIndexHi = index;
|
|
|
|
}
|
|
|
|
UINFO(9, "Continue merge i=" << index << " " << m_mgIndexHi << ":" << m_mgIndexLo
|
|
|
|
<< " " << nodep << endl);
|
2018-06-23 21:07:22 +00:00
|
|
|
m_mgAssignps.push_back(nodep);
|
|
|
|
m_mgNextp = nodep->nextp();
|
|
|
|
return;
|
2020-04-14 02:51:35 +00:00
|
|
|
} else {
|
2018-06-23 21:07:22 +00:00
|
|
|
// This assign doesn't merge with previous assign,
|
|
|
|
// but should start a new merge
|
|
|
|
mergeEnd();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Merge start
|
|
|
|
m_mgAssignps.push_back(nodep);
|
|
|
|
m_mgCfuncp = m_cfuncp;
|
|
|
|
m_mgNextp = nodep->nextp();
|
|
|
|
m_mgSelLp = lselp;
|
|
|
|
m_mgSelRp = rselp;
|
|
|
|
m_mgVarrefLp = lvarrefp;
|
|
|
|
m_mgVarrefRp = rvarrefp;
|
|
|
|
m_mgConstRp = rconstp;
|
|
|
|
m_mgIndexLo = index;
|
|
|
|
m_mgIndexHi = index;
|
2020-04-14 02:51:35 +00:00
|
|
|
UINFO(9, "Start merge i=" << index << " " << nodep << endl);
|
2018-06-23 21:07:22 +00:00
|
|
|
}
|
|
|
|
//--------------------
|
2020-08-15 14:03:34 +00:00
|
|
|
virtual void visit(AstVar*) override {} // Accelerate
|
|
|
|
virtual void visit(AstNodeMath*) override {} // Accelerate
|
|
|
|
virtual void visit(AstNode* nodep) override { iterateChildren(nodep); }
|
2018-06-23 21:07:22 +00:00
|
|
|
|
|
|
|
public:
|
2019-09-12 11:22:22 +00:00
|
|
|
// CONSTRUCTORS
|
2020-08-16 13:55:36 +00:00
|
|
|
explicit ReloopVisitor(AstNetlist* nodep) { iterate(nodep); }
|
2020-08-15 15:44:10 +00:00
|
|
|
virtual ~ReloopVisitor() override {
|
2018-06-23 21:07:22 +00:00
|
|
|
V3Stats::addStat("Optimizations, Reloops", m_statReloops);
|
|
|
|
V3Stats::addStat("Optimizations, Reloop iterations", m_statReItems);
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
//######################################################################
|
|
|
|
// Reloop class functions
|
|
|
|
|
|
|
|
void V3Reloop::reloopAll(AstNetlist* nodep) {
|
2020-04-14 02:51:35 +00:00
|
|
|
UINFO(2, __FUNCTION__ << ": " << endl);
|
|
|
|
{ ReloopVisitor visitor(nodep); } // Destruct before checking
|
2018-06-23 21:07:22 +00:00
|
|
|
V3Global::dumpCheckGlobalTree("reloop", 0, v3Global.opt.dumpTreeLevel(__FILE__) >= 6);
|
|
|
|
}
|