V3Simulate: Avoid copying while managing free list.

V3Simulate reuses allocated AstConst nodes for efficiency, however this
used to be implemented in a way that required a deep copy of a
std::unorderd_map<_, std::deque<_>>, which was quite inefficient when it
grew large. The free list is now managed without any copying. This takes
the V3Table pass from taking 12s to 0.2s on SweRV EH1.
This commit is contained in:
Geza Lore 2021-07-05 16:35:24 +01:00
parent 2a7aa28b20
commit 2ebed755e6
2 changed files with 32 additions and 22 deletions

View File

@ -32,6 +32,7 @@ Verilator 4.205 devel
* In XML, show pinIndex information (#2877). [errae233] * In XML, show pinIndex information (#2877). [errae233]
* Fix error on unsupported recursive functions (#2957). [Trefor Southwell] * Fix error on unsupported recursive functions (#2957). [Trefor Southwell]
* Fix type parameter specialization when struct names are same (#3055). [7FM] * Fix type parameter specialization when struct names are same (#3055). [7FM]
* Improve speed of table optimization (-OA) pass. [Geza Lore]
Verilator 4.204 2021-06-12 Verilator 4.204 2021-06-12

View File

@ -61,9 +61,6 @@ public:
~SimStackNode() = default; ~SimStackNode() = default;
}; };
using ConstDeque = std::deque<AstConst*>;
using ConstPile = std::unordered_map<const AstNodeDType*, ConstDeque>;
class SimulateVisitor VL_NOT_FINAL : public AstNVisitor { class SimulateVisitor VL_NOT_FINAL : public AstNVisitor {
// Simulate a node tree, returning value of variables // Simulate a node tree, returning value of variables
// Two major operating modes: // Two major operating modes:
@ -82,6 +79,7 @@ private:
// Checking: // Checking:
// AstVar(Scope)::user1() -> VarUsage. Set true to indicate tracking as lvalue/rvalue // AstVar(Scope)::user1() -> VarUsage. Set true to indicate tracking as lvalue/rvalue
// Simulating: // Simulating:
// AstConst::user2() -> bool. This AstConst (allocated by this class) is in use
// AstVar(Scope)::user3() -> AstConst*. Input value of variable or node // AstVar(Scope)::user3() -> AstConst*. Input value of variable or node
// (and output for non-delayed assignments) // (and output for non-delayed assignments)
// AstVar(Scope)::user2() -> AstCont*. Output value of variable (delayed assignments) // AstVar(Scope)::user2() -> AstCont*. Output value of variable (delayed assignments)
@ -103,8 +101,8 @@ private:
int m_dataCount; ///< Bytes of data int m_dataCount; ///< Bytes of data
AstJumpGo* m_jumpp; ///< Jump label we're branching from AstJumpGo* m_jumpp; ///< Jump label we're branching from
// Simulating: // Simulating:
ConstPile m_constFreeps; ///< List of all AstConst* free and not in use std::unordered_map<const AstNodeDType*, std::deque<AstConst*>>
ConstPile m_constAllps; ///< List of all AstConst* free and in use m_constps; ///< Lists of all AstConst* allocated per dtype
std::vector<SimStackNode*> m_callStack; ///< Call stack for verbose error messages std::vector<SimStackNode*> m_callStack; ///< Call stack for verbose error messages
// Cleanup // Cleanup
@ -214,16 +212,31 @@ private:
// It would be more efficient to do this by size, but the extra accounting // It would be more efficient to do this by size, but the extra accounting
// slows things down more than we gain. // slows things down more than we gain.
AstConst* constp; AstConst* constp;
AstNodeDType* dtypep = nodep->dtypep(); // Grab free list corresponding to this dtype
if (!m_constFreeps[dtypep].empty()) { std::deque<AstConst*>& freeList = m_constps[nodep->dtypep()];
// UINFO(7, "Num Reuse " << nodep->width() << endl); bool allocNewConst = true;
constp = m_constFreeps[dtypep].back(); if (!freeList.empty()) {
m_constFreeps[dtypep].pop_back(); constp = freeList.front();
constp->num().nodep(nodep); if (!constp->user2()) {
} else { // Front of free list is free, reuse it (otherwise allocate new node)
// UINFO(7, "Num New " << nodep->width() << endl); allocNewConst = false; // No need to allocate
// Mark the AstConst node as used, and move it to the back of the free list. This
// ensures that when all AstConst instances within the list are used, then the
// front of the list will be marked as used, in which case the enclosing 'if' will
// fail and we fall back to allocation.
constp->user2(1);
freeList.pop_front();
freeList.push_back(constp);
// configure const
constp->num().nodep(nodep);
}
}
if (allocNewConst) {
// Need to allocate new constant
constp = new AstConst(nodep->fileline(), AstConst::DtypedValue(), nodep->dtypep(), 0); constp = new AstConst(nodep->fileline(), AstConst::DtypedValue(), nodep->dtypep(), 0);
m_constAllps[constp->dtypep()].push_back(constp); // Mark as in use, add to free list for later reuse
constp->user2(1);
freeList.push_back(constp);
} }
constp->num().isDouble(nodep->isDouble()); constp->num().isDouble(nodep->isDouble());
constp->num().isString(nodep->isString()); constp->num().isString(nodep->isString());
@ -1122,11 +1135,8 @@ public:
m_jumpp = nullptr; m_jumpp = nullptr;
AstNode::user1ClearTree(); AstNode::user1ClearTree();
AstNode::user2ClearTree(); AstNode::user2ClearTree(); // Also marks all elements in m_constps as free
AstNode::user3ClearTree(); AstNode::user3ClearTree();
// Move all allocated numbers to the free pool
m_constFreeps = m_constAllps;
} }
void mainTableCheck(AstNode* nodep) { void mainTableCheck(AstNode* nodep) {
setMode(true /*scoped*/, true /*checking*/, false /*params*/); setMode(true /*scoped*/, true /*checking*/, false /*params*/);
@ -1145,13 +1155,12 @@ public:
mainGuts(nodep); mainGuts(nodep);
} }
virtual ~SimulateVisitor() override { virtual ~SimulateVisitor() override {
for (const auto& i : m_constAllps) { for (const auto& pair : m_constps) {
for (AstConst* i2p : i.second) delete i2p; for (AstConst* const constp : pair.second) { delete constp; }
} }
m_constps.clear();
for (AstNode* ip : m_reclaimValuesp) delete ip; for (AstNode* ip : m_reclaimValuesp) delete ip;
m_reclaimValuesp.clear(); m_reclaimValuesp.clear();
m_constFreeps.clear();
m_constAllps.clear();
} }
}; };