forked from github/verilator
Rename some internals related to multi-threaded tracing
Rename the implementation internals of current multi-threaded tracing to be "offload mode". No functional change, nor user interface change intended.
This commit is contained in:
parent
9edccfdffa
commit
551bd284dd
@ -22,6 +22,10 @@
|
|||||||
#ifndef VERILATOR_VERILATED_TRACE_H_
|
#ifndef VERILATOR_VERILATED_TRACE_H_
|
||||||
#define VERILATOR_VERILATED_TRACE_H_
|
#define VERILATOR_VERILATED_TRACE_H_
|
||||||
|
|
||||||
|
#ifdef VL_TRACE_THREADED
|
||||||
|
#define VL_TRACE_OFFLOAD
|
||||||
|
#endif
|
||||||
|
|
||||||
// clang-format off
|
// clang-format off
|
||||||
|
|
||||||
#include "verilated.h"
|
#include "verilated.h"
|
||||||
@ -32,7 +36,7 @@
|
|||||||
#include <string>
|
#include <string>
|
||||||
#include <vector>
|
#include <vector>
|
||||||
|
|
||||||
#ifdef VL_TRACE_THREADED
|
#ifdef VL_TRACE_OFFLOAD
|
||||||
# include <condition_variable>
|
# include <condition_variable>
|
||||||
# include <deque>
|
# include <deque>
|
||||||
# include <thread>
|
# include <thread>
|
||||||
@ -40,9 +44,9 @@
|
|||||||
|
|
||||||
// clang-format on
|
// clang-format on
|
||||||
|
|
||||||
#ifdef VL_TRACE_THREADED
|
#ifdef VL_TRACE_OFFLOAD
|
||||||
//=============================================================================
|
//=============================================================================
|
||||||
// Threaded tracing
|
// Offloaded tracing
|
||||||
|
|
||||||
// A simple synchronized first in first out queue
|
// A simple synchronized first in first out queue
|
||||||
template <class T> class VerilatedThreadQueue final { // LCOV_EXCL_LINE // lcov bug
|
template <class T> class VerilatedThreadQueue final { // LCOV_EXCL_LINE // lcov bug
|
||||||
@ -88,7 +92,7 @@ public:
|
|||||||
|
|
||||||
// Commands used by thread tracing. Anonymous enum in class, as we want
|
// Commands used by thread tracing. Anonymous enum in class, as we want
|
||||||
// it scoped, but we also want the automatic conversion to integer types.
|
// it scoped, but we also want the automatic conversion to integer types.
|
||||||
class VerilatedTraceCommand final {
|
class VerilatedTraceOffloadCommand final {
|
||||||
public:
|
public:
|
||||||
// These must all fit in 4 bit at the moment, as the tracing routines
|
// These must all fit in 4 bit at the moment, as the tracing routines
|
||||||
// pack parameters in the top bits.
|
// pack parameters in the top bits.
|
||||||
@ -172,33 +176,33 @@ private:
|
|||||||
// Close the file on termination
|
// Close the file on termination
|
||||||
static void onExit(void* selfp) VL_MT_UNSAFE_ONE;
|
static void onExit(void* selfp) VL_MT_UNSAFE_ONE;
|
||||||
|
|
||||||
#ifdef VL_TRACE_THREADED
|
#ifdef VL_TRACE_OFFLOAD
|
||||||
// Number of total trace buffers that have been allocated
|
// Number of total offload buffers that have been allocated
|
||||||
uint32_t m_numTraceBuffers;
|
uint32_t m_numOffloadBuffers;
|
||||||
// Size of trace buffers
|
// Size of offload buffers
|
||||||
size_t m_traceBufferSize;
|
size_t m_offloadBufferSize;
|
||||||
// Buffers handed to worker for processing
|
// Buffers handed to worker for processing
|
||||||
VerilatedThreadQueue<uint32_t*> m_buffersToWorker;
|
VerilatedThreadQueue<uint32_t*> m_offloadBuffersToWorker;
|
||||||
// Buffers returned from worker after processing
|
// Buffers returned from worker after processing
|
||||||
VerilatedThreadQueue<uint32_t*> m_buffersFromWorker;
|
VerilatedThreadQueue<uint32_t*> m_offloadBuffersFromWorker;
|
||||||
// Write pointer into current buffer
|
// Write pointer into current buffer
|
||||||
uint32_t* m_traceBufferWritep;
|
uint32_t* m_offloadBufferWritep;
|
||||||
// End of trace buffer
|
// End of offload buffer
|
||||||
uint32_t* m_traceBufferEndp;
|
uint32_t* m_offloadBufferEndp;
|
||||||
// The worker thread itself
|
// The offload worker thread itself
|
||||||
std::unique_ptr<std::thread> m_workerThread;
|
std::unique_ptr<std::thread> m_workerThread;
|
||||||
|
|
||||||
// Get a new trace buffer that can be populated. May block if none available
|
// Get a new offload buffer that can be populated. May block if none available
|
||||||
uint32_t* getTraceBuffer();
|
uint32_t* getOffloadBuffer();
|
||||||
|
|
||||||
// The function executed by the worker thread
|
// The function executed by the offload worker thread
|
||||||
void workerThreadMain();
|
void offloadWorkerThreadMain();
|
||||||
|
|
||||||
// Wait until given buffer is placed in m_buffersFromWorker
|
// Wait until given offload buffer is placed in m_offloadBuffersFromWorker
|
||||||
void waitForBuffer(const uint32_t* bufferp);
|
void waitForOffloadBuffer(const uint32_t* bufferp);
|
||||||
|
|
||||||
// Shut down and join worker, if it's running, otherwise do nothing
|
// Shut down and join worker, if it's running, otherwise do nothing
|
||||||
void shutdownWorker();
|
void shutdownOffloadWorker();
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
// CONSTRUCTORS
|
// CONSTRUCTORS
|
||||||
@ -307,56 +311,56 @@ public:
|
|||||||
void fullWData(uint32_t* oldp, const WData* newvalp, int bits);
|
void fullWData(uint32_t* oldp, const WData* newvalp, int bits);
|
||||||
void fullDouble(uint32_t* oldp, double newval);
|
void fullDouble(uint32_t* oldp, double newval);
|
||||||
|
|
||||||
#ifdef VL_TRACE_THREADED
|
#ifdef VL_TRACE_OFFLOAD
|
||||||
// Threaded tracing. Just dump everything in the trace buffer
|
// Offloaded tracing. Just dump everything in the offload buffer
|
||||||
inline void chgBit(uint32_t code, CData newval) {
|
inline void chgBit(uint32_t code, CData newval) {
|
||||||
m_traceBufferWritep[0] = VerilatedTraceCommand::CHG_BIT_0 | newval;
|
m_offloadBufferWritep[0] = VerilatedTraceOffloadCommand::CHG_BIT_0 | newval;
|
||||||
m_traceBufferWritep[1] = code;
|
m_offloadBufferWritep[1] = code;
|
||||||
m_traceBufferWritep += 2;
|
m_offloadBufferWritep += 2;
|
||||||
VL_DEBUG_IF(assert(m_traceBufferWritep <= m_traceBufferEndp););
|
VL_DEBUG_IF(assert(m_offloadBufferWritep <= m_offloadBufferEndp););
|
||||||
}
|
}
|
||||||
inline void chgCData(uint32_t code, CData newval, int bits) {
|
inline void chgCData(uint32_t code, CData newval, int bits) {
|
||||||
m_traceBufferWritep[0] = (bits << 4) | VerilatedTraceCommand::CHG_CDATA;
|
m_offloadBufferWritep[0] = (bits << 4) | VerilatedTraceOffloadCommand::CHG_CDATA;
|
||||||
m_traceBufferWritep[1] = code;
|
m_offloadBufferWritep[1] = code;
|
||||||
m_traceBufferWritep[2] = newval;
|
m_offloadBufferWritep[2] = newval;
|
||||||
m_traceBufferWritep += 3;
|
m_offloadBufferWritep += 3;
|
||||||
VL_DEBUG_IF(assert(m_traceBufferWritep <= m_traceBufferEndp););
|
VL_DEBUG_IF(assert(m_offloadBufferWritep <= m_offloadBufferEndp););
|
||||||
}
|
}
|
||||||
inline void chgSData(uint32_t code, SData newval, int bits) {
|
inline void chgSData(uint32_t code, SData newval, int bits) {
|
||||||
m_traceBufferWritep[0] = (bits << 4) | VerilatedTraceCommand::CHG_SDATA;
|
m_offloadBufferWritep[0] = (bits << 4) | VerilatedTraceOffloadCommand::CHG_SDATA;
|
||||||
m_traceBufferWritep[1] = code;
|
m_offloadBufferWritep[1] = code;
|
||||||
m_traceBufferWritep[2] = newval;
|
m_offloadBufferWritep[2] = newval;
|
||||||
m_traceBufferWritep += 3;
|
m_offloadBufferWritep += 3;
|
||||||
VL_DEBUG_IF(assert(m_traceBufferWritep <= m_traceBufferEndp););
|
VL_DEBUG_IF(assert(m_offloadBufferWritep <= m_offloadBufferEndp););
|
||||||
}
|
}
|
||||||
inline void chgIData(uint32_t code, IData newval, int bits) {
|
inline void chgIData(uint32_t code, IData newval, int bits) {
|
||||||
m_traceBufferWritep[0] = (bits << 4) | VerilatedTraceCommand::CHG_IDATA;
|
m_offloadBufferWritep[0] = (bits << 4) | VerilatedTraceOffloadCommand::CHG_IDATA;
|
||||||
m_traceBufferWritep[1] = code;
|
m_offloadBufferWritep[1] = code;
|
||||||
m_traceBufferWritep[2] = newval;
|
m_offloadBufferWritep[2] = newval;
|
||||||
m_traceBufferWritep += 3;
|
m_offloadBufferWritep += 3;
|
||||||
VL_DEBUG_IF(assert(m_traceBufferWritep <= m_traceBufferEndp););
|
VL_DEBUG_IF(assert(m_offloadBufferWritep <= m_offloadBufferEndp););
|
||||||
}
|
}
|
||||||
inline void chgQData(uint32_t code, QData newval, int bits) {
|
inline void chgQData(uint32_t code, QData newval, int bits) {
|
||||||
m_traceBufferWritep[0] = (bits << 4) | VerilatedTraceCommand::CHG_QDATA;
|
m_offloadBufferWritep[0] = (bits << 4) | VerilatedTraceOffloadCommand::CHG_QDATA;
|
||||||
m_traceBufferWritep[1] = code;
|
m_offloadBufferWritep[1] = code;
|
||||||
*reinterpret_cast<QData*>(m_traceBufferWritep + 2) = newval;
|
*reinterpret_cast<QData*>(m_offloadBufferWritep + 2) = newval;
|
||||||
m_traceBufferWritep += 4;
|
m_offloadBufferWritep += 4;
|
||||||
VL_DEBUG_IF(assert(m_traceBufferWritep <= m_traceBufferEndp););
|
VL_DEBUG_IF(assert(m_offloadBufferWritep <= m_offloadBufferEndp););
|
||||||
}
|
}
|
||||||
inline void chgWData(uint32_t code, const WData* newvalp, int bits) {
|
inline void chgWData(uint32_t code, const WData* newvalp, int bits) {
|
||||||
m_traceBufferWritep[0] = (bits << 4) | VerilatedTraceCommand::CHG_WDATA;
|
m_offloadBufferWritep[0] = (bits << 4) | VerilatedTraceOffloadCommand::CHG_WDATA;
|
||||||
m_traceBufferWritep[1] = code;
|
m_offloadBufferWritep[1] = code;
|
||||||
m_traceBufferWritep += 2;
|
m_offloadBufferWritep += 2;
|
||||||
for (int i = 0; i < (bits + 31) / 32; ++i) { *m_traceBufferWritep++ = newvalp[i]; }
|
for (int i = 0; i < (bits + 31) / 32; ++i) { *m_offloadBufferWritep++ = newvalp[i]; }
|
||||||
VL_DEBUG_IF(assert(m_traceBufferWritep <= m_traceBufferEndp););
|
VL_DEBUG_IF(assert(m_offloadBufferWritep <= m_offloadBufferEndp););
|
||||||
}
|
}
|
||||||
inline void chgDouble(uint32_t code, double newval) {
|
inline void chgDouble(uint32_t code, double newval) {
|
||||||
m_traceBufferWritep[0] = VerilatedTraceCommand::CHG_DOUBLE;
|
m_offloadBufferWritep[0] = VerilatedTraceOffloadCommand::CHG_DOUBLE;
|
||||||
m_traceBufferWritep[1] = code;
|
m_offloadBufferWritep[1] = code;
|
||||||
// cppcheck-suppress invalidPointerCast
|
// cppcheck-suppress invalidPointerCast
|
||||||
*reinterpret_cast<double*>(m_traceBufferWritep + 2) = newval;
|
*reinterpret_cast<double*>(m_offloadBufferWritep + 2) = newval;
|
||||||
m_traceBufferWritep += 4;
|
m_offloadBufferWritep += 4;
|
||||||
VL_DEBUG_IF(assert(m_traceBufferWritep <= m_traceBufferEndp););
|
VL_DEBUG_IF(assert(m_offloadBufferWritep <= m_offloadBufferEndp););
|
||||||
}
|
}
|
||||||
|
|
||||||
#define CHG(name) chg##name##Impl
|
#define CHG(name) chg##name##Impl
|
||||||
@ -364,8 +368,8 @@ public:
|
|||||||
#define CHG(name) chg##name
|
#define CHG(name) chg##name
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
// In non-threaded mode, these are called directly by the trace callbacks,
|
// In non-offload mode, these are called directly by the trace callbacks,
|
||||||
// and are called chg*. In threaded mode, they are called by the worker
|
// and are called chg*. In offload mode, they are called by the worker
|
||||||
// thread and are called chg*Impl
|
// thread and are called chg*Impl
|
||||||
|
|
||||||
// Check previous dumped value of signal. If changed, then emit trace entry
|
// Check previous dumped value of signal. If changed, then emit trace entry
|
||||||
|
@ -33,9 +33,9 @@
|
|||||||
|
|
||||||
#if 0
|
#if 0
|
||||||
# include <iostream>
|
# include <iostream>
|
||||||
# define VL_TRACE_THREAD_DEBUG(msg) std::cout << "TRACE THREAD: " << msg << std::endl
|
# define VL_TRACE_OFFLOAD_DEBUG(msg) std::cout << "TRACE OFFLOAD THREAD: " << msg << std::endl
|
||||||
#else
|
#else
|
||||||
# define VL_TRACE_THREAD_DEBUG(msg)
|
# define VL_TRACE_OFFLOAD_DEBUG(msg)
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
// clang-format on
|
// clang-format on
|
||||||
@ -78,37 +78,37 @@ static std::string doubleToTimescale(double value) {
|
|||||||
return valuestr; // Gets converted to string, so no ref to stack
|
return valuestr; // Gets converted to string, so no ref to stack
|
||||||
}
|
}
|
||||||
|
|
||||||
#ifdef VL_TRACE_THREADED
|
#ifdef VL_TRACE_OFFLOAD
|
||||||
//=========================================================================
|
//=========================================================================
|
||||||
// Buffer management
|
// Buffer management
|
||||||
|
|
||||||
template <> uint32_t* VerilatedTrace<VL_DERIVED_T>::getTraceBuffer() {
|
template <> uint32_t* VerilatedTrace<VL_DERIVED_T>::getOffloadBuffer() {
|
||||||
uint32_t* bufferp;
|
uint32_t* bufferp;
|
||||||
// Some jitter is expected, so some number of alternative trace buffers are
|
// Some jitter is expected, so some number of alternative offlaod buffers are
|
||||||
// required, but don't allocate more than 8 buffers.
|
// required, but don't allocate more than 8 buffers.
|
||||||
if (m_numTraceBuffers < 8) {
|
if (m_numOffloadBuffers < 8) {
|
||||||
// Allocate a new buffer if none is available
|
// Allocate a new buffer if none is available
|
||||||
if (!m_buffersFromWorker.tryGet(bufferp)) {
|
if (!m_offloadBuffersFromWorker.tryGet(bufferp)) {
|
||||||
++m_numTraceBuffers;
|
++m_numOffloadBuffers;
|
||||||
// Note: over allocate a bit so pointer comparison is well defined
|
// Note: over allocate a bit so pointer comparison is well defined
|
||||||
// if we overflow only by a small amount
|
// if we overflow only by a small amount
|
||||||
bufferp = new uint32_t[m_traceBufferSize + 16];
|
bufferp = new uint32_t[m_offloadBufferSize + 16];
|
||||||
}
|
}
|
||||||
} else {
|
} else {
|
||||||
// Block until a buffer becomes available
|
// Block until a buffer becomes available
|
||||||
bufferp = m_buffersFromWorker.get();
|
bufferp = m_offloadBuffersFromWorker.get();
|
||||||
}
|
}
|
||||||
return bufferp;
|
return bufferp;
|
||||||
}
|
}
|
||||||
|
|
||||||
template <> void VerilatedTrace<VL_DERIVED_T>::waitForBuffer(const uint32_t* buffp) {
|
template <> void VerilatedTrace<VL_DERIVED_T>::waitForOffloadBuffer(const uint32_t* buffp) {
|
||||||
// Slow path code only called on flush/shutdown, so use a simple algorithm.
|
// Slow path code only called on flush/shutdown, so use a simple algorithm.
|
||||||
// Collect buffers from worker and stash them until we get the one we want.
|
// Collect buffers from worker and stash them until we get the one we want.
|
||||||
std::deque<uint32_t*> stash;
|
std::deque<uint32_t*> stash;
|
||||||
do { stash.push_back(m_buffersFromWorker.get()); } while (stash.back() != buffp);
|
do { stash.push_back(m_offloadBuffersFromWorker.get()); } while (stash.back() != buffp);
|
||||||
// Now put them back in the queue, in the original order.
|
// Now put them back in the queue, in the original order.
|
||||||
while (!stash.empty()) {
|
while (!stash.empty()) {
|
||||||
m_buffersFromWorker.put_front(stash.back());
|
m_offloadBuffersFromWorker.put_front(stash.back());
|
||||||
stash.pop_back();
|
stash.pop_back();
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -116,14 +116,14 @@ template <> void VerilatedTrace<VL_DERIVED_T>::waitForBuffer(const uint32_t* buf
|
|||||||
//=========================================================================
|
//=========================================================================
|
||||||
// Worker thread
|
// Worker thread
|
||||||
|
|
||||||
template <> void VerilatedTrace<VL_DERIVED_T>::workerThreadMain() {
|
template <> void VerilatedTrace<VL_DERIVED_T>::offloadWorkerThreadMain() {
|
||||||
bool shutdown = false;
|
bool shutdown = false;
|
||||||
|
|
||||||
do {
|
do {
|
||||||
uint32_t* const bufferp = m_buffersToWorker.get();
|
uint32_t* const bufferp = m_offloadBuffersToWorker.get();
|
||||||
|
|
||||||
VL_TRACE_THREAD_DEBUG("");
|
VL_TRACE_OFFLOAD_DEBUG("");
|
||||||
VL_TRACE_THREAD_DEBUG("Got buffer: " << bufferp);
|
VL_TRACE_OFFLOAD_DEBUG("Got buffer: " << bufferp);
|
||||||
|
|
||||||
const uint32_t* readp = bufferp;
|
const uint32_t* readp = bufferp;
|
||||||
|
|
||||||
@ -139,53 +139,53 @@ template <> void VerilatedTrace<VL_DERIVED_T>::workerThreadMain() {
|
|||||||
switch (cmd & 0xF) {
|
switch (cmd & 0xF) {
|
||||||
//===
|
//===
|
||||||
// CHG_* commands
|
// CHG_* commands
|
||||||
case VerilatedTraceCommand::CHG_BIT_0:
|
case VerilatedTraceOffloadCommand::CHG_BIT_0:
|
||||||
VL_TRACE_THREAD_DEBUG("Command CHG_BIT_0 " << top);
|
VL_TRACE_OFFLOAD_DEBUG("Command CHG_BIT_0 " << top);
|
||||||
chgBitImpl(oldp, 0);
|
chgBitImpl(oldp, 0);
|
||||||
continue;
|
continue;
|
||||||
case VerilatedTraceCommand::CHG_BIT_1:
|
case VerilatedTraceOffloadCommand::CHG_BIT_1:
|
||||||
VL_TRACE_THREAD_DEBUG("Command CHG_BIT_1 " << top);
|
VL_TRACE_OFFLOAD_DEBUG("Command CHG_BIT_1 " << top);
|
||||||
chgBitImpl(oldp, 1);
|
chgBitImpl(oldp, 1);
|
||||||
continue;
|
continue;
|
||||||
case VerilatedTraceCommand::CHG_CDATA:
|
case VerilatedTraceOffloadCommand::CHG_CDATA:
|
||||||
VL_TRACE_THREAD_DEBUG("Command CHG_CDATA " << top);
|
VL_TRACE_OFFLOAD_DEBUG("Command CHG_CDATA " << top);
|
||||||
// Bits stored in bottom byte of command
|
// Bits stored in bottom byte of command
|
||||||
chgCDataImpl(oldp, *readp, top);
|
chgCDataImpl(oldp, *readp, top);
|
||||||
readp += 1;
|
readp += 1;
|
||||||
continue;
|
continue;
|
||||||
case VerilatedTraceCommand::CHG_SDATA:
|
case VerilatedTraceOffloadCommand::CHG_SDATA:
|
||||||
VL_TRACE_THREAD_DEBUG("Command CHG_SDATA " << top);
|
VL_TRACE_OFFLOAD_DEBUG("Command CHG_SDATA " << top);
|
||||||
// Bits stored in bottom byte of command
|
// Bits stored in bottom byte of command
|
||||||
chgSDataImpl(oldp, *readp, top);
|
chgSDataImpl(oldp, *readp, top);
|
||||||
readp += 1;
|
readp += 1;
|
||||||
continue;
|
continue;
|
||||||
case VerilatedTraceCommand::CHG_IDATA:
|
case VerilatedTraceOffloadCommand::CHG_IDATA:
|
||||||
VL_TRACE_THREAD_DEBUG("Command CHG_IDATA " << top);
|
VL_TRACE_OFFLOAD_DEBUG("Command CHG_IDATA " << top);
|
||||||
// Bits stored in bottom byte of command
|
// Bits stored in bottom byte of command
|
||||||
chgIDataImpl(oldp, *readp, top);
|
chgIDataImpl(oldp, *readp, top);
|
||||||
readp += 1;
|
readp += 1;
|
||||||
continue;
|
continue;
|
||||||
case VerilatedTraceCommand::CHG_QDATA:
|
case VerilatedTraceOffloadCommand::CHG_QDATA:
|
||||||
VL_TRACE_THREAD_DEBUG("Command CHG_QDATA " << top);
|
VL_TRACE_OFFLOAD_DEBUG("Command CHG_QDATA " << top);
|
||||||
// Bits stored in bottom byte of command
|
// Bits stored in bottom byte of command
|
||||||
chgQDataImpl(oldp, *reinterpret_cast<const QData*>(readp), top);
|
chgQDataImpl(oldp, *reinterpret_cast<const QData*>(readp), top);
|
||||||
readp += 2;
|
readp += 2;
|
||||||
continue;
|
continue;
|
||||||
case VerilatedTraceCommand::CHG_WDATA:
|
case VerilatedTraceOffloadCommand::CHG_WDATA:
|
||||||
VL_TRACE_THREAD_DEBUG("Command CHG_WDATA " << top);
|
VL_TRACE_OFFLOAD_DEBUG("Command CHG_WDATA " << top);
|
||||||
chgWDataImpl(oldp, readp, top);
|
chgWDataImpl(oldp, readp, top);
|
||||||
readp += VL_WORDS_I(top);
|
readp += VL_WORDS_I(top);
|
||||||
continue;
|
continue;
|
||||||
case VerilatedTraceCommand::CHG_DOUBLE:
|
case VerilatedTraceOffloadCommand::CHG_DOUBLE:
|
||||||
VL_TRACE_THREAD_DEBUG("Command CHG_DOUBLE " << top);
|
VL_TRACE_OFFLOAD_DEBUG("Command CHG_DOUBLE " << top);
|
||||||
chgDoubleImpl(oldp, *reinterpret_cast<const double*>(readp));
|
chgDoubleImpl(oldp, *reinterpret_cast<const double*>(readp));
|
||||||
readp += 2;
|
readp += 2;
|
||||||
continue;
|
continue;
|
||||||
|
|
||||||
//===
|
//===
|
||||||
// Rare commands
|
// Rare commands
|
||||||
case VerilatedTraceCommand::TIME_CHANGE:
|
case VerilatedTraceOffloadCommand::TIME_CHANGE:
|
||||||
VL_TRACE_THREAD_DEBUG("Command TIME_CHANGE " << top);
|
VL_TRACE_OFFLOAD_DEBUG("Command TIME_CHANGE " << top);
|
||||||
readp -= 1; // No code in this command, undo increment
|
readp -= 1; // No code in this command, undo increment
|
||||||
emitTimeChange(*reinterpret_cast<const uint64_t*>(readp));
|
emitTimeChange(*reinterpret_cast<const uint64_t*>(readp));
|
||||||
readp += 2;
|
readp += 2;
|
||||||
@ -193,16 +193,16 @@ template <> void VerilatedTrace<VL_DERIVED_T>::workerThreadMain() {
|
|||||||
|
|
||||||
//===
|
//===
|
||||||
// Commands ending this buffer
|
// Commands ending this buffer
|
||||||
case VerilatedTraceCommand::END: VL_TRACE_THREAD_DEBUG("Command END"); break;
|
case VerilatedTraceOffloadCommand::END: VL_TRACE_OFFLOAD_DEBUG("Command END"); break;
|
||||||
case VerilatedTraceCommand::SHUTDOWN:
|
case VerilatedTraceOffloadCommand::SHUTDOWN:
|
||||||
VL_TRACE_THREAD_DEBUG("Command SHUTDOWN");
|
VL_TRACE_OFFLOAD_DEBUG("Command SHUTDOWN");
|
||||||
shutdown = true;
|
shutdown = true;
|
||||||
break;
|
break;
|
||||||
|
|
||||||
//===
|
//===
|
||||||
// Unknown command
|
// Unknown command
|
||||||
default: { // LCOV_EXCL_START
|
default: { // LCOV_EXCL_START
|
||||||
VL_TRACE_THREAD_DEBUG("Command UNKNOWN");
|
VL_TRACE_OFFLOAD_DEBUG("Command UNKNOWN");
|
||||||
VL_PRINTF_MT("Trace command: 0x%08x\n", cmd);
|
VL_PRINTF_MT("Trace command: 0x%08x\n", cmd);
|
||||||
VL_FATAL_MT(__FILE__, __LINE__, "", "Unknown trace command");
|
VL_FATAL_MT(__FILE__, __LINE__, "", "Unknown trace command");
|
||||||
break;
|
break;
|
||||||
@ -214,23 +214,23 @@ template <> void VerilatedTrace<VL_DERIVED_T>::workerThreadMain() {
|
|||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
VL_TRACE_THREAD_DEBUG("Returning buffer");
|
VL_TRACE_OFFLOAD_DEBUG("Returning buffer");
|
||||||
|
|
||||||
// Return buffer
|
// Return buffer
|
||||||
m_buffersFromWorker.put(bufferp);
|
m_offloadBuffersFromWorker.put(bufferp);
|
||||||
} while (VL_LIKELY(!shutdown));
|
} while (VL_LIKELY(!shutdown));
|
||||||
}
|
}
|
||||||
|
|
||||||
template <> void VerilatedTrace<VL_DERIVED_T>::shutdownWorker() {
|
template <> void VerilatedTrace<VL_DERIVED_T>::shutdownOffloadWorker() {
|
||||||
// If the worker thread is not running, done..
|
// If the worker thread is not running, done..
|
||||||
if (!m_workerThread) return;
|
if (!m_workerThread) return;
|
||||||
|
|
||||||
// Hand an buffer with a shutdown command to the worker thread
|
// Hand an buffer with a shutdown command to the worker thread
|
||||||
uint32_t* const bufferp = getTraceBuffer();
|
uint32_t* const bufferp = getOffloadBuffer();
|
||||||
bufferp[0] = VerilatedTraceCommand::SHUTDOWN;
|
bufferp[0] = VerilatedTraceOffloadCommand::SHUTDOWN;
|
||||||
m_buffersToWorker.put(bufferp);
|
m_offloadBuffersToWorker.put(bufferp);
|
||||||
// Wait for it to return
|
// Wait for it to return
|
||||||
waitForBuffer(bufferp);
|
waitForOffloadBuffer(bufferp);
|
||||||
// Join the thread and delete it
|
// Join the thread and delete it
|
||||||
m_workerThread->join();
|
m_workerThread->join();
|
||||||
m_workerThread.reset(nullptr);
|
m_workerThread.reset(nullptr);
|
||||||
@ -242,24 +242,24 @@ template <> void VerilatedTrace<VL_DERIVED_T>::shutdownWorker() {
|
|||||||
// Life cycle
|
// Life cycle
|
||||||
|
|
||||||
template <> void VerilatedTrace<VL_DERIVED_T>::closeBase() {
|
template <> void VerilatedTrace<VL_DERIVED_T>::closeBase() {
|
||||||
#ifdef VL_TRACE_THREADED
|
#ifdef VL_TRACE_OFFLOAD
|
||||||
shutdownWorker();
|
shutdownOffloadWorker();
|
||||||
while (m_numTraceBuffers) {
|
while (m_numOffloadBuffers) {
|
||||||
delete[] m_buffersFromWorker.get();
|
delete[] m_offloadBuffersFromWorker.get();
|
||||||
--m_numTraceBuffers;
|
--m_numOffloadBuffers;
|
||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
template <> void VerilatedTrace<VL_DERIVED_T>::flushBase() {
|
template <> void VerilatedTrace<VL_DERIVED_T>::flushBase() {
|
||||||
#ifdef VL_TRACE_THREADED
|
#ifdef VL_TRACE_OFFLOAD
|
||||||
// Hand an empty buffer to the worker thread
|
// Hand an empty buffer to the worker thread
|
||||||
uint32_t* const bufferp = getTraceBuffer();
|
uint32_t* const bufferp = getOffloadBuffer();
|
||||||
*bufferp = VerilatedTraceCommand::END;
|
*bufferp = VerilatedTraceOffloadCommand::END;
|
||||||
m_buffersToWorker.put(bufferp);
|
m_offloadBuffersToWorker.put(bufferp);
|
||||||
// Wait for it to be returned. As the processing is in-order,
|
// Wait for it to be returned. As the processing is in-order,
|
||||||
// this ensures all previous buffers have been processed.
|
// this ensures all previous buffers have been processed.
|
||||||
waitForBuffer(bufferp);
|
waitForOffloadBuffer(bufferp);
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -293,8 +293,8 @@ VerilatedTrace<VL_DERIVED_T>::VerilatedTrace()
|
|||||||
, m_timeUnit {
|
, m_timeUnit {
|
||||||
1e-9
|
1e-9
|
||||||
}
|
}
|
||||||
#ifdef VL_TRACE_THREADED
|
#ifdef VL_TRACE_OFFLOAD
|
||||||
, m_numTraceBuffers { 0 }
|
, m_numOffloadBuffers { 0 }
|
||||||
#endif
|
#endif
|
||||||
{
|
{
|
||||||
set_time_unit(Verilated::threadContextp()->timeunitString());
|
set_time_unit(Verilated::threadContextp()->timeunitString());
|
||||||
@ -306,7 +306,7 @@ template <> VerilatedTrace<VL_DERIVED_T>::~VerilatedTrace() {
|
|||||||
if (m_sigs_enabledp) VL_DO_CLEAR(delete[] m_sigs_enabledp, m_sigs_enabledp = nullptr);
|
if (m_sigs_enabledp) VL_DO_CLEAR(delete[] m_sigs_enabledp, m_sigs_enabledp = nullptr);
|
||||||
Verilated::removeFlushCb(VerilatedTrace<VL_DERIVED_T>::onFlush, this);
|
Verilated::removeFlushCb(VerilatedTrace<VL_DERIVED_T>::onFlush, this);
|
||||||
Verilated::removeExitCb(VerilatedTrace<VL_DERIVED_T>::onExit, this);
|
Verilated::removeExitCb(VerilatedTrace<VL_DERIVED_T>::onExit, this);
|
||||||
#ifdef VL_TRACE_THREADED
|
#ifdef VL_TRACE_OFFLOAD
|
||||||
closeBase();
|
closeBase();
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
@ -362,16 +362,17 @@ template <> void VerilatedTrace<VL_DERIVED_T>::traceInit() VL_MT_UNSAFE {
|
|||||||
Verilated::addFlushCb(VerilatedTrace<VL_DERIVED_T>::onFlush, this);
|
Verilated::addFlushCb(VerilatedTrace<VL_DERIVED_T>::onFlush, this);
|
||||||
Verilated::addExitCb(VerilatedTrace<VL_DERIVED_T>::onExit, this);
|
Verilated::addExitCb(VerilatedTrace<VL_DERIVED_T>::onExit, this);
|
||||||
|
|
||||||
#ifdef VL_TRACE_THREADED
|
#ifdef VL_TRACE_OFFLOAD
|
||||||
// Compute trace buffer size. we need to be able to store a new value for
|
// Compute offload buffer size. we need to be able to store a new value for
|
||||||
// each signal, which is 'nextCode()' entries after the init callbacks
|
// each signal, which is 'nextCode()' entries after the init callbacks
|
||||||
// above have been run, plus up to 2 more words of metadata per signal,
|
// above have been run, plus up to 2 more words of metadata per signal,
|
||||||
// plus fixed overhead of 1 for a termination flag and 3 for a time stamp
|
// plus fixed overhead of 1 for a termination flag and 3 for a time stamp
|
||||||
// update.
|
// update.
|
||||||
m_traceBufferSize = nextCode() + numSignals() * 2 + 4;
|
m_offloadBufferSize = nextCode() + numSignals() * 2 + 4;
|
||||||
|
|
||||||
// Start the worker thread
|
// Start the worker thread
|
||||||
m_workerThread.reset(new std::thread{&VerilatedTrace<VL_DERIVED_T>::workerThreadMain, this});
|
m_workerThread.reset(
|
||||||
|
new std::thread{&VerilatedTrace<VL_DERIVED_T>::offloadWorkerThreadMain, this});
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -477,19 +478,19 @@ template <> void VerilatedTrace<VL_DERIVED_T>::dump(uint64_t timeui) VL_MT_SAFE_
|
|||||||
if (!preChangeDump()) return;
|
if (!preChangeDump()) return;
|
||||||
}
|
}
|
||||||
|
|
||||||
#ifdef VL_TRACE_THREADED
|
#ifdef VL_TRACE_OFFLOAD
|
||||||
// Currently only incremental dumps run on the worker thread
|
// Currently only incremental dumps run on the worker thread
|
||||||
uint32_t* bufferp = nullptr;
|
uint32_t* bufferp = nullptr;
|
||||||
if (VL_LIKELY(!m_fullDump)) {
|
if (VL_LIKELY(!m_fullDump)) {
|
||||||
// Get the trace buffer we are about to fill
|
// Get the offload buffer we are about to fill
|
||||||
bufferp = getTraceBuffer();
|
bufferp = getOffloadBuffer();
|
||||||
m_traceBufferWritep = bufferp;
|
m_offloadBufferWritep = bufferp;
|
||||||
m_traceBufferEndp = bufferp + m_traceBufferSize;
|
m_offloadBufferEndp = bufferp + m_offloadBufferSize;
|
||||||
|
|
||||||
// Tell worker to update time point
|
// Tell worker to update time point
|
||||||
m_traceBufferWritep[0] = VerilatedTraceCommand::TIME_CHANGE;
|
m_offloadBufferWritep[0] = VerilatedTraceOffloadCommand::TIME_CHANGE;
|
||||||
*reinterpret_cast<uint64_t*>(m_traceBufferWritep + 1) = timeui;
|
*reinterpret_cast<uint64_t*>(m_offloadBufferWritep + 1) = timeui;
|
||||||
m_traceBufferWritep += 3;
|
m_offloadBufferWritep += 3;
|
||||||
} else {
|
} else {
|
||||||
// Update time point
|
// Update time point
|
||||||
flushBase();
|
flushBase();
|
||||||
@ -519,16 +520,16 @@ template <> void VerilatedTrace<VL_DERIVED_T>::dump(uint64_t timeui) VL_MT_SAFE_
|
|||||||
cbr.m_dumpCb(cbr.m_userp, self());
|
cbr.m_dumpCb(cbr.m_userp, self());
|
||||||
}
|
}
|
||||||
|
|
||||||
#ifdef VL_TRACE_THREADED
|
#ifdef VL_TRACE_OFFLOAD
|
||||||
if (VL_LIKELY(bufferp)) {
|
if (VL_LIKELY(bufferp)) {
|
||||||
// Mark end of the trace buffer we just filled
|
// Mark end of the offload buffer we just filled
|
||||||
*m_traceBufferWritep++ = VerilatedTraceCommand::END;
|
*m_offloadBufferWritep++ = VerilatedTraceOffloadCommand::END;
|
||||||
|
|
||||||
// Assert no buffer overflow
|
// Assert no buffer overflow
|
||||||
assert(m_traceBufferWritep - bufferp <= m_traceBufferSize);
|
assert(m_offloadBufferWritep - bufferp <= m_offloadBufferSize);
|
||||||
|
|
||||||
// Pass it to the worker thread
|
// Pass it to the worker thread
|
||||||
m_buffersToWorker.put(bufferp);
|
m_offloadBuffersToWorker.put(bufferp);
|
||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
@ -292,7 +292,7 @@ void VerilatedVcd::bufferResize(uint64_t minsize) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
void VerilatedVcd::bufferFlush() VL_MT_UNSAFE_ONE {
|
void VerilatedVcd::bufferFlush() VL_MT_UNSAFE_ONE {
|
||||||
// This function can be called from the trace thread
|
// This function can be called from the trace offload thread
|
||||||
// This function is on the flush() call path
|
// This function is on the flush() call path
|
||||||
// We add output data to m_writep.
|
// We add output data to m_writep.
|
||||||
// When it gets nearly full we dump it using this routine which calls write()
|
// When it gets nearly full we dump it using this routine which calls write()
|
||||||
|
@ -770,7 +770,7 @@ class EmitCTrace final : EmitCFunc {
|
|||||||
|
|
||||||
const uint32_t offset = (arrayindex < 0) ? 0 : (arrayindex * nodep->declp()->widthWords());
|
const uint32_t offset = (arrayindex < 0) ? 0 : (arrayindex * nodep->declp()->widthWords());
|
||||||
const uint32_t code = nodep->declp()->code() + offset;
|
const uint32_t code = nodep->declp()->code() + offset;
|
||||||
puts(v3Global.opt.trueTraceThreads() && !nodep->full() ? "(base+" : "(oldp+");
|
puts(v3Global.opt.useTraceOffloadThread() && !nodep->full() ? "(base+" : "(oldp+");
|
||||||
puts(cvtToStr(code - nodep->baseCode()));
|
puts(cvtToStr(code - nodep->baseCode()));
|
||||||
puts(",");
|
puts(",");
|
||||||
emitTraceValue(nodep, arrayindex);
|
emitTraceValue(nodep, arrayindex);
|
||||||
|
@ -71,7 +71,7 @@ public:
|
|||||||
of.puts("\n");
|
of.puts("\n");
|
||||||
of.puts("# Tracing threaded output mode? 0/1/N threads (from --trace-thread)\n");
|
of.puts("# Tracing threaded output mode? 0/1/N threads (from --trace-thread)\n");
|
||||||
of.puts("VM_TRACE_THREADS = ");
|
of.puts("VM_TRACE_THREADS = ");
|
||||||
of.puts(cvtToStr(v3Global.opt.trueTraceThreads()));
|
of.puts(cvtToStr(v3Global.opt.useTraceOffloadThread()));
|
||||||
of.puts("\n");
|
of.puts("\n");
|
||||||
of.puts("# Separate FST writer thread? 0/1 (from --trace-fst with --trace-thread > 0)\n");
|
of.puts("# Separate FST writer thread? 0/1 (from --trace-fst with --trace-thread > 0)\n");
|
||||||
of.puts("VM_TRACE_FST_WRITER_THREAD = ");
|
of.puts("VM_TRACE_FST_WRITER_THREAD = ");
|
||||||
|
@ -517,7 +517,7 @@ public:
|
|||||||
int traceMaxArray() const { return m_traceMaxArray; }
|
int traceMaxArray() const { return m_traceMaxArray; }
|
||||||
int traceMaxWidth() const { return m_traceMaxWidth; }
|
int traceMaxWidth() const { return m_traceMaxWidth; }
|
||||||
int traceThreads() const { return m_traceThreads; }
|
int traceThreads() const { return m_traceThreads; }
|
||||||
bool trueTraceThreads() const {
|
bool useTraceOffloadThread() const {
|
||||||
return traceThreads() == 0 ? 0 : traceThreads() - traceFormat().fst();
|
return traceThreads() == 0 ? 0 : traceThreads() - traceFormat().fst();
|
||||||
}
|
}
|
||||||
int unrollCount() const { return m_unrollCount; }
|
int unrollCount() const { return m_unrollCount; }
|
||||||
|
@ -520,7 +520,7 @@ private:
|
|||||||
"tracep->oldp(vlSymsp->__Vm_baseCode);\n");
|
"tracep->oldp(vlSymsp->__Vm_baseCode);\n");
|
||||||
} else {
|
} else {
|
||||||
// Change dump sub function
|
// Change dump sub function
|
||||||
if (v3Global.opt.trueTraceThreads()) {
|
if (v3Global.opt.useTraceOffloadThread()) {
|
||||||
addInitStr("const uint32_t base VL_ATTR_UNUSED = "
|
addInitStr("const uint32_t base VL_ATTR_UNUSED = "
|
||||||
"vlSymsp->__Vm_baseCode + "
|
"vlSymsp->__Vm_baseCode + "
|
||||||
+ cvtToStr(baseCode) + ";\n");
|
+ cvtToStr(baseCode) + ";\n");
|
||||||
|
Loading…
Reference in New Issue
Block a user