forked from github/verilator
b1b5b5dfe2
The --prof-threads option has been split into two independent options: 1. --prof-exec, for collecting verilator_gantt and other execution related profiling data, and 2. --prof-pgo, for collecting data needed for PGO The implementation of execution profiling is extricated from VlThreadPool and is now a separate class VlExecutionProfiler. This means --prof-exec can now be used for single-threaded models (though it does not measure a lot of things just yet). For consistency VerilatedProfiler is renamed VlPgoProfiler. Both VlExecutionProfiler and VlPgoProfiler are in verilated_profiler.{h/cpp}, but can be used completely independently. Also re-worked the execution profile format so it now only emits events without holding onto any temporaries. This is in preparation for some future optimizations that would be hindered by the introduction of function locals via AstText. Also removed the Barrier event. Clearing the profile buffers is not notably more expensive as the profiling records are trivially destructible.
259 lines
2.6 KiB
Plaintext
259 lines
2.6 KiB
Plaintext
$version Generated by verilator_gantt $end
|
|
$timescale 1ns $end
|
|
|
|
$scope module gantt $end
|
|
$scope module Stats $end
|
|
$var wire 32 vf measured_parallelism [31:0] $end
|
|
$var wire 32 v10 predicted_parallelism [31:0] $end
|
|
$upscope $end
|
|
$scope module cpus $end
|
|
$var wire 32 v5 cpu10_thread [31:0] $end
|
|
$var wire 32 v1 cpu19_thread [31:0] $end
|
|
$upscope $end
|
|
$scope module evals $end
|
|
$var wire 32 vb eval [31:0] $end
|
|
$var wire 32 vc eval_loop [31:0] $end
|
|
$upscope $end
|
|
$scope module measured_threads $end
|
|
$var wire 32 v0 thread0_mtask [31:0] $end
|
|
$var wire 32 v4 thread1_mtask [31:0] $end
|
|
$upscope $end
|
|
$scope module mtasks $end
|
|
$var wire 32 v3 mtask10_cpu [31:0] $end
|
|
$var wire 32 va mtask11_cpu [31:0] $end
|
|
$var wire 32 v6 mtask5_cpu [31:0] $end
|
|
$var wire 32 v2 mtask6_cpu [31:0] $end
|
|
$var wire 32 v7 mtask7_cpu [31:0] $end
|
|
$var wire 32 v8 mtask8_cpu [31:0] $end
|
|
$var wire 32 v9 mtask9_cpu [31:0] $end
|
|
$upscope $end
|
|
$scope module predicted_threads $end
|
|
$var wire 32 vd predicted_thread0_mtask [31:0] $end
|
|
$var wire 32 ve predicted_thread1_mtask [31:0] $end
|
|
$upscope $end
|
|
$upscope $end
|
|
$enddefinitions $end
|
|
|
|
#0
|
|
bz v0
|
|
bz v1
|
|
bz v2
|
|
bz v3
|
|
bz v4
|
|
bz v5
|
|
bz v6
|
|
bz v7
|
|
bz v8
|
|
bz v9
|
|
bz va
|
|
bz vb
|
|
bz vc
|
|
bz vd
|
|
bz ve
|
|
b0 vf
|
|
b0 v10
|
|
#595
|
|
b1 vb
|
|
#945
|
|
b1 vc
|
|
b110 vd
|
|
b101 ve
|
|
b10 v10
|
|
#2429
|
|
bz vd
|
|
b111 ve
|
|
b1 v10
|
|
#2695
|
|
b110 v0
|
|
b0 v1
|
|
b10011 v2
|
|
b1 vf
|
|
#2905
|
|
bz v0
|
|
bz v1
|
|
bz v2
|
|
b0 vf
|
|
#3914
|
|
b1000 ve
|
|
b1 v10
|
|
#5495
|
|
b101 v4
|
|
b1 v5
|
|
b1010 v6
|
|
b1 vf
|
|
#6090
|
|
bz v4
|
|
bz v5
|
|
bz v6
|
|
b0 vf
|
|
#6300
|
|
b111 v4
|
|
b1 v5
|
|
b1010 v7
|
|
b1 vf
|
|
#6895
|
|
bz v4
|
|
bz v5
|
|
bz v7
|
|
b0 vf
|
|
#7490
|
|
b1000 v4
|
|
b1 v5
|
|
b1010 v8
|
|
b1 vf
|
|
#8540
|
|
bz v4
|
|
bz v5
|
|
bz v8
|
|
b0 vf
|
|
#9135
|
|
b1001 v4
|
|
b1 v5
|
|
b1010 v9
|
|
b1 vf
|
|
#9210
|
|
b1001 ve
|
|
b1 v10
|
|
#9695
|
|
b1010 v0
|
|
b0 v1
|
|
b10011 v3
|
|
b10 vf
|
|
#9730
|
|
bz v4
|
|
bz v5
|
|
bz v9
|
|
b1 vf
|
|
#9870
|
|
bz v0
|
|
bz v1
|
|
bz v3
|
|
b0 vf
|
|
#10255
|
|
b1011 v4
|
|
b1 v5
|
|
b1010 va
|
|
b1 vf
|
|
#10645
|
|
b1010 vd
|
|
b10 v10
|
|
#10695
|
|
b1011 ve
|
|
b10 v10
|
|
#11060
|
|
bz v4
|
|
bz v5
|
|
bz va
|
|
b0 vf
|
|
#12130
|
|
bz vd
|
|
b1 v10
|
|
#12180
|
|
bz vc
|
|
bz ve
|
|
b0 v10
|
|
#12250
|
|
bz vb
|
|
#13720
|
|
b10 vb
|
|
#14000
|
|
b10 vc
|
|
b110 vd
|
|
b101 ve
|
|
b10 v10
|
|
#15068
|
|
bz vd
|
|
b111 ve
|
|
b1 v10
|
|
#15610
|
|
b110 v0
|
|
b0 v1
|
|
b10011 v2
|
|
b1 vf
|
|
#15820
|
|
bz v0
|
|
bz v1
|
|
bz v2
|
|
b0 vf
|
|
#16137
|
|
b1000 ve
|
|
b1 v10
|
|
#18375
|
|
b101 v4
|
|
b1 v5
|
|
b1010 v6
|
|
b1 vf
|
|
#18970
|
|
bz v4
|
|
bz v5
|
|
bz v6
|
|
b0 vf
|
|
#19145
|
|
b111 v4
|
|
b1 v5
|
|
b1010 v7
|
|
b1 vf
|
|
#19320
|
|
bz v4
|
|
bz v5
|
|
bz v7
|
|
b0 vf
|
|
#19670
|
|
b1000 v4
|
|
b1 v5
|
|
b1010 v8
|
|
b1 vf
|
|
#19810
|
|
bz v4
|
|
bz v5
|
|
bz v8
|
|
b0 vf
|
|
#19947
|
|
b1001 ve
|
|
b1 v10
|
|
#20650
|
|
b1001 v4
|
|
b1 v5
|
|
b1010 v9
|
|
b1 vf
|
|
#20720
|
|
bz v4
|
|
bz v5
|
|
bz v9
|
|
b0 vf
|
|
#20980
|
|
b1010 vd
|
|
b10 v10
|
|
#21016
|
|
b1011 ve
|
|
b10 v10
|
|
#21140
|
|
b1011 v4
|
|
b1 v5
|
|
b1010 va
|
|
b1 vf
|
|
#21245
|
|
bz v4
|
|
bz v5
|
|
bz va
|
|
b0 vf
|
|
#21700
|
|
b1010 v0
|
|
b0 v1
|
|
b10011 v3
|
|
b1 vf
|
|
#21875
|
|
bz v0
|
|
bz v1
|
|
bz v3
|
|
b0 vf
|
|
#22049
|
|
bz vd
|
|
b1 v10
|
|
#22085
|
|
bz vc
|
|
bz ve
|
|
b0 v10
|
|
#22330
|
|
bz vb
|