Add VerilatedContext::useNumaAssign and set on threads() call (#6954)

2026-01-28 00:05:28 +08:00 · 2026-01-28 00:05:28 +08:00 · 5b84635bde
parent 7c6c6a684b
commit 5b84635bde
6 changed files with 120 additions and 3 deletions
--- a/include/verilated.cpp
+++ b/include/verilated.cpp
@ -2816,6 +2816,7 @@ void VerilatedContext::threads(unsigned n) {
            "%Error: Cannot set simulation threads after the thread pool has been created.");
    }

+    m_useNumaAssign = true;
    if (m_threads == n) return;  // To avoid unnecessary warnings
    m_threads = n;
    const unsigned threadsAvailableToProcess = VlOs::getProcessDefaultParallelism();
@ -2826,6 +2827,8 @@ void VerilatedContext::threads(unsigned n) {
    }
 }

+void VerilatedContext::useNumaAssign(bool flag) { m_useNumaAssign = flag; }
+
 void VerilatedContext::commandArgs(int argc, const char** argv) VL_MT_SAFE_EXCLUDES(m_argMutex) {
    // Not locking m_argMutex here, it is done in impp()->commandArgsAddGuts
    // m_argMutex here is the same as in impp()->commandArgsAddGuts;
--- a/include/verilated.h
+++ b/include/verilated.h
@ -433,6 +433,8 @@ protected:
    const std::unique_ptr<VerilatedContextImpData> m_impdatap;
    // Number of threads to use for simulation (size of m_threadPool + 1 for main thread)
    unsigned m_threads = VlOs::getProcessDefaultParallelism();
+    // Use numa automatic CPU-to-thread assignment
+    bool m_useNumaAssign = false;
    // Number of threads in added models
    unsigned m_threadsInModels = 0;
    // The thread pool shared by all models added to this context
@ -599,6 +601,13 @@ public:
    /// Can only be called before the thread pool is created (before first model is added).
    void threads(unsigned n);

+    /// Use numa automatic CPU-to-thread assignment.
+    bool useNumaAssign() const VL_MT_SAFE { return m_useNumaAssign; }
+    /// Set numa assignment of threads to cores
+    /// Defaults false; set true automatically when threads() called;
+    /// call this to override back to false if numa assignment not wanted.
+    void useNumaAssign(bool flag);
+
    /// Trace signals in models within the context; called by application code
    void trace(VerilatedTraceBaseC* tfp, int levels, int options = 0);
    /// Allow traces to at some point be enabled (disables some optimizations)
--- a/include/verilated_threads.cpp
+++ b/include/verilated_threads.cpp
@ -137,7 +137,7 @@ VlThreadPool::VlThreadPool(VerilatedContext* contextp, unsigned nThreads) {
        m_workers.push_back(new VlWorkerThread{contextp});
        m_unassignedWorkers.push(i);
    }
-    m_numaStatus = numaAssign();
+    m_numaStatus = numaAssign(contextp);
 }

 VlThreadPool::~VlThreadPool() {
@ -145,8 +145,9 @@ VlThreadPool::~VlThreadPool() {
    for (auto& i : m_workers) delete i;
 }

-std::string VlThreadPool::numaAssign() {
+std::string VlThreadPool::numaAssign(VerilatedContext* contextp) {
 #if defined(__linux) || defined(CPU_ZERO) || defined(VL_CPPCHECK)  // Linux-like pthreads
+    if (contextp && !contextp->useNumaAssign()) { return "NUMA assignment not requested"; }
    std::string numa_strategy = VlOs::getenvStr("VERILATOR_NUMA_STRATEGY", "default");
    if (numa_strategy == "none") {
        return "no NUMA assignment requested";
--- a/include/verilated_threads.h
+++ b/include/verilated_threads.h
@ -254,7 +254,7 @@ public:
 private:
    VL_UNCOPYABLE(VlThreadPool);

-    std::string numaAssign();
+    std::string numaAssign(VerilatedContext* contextp);
 };

 #endif
--- a/test_regress/t/t_gantt_numa_default_threads.cpp
+++ b/test_regress/t/t_gantt_numa_default_threads.cpp
@ -0,0 +1,53 @@
+// -*- mode: C++; c-file-style: "cc-mode" -*-
+//*************************************************************************
+//
+// Copyright 2026 by Wilson Snyder. This program is free software; you can
+// redistribute it and/or modify it under the terms of either the GNU
+// Lesser General Public License Version 3 or the Perl Artistic License
+// Version 2.0.
+// SPDX-License-Identifier: LGPL-3.0-only OR Artistic-2.0
+//
+//*************************************************************************
+
+// Generated header
+#include "Vt_gantt_numa_default_threads.h"
+// General headers
+#include "verilated.h"
+
+#include "TestCheck.h"
+
+int errors = 0;
+
+std::unique_ptr<Vt_gantt_numa_default_threads> topp;
+
+int main(int argc, char** argv) {
+    vluint64_t sim_time = 1100;
+    const std::unique_ptr<VerilatedContext> contextp{new VerilatedContext};
+    contextp->debug(0);
+    contextp->commandArgs(argc, argv);
+    srand48(5);
+    TEST_CHECK_EQ(contextp->useNumaAssign(), false);
+    contextp->threads(3);
+    TEST_CHECK_EQ(contextp->useNumaAssign(), true);
+    contextp->useNumaAssign(false);
+    TEST_CHECK_EQ(contextp->useNumaAssign(), false);
+    topp.reset(new VM_PREFIX{"top"});
+
+    topp->clk = 0;
+    topp->eval();
+    { contextp->timeInc(10); }
+
+    while ((contextp->time() < sim_time) && !contextp->gotFinish()) {
+        topp->eval();
+        topp->clk = !topp->clk;
+        topp->eval();
+        contextp->timeInc(5);
+    }
+    if (!contextp->gotFinish()) {
+        vl_fatal(__FILE__, __LINE__, "main", "%Error: Timeout; never got a $finish");
+    }
+    topp->final();
+
+    topp.reset();
+    return (errors ? 10 : 0);
+}
--- a/test_regress/t/t_gantt_numa_default_threads.py
+++ b/test_regress/t/t_gantt_numa_default_threads.py
@ -0,0 +1,51 @@
+#!/usr/bin/env python3
+# DESCRIPTION: Verilator: Verilog Test driver/expect definition
+#
+# Copyright 2026 by Wilson Snyder. This program is free software; you
+# can redistribute it and/or modify it under the terms of either the GNU
+# Lesser General Public License Version 3 or the Perl Artistic License
+# Version 2.0.
+# SPDX-License-Identifier: LGPL-3.0-only OR Artistic-2.0
+
+import os
+import sys
+import vltest_bootstrap
+
+test.scenarios('vltmt')
+
+test.top_filename = "t/t_gantt.v"
+test.pli_filename = "t/t_gantt_numa_default_threads.cpp"
+
+# Require enough cores so default thread count stays >= model threads
+# (we don't call contextp->threads in this test)
+test.skip_if_too_few_cores()
+
+test.compile(
+    make_main=False,
+    verilator_flags2=[
+        "--prof-exec",
+        "--exe",
+        test.pli_filename,
+        test.t_dir + "/t_gantt_c.cpp",
+    ],
+    threads=test.get_default_vltmt_threads,
+)
+
+test.execute(all_run_flags=[
+    "+verilator+prof+exec+start+2",
+    " +verilator+prof+exec+window+2",
+    " +verilator+prof+exec+file+" + test.obj_dir + "/profile_exec.dat",
+])
+
+gantt_log = test.obj_dir + "/gantt_default_threads.log"
+test.run(cmd=[
+    os.environ["VERILATOR_ROOT"] + "/bin/verilator_gantt",
+    "--no-vcd",
+    test.obj_dir + "/profile_exec.dat",
+    "| tee " + gantt_log,
+])
+
+if sys.platform != "darwin":
+    test.file_grep(gantt_log, r"NUMA status += NUMA assignment not requested")
+
+test.passes()