clusterlin: introduce CostModel class (preparation)

This parametrizes the cost model for the SFL algorithm with a separate
class. For now, the behavior of that class matches the naive cost
model, but it will be replaced with a more advanced one in a future
commit.

The reason for abstracting this out is that it makes the benchmarking
needed to construct such cost models easy: the algorithm can simply be
instantiated with a cost model class that tracks elapsed time instead.
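
As an illustration of that idea (a hypothetical sketch, not part of this
commit), a time-tracking cost model could look roughly as follows. The name
TimingCostModel is invented here, and only a representative pair of hooks is
shown; a real drop-in replacement would mirror every hook of the
SFLDefaultCostModel class introduced in the diff below.

#include <chrono>
#include <cstdint>

// Hypothetical sketch: accumulates wall-clock time spent in activations and
// deactivations, instead of counting updated dependencies.
class TimingCostModel
{
    using Clock = std::chrono::steady_clock;
    Clock::time_point m_begin{}; //!< Start time of the operation being measured.
    uint64_t m_total_ns{0}; //!< Total measured time, in nanoseconds.

    void Start() noexcept { m_begin = Clock::now(); }
    void Stop() noexcept
    {
        m_total_ns += std::chrono::duration_cast<std::chrono::nanoseconds>(Clock::now() - m_begin).count();
    }

public:
    inline void ActivateBegin() noexcept { Start(); }
    inline void ActivateEnd(int /*num_deps*/) noexcept { Stop(); }
    inline void DeactivateBegin() noexcept { Start(); }
    inline void DeactivateEnd(int /*num_deps*/) noexcept { Stop(); }
    // The remaining hooks (InitializeBegin/End, MergeChunksBegin/Mid/End, and
    // so on) would be added analogously, or as empty no-ops where timing is
    // not of interest.
    inline uint64_t GetCost() const noexcept { return m_total_ns; }
};

Such a model would then be selected through the new CostModel template
parameter, e.g. SpanningForestState<SetType, TimingCostModel>, and an
instance can be passed in through the constructor's new cost argument.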
Pieter Wuille 2026-01-24 19:02:15 -05:00 committed by Pieter Wuille
parent 5db78c84ad
commit 9e7129df29


@@ -472,6 +472,41 @@ concept StrongComparator =
* Linearize(), which just sorts by DepGraphIndex. */
using IndexTxOrder = std::compare_three_way;
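/** Default cost model for the SFL algorithm, charging a unit of cost per
 * updated transaction in activations and deactivations.
 *
 * Each *Begin() hook is invoked when the corresponding operation of the
 * algorithm starts, and the matching *End() hook when it completes, carrying
 * statistics about the work performed (numbers of transactions, dependencies,
 * chunks, or search steps). This default implementation reproduces the naive
 * accounting used so far: every activation or deactivation costs the number
 * of transactions in the affected chunk, which equals num_deps + 1 because
 * the active dependencies within a chunk form a spanning tree over its
 * transactions. All other hooks are no-ops. */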
class SFLDefaultCostModel
{
uint64_t m_cost{0};
public:
inline void InitializeBegin() noexcept {}
inline void InitializeEnd(int num_txns, int num_deps) noexcept {}
inline void GetLinearizationBegin() noexcept {}
inline void GetLinearizationEnd(int num_txns, int num_deps) noexcept {}
inline void MakeTopologicalBegin() noexcept {}
inline void MakeTopologicalEnd(int num_chunks, int num_steps) noexcept {}
inline void StartOptimizingBegin() noexcept {}
inline void StartOptimizingEnd(int num_chunks) noexcept {}
inline void ActivateBegin() noexcept {}
inline void ActivateEnd(int num_deps) noexcept { m_cost += num_deps + 1; }
inline void DeactivateBegin() noexcept {}
inline void DeactivateEnd(int num_deps) noexcept { m_cost += num_deps + 1; }
inline void MergeChunksBegin() noexcept {}
inline void MergeChunksMid(int num_txns) noexcept {}
inline void MergeChunksEnd(int num_steps) noexcept {}
inline void PickMergeCandidateBegin() noexcept {}
inline void PickMergeCandidateEnd(int num_steps) noexcept {}
inline void PickChunkToOptimizeBegin() noexcept {}
inline void PickChunkToOptimizeEnd(int num_steps) noexcept {}
inline void PickDependencyToSplitBegin() noexcept {}
inline void PickDependencyToSplitEnd(int num_txns) noexcept {}
inline void StartMinimizingBegin() noexcept {}
inline void StartMinimizingEnd(int num_chunks) noexcept {}
inline void MinimizeStepBegin() noexcept {}
inline void MinimizeStepMid(int num_txns) noexcept {}
inline void MinimizeStepEnd(bool split) noexcept {}
inline uint64_t GetCost() const noexcept { return m_cost; }
};
/** Class to represent the internal state of the spanning-forest linearization (SFL) algorithm.
*
* At all times, each dependency is marked as either "active" or "inactive". The subset of active
@@ -643,7 +678,7 @@ using IndexTxOrder = std::compare_three_way;
* - Within chunks, repeatedly pick a uniformly random transaction among those with no missing
* dependencies.
*/
template<typename SetType>
template<typename SetType, typename CostModel = SFLDefaultCostModel>
class SpanningForestState
{
private:
@@ -704,12 +739,12 @@ private:
*/
VecDeque<std::tuple<SetIdx, TxIdx, unsigned>> m_nonminimal_chunks;
/** The number of updated transactions in activations/deactivations. */
uint64_t m_cost{0};
/** The DepGraph we are trying to linearize. */
const DepGraph<SetType>& m_depgraph;
/** Accounting for the cost of this computation. */
CostModel m_cost;
/** Pick a random transaction within a set (which must be non-empty). */
TxIdx PickRandomTx(const SetType& tx_idxs) noexcept
{
@@ -741,6 +776,7 @@ private:
* already, active. Returns the merged chunk idx. */
SetIdx Activate(TxIdx parent_idx, TxIdx child_idx) noexcept
{
m_cost.ActivateBegin();
// Gather and check information about the parent and child transactions.
auto& parent_data = m_tx_data[parent_idx];
auto& child_data = m_tx_data[child_idx];
@@ -794,7 +830,6 @@ private:
}
// Merge top_info into bottom_info, which becomes the merged chunk.
bottom_info |= top_info;
m_cost += bottom_info.transactions.Count();
// Compute merged sets of reachable transactions from the new chunk, based on the input
// chunks' reachable sets.
m_reachable[child_chunk_idx].first |= m_reachable[parent_chunk_idx].first;
@@ -806,6 +841,7 @@ private:
parent_data.active_children.Set(child_idx);
m_chunk_idxs.Reset(parent_chunk_idx);
// Return the newly merged chunk.
m_cost.ActivateEnd(/*num_deps=*/bottom_info.transactions.Count() - 1);
return child_chunk_idx;
}
@@ -813,6 +849,7 @@ private:
* indexes. */
std::pair<SetIdx, SetIdx> Deactivate(TxIdx parent_idx, TxIdx child_idx) noexcept
{
m_cost.DeactivateBegin();
// Gather and check information about the parent transactions.
auto& parent_data = m_tx_data[parent_idx];
Assume(parent_data.children[child_idx]);
@@ -830,7 +867,7 @@ private:
// Remove the active dependency.
parent_data.active_children.Reset(child_idx);
m_chunk_idxs.Set(parent_chunk_idx);
m_cost += bottom_info.transactions.Count();
auto ntx = bottom_info.transactions.Count();
// Subtract the top_info from the bottom_info, as it will become the child chunk.
bottom_info -= top_info;
// See the comment above in Activate(). We perform the opposite operations here, removing
@@ -863,6 +900,7 @@ private:
m_reachable[child_chunk_idx].first = bottom_parents - bottom_info.transactions;
m_reachable[child_chunk_idx].second = bottom_children - bottom_info.transactions;
// Return the two new set idxs.
m_cost.DeactivateEnd(/*num_deps=*/ntx - 1);
return {parent_chunk_idx, child_chunk_idx};
}
@@ -870,6 +908,7 @@ private:
* index of the merged chunk. */
SetIdx MergeChunks(SetIdx top_idx, SetIdx bottom_idx) noexcept
{
m_cost.MergeChunksBegin();
Assume(m_chunk_idxs[top_idx]);
Assume(m_chunk_idxs[bottom_idx]);
auto& top_chunk_info = m_set_info[top_idx];
@@ -880,16 +919,22 @@ private:
auto& tx_data = m_tx_data[tx_idx];
num_deps += (tx_data.children & bottom_chunk_info.transactions).Count();
}
m_cost.MergeChunksMid(/*num_txns=*/top_chunk_info.transactions.Count());
Assume(num_deps > 0);
// Uniformly randomly pick one of them and activate it.
unsigned pick = m_rng.randrange(num_deps);
unsigned num_steps = 0;
for (auto tx_idx : top_chunk_info.transactions) {
++num_steps;
auto& tx_data = m_tx_data[tx_idx];
auto intersect = tx_data.children & bottom_chunk_info.transactions;
auto count = intersect.Count();
if (pick < count) {
for (auto child_idx : intersect) {
if (pick == 0) return Activate(tx_idx, child_idx);
if (pick == 0) {
m_cost.MergeChunksEnd(/*num_steps=*/num_steps);
return Activate(tx_idx, child_idx);
}
--pick;
}
Assume(false);
@@ -917,6 +962,7 @@ private:
template<bool DownWard>
SetIdx PickMergeCandidate(SetIdx chunk_idx) noexcept
{
m_cost.PickMergeCandidateBegin();
/** Information about the chunk. */
Assume(m_chunk_idxs[chunk_idx]);
auto& chunk_info = m_set_info[chunk_idx];
@@ -957,6 +1003,7 @@ private:
}
Assume(steps <= m_set_info.size());
m_cost.PickMergeCandidateEnd(/*num_steps=*/steps);
return best_other_chunk_idx;
}
@@ -1028,23 +1075,31 @@ private:
/** Determine the next chunk to optimize, or INVALID_SET_IDX if none. */
SetIdx PickChunkToOptimize() noexcept
{
m_cost.PickChunkToOptimizeBegin();
unsigned steps{0};
while (!m_suboptimal_chunks.empty()) {
++steps;
// Pop an entry from the potentially-suboptimal chunk queue.
SetIdx chunk_idx = m_suboptimal_chunks.front();
Assume(m_suboptimal_idxs[chunk_idx]);
m_suboptimal_idxs.Reset(chunk_idx);
m_suboptimal_chunks.pop_front();
if (m_chunk_idxs[chunk_idx]) return chunk_idx;
if (m_chunk_idxs[chunk_idx]) {
m_cost.PickChunkToOptimizeEnd(/*num_steps=*/steps);
return chunk_idx;
}
// If what was popped is not currently a chunk, continue. This may
// happen when a split chunk merges in Improve() with one or more existing chunks that
// are themselves on the suboptimal queue already.
}
m_cost.PickChunkToOptimizeEnd(/*num_steps=*/steps);
return INVALID_SET_IDX;
}
/** Find a (parent, child) dependency to deactivate in chunk_idx, or (-1, -1) if none. */
std::pair<TxIdx, TxIdx> PickDependencyToSplit(SetIdx chunk_idx) noexcept
{
m_cost.PickDependencyToSplitBegin();
Assume(m_chunk_idxs[chunk_idx]);
auto& chunk_info = m_set_info[chunk_idx];
@@ -1071,21 +1126,24 @@ private:
candidate_tiebreak = tiebreak;
}
}
m_cost.PickDependencyToSplitEnd(/*num_txns=*/chunk_info.transactions.Count());
return candidate_dep;
}
public:
/** Construct a spanning forest for the given DepGraph, with every transaction in its own chunk
* (not topological). */
explicit SpanningForestState(const DepGraph<SetType>& depgraph LIFETIMEBOUND, uint64_t rng_seed) noexcept :
m_rng(rng_seed), m_depgraph(depgraph)
explicit SpanningForestState(const DepGraph<SetType>& depgraph LIFETIMEBOUND, uint64_t rng_seed, const CostModel& cost = CostModel{}) noexcept :
m_rng(rng_seed), m_depgraph(depgraph), m_cost(cost)
{
m_cost.InitializeBegin();
m_transaction_idxs = depgraph.Positions();
auto num_transactions = m_transaction_idxs.Count();
m_tx_data.resize(depgraph.PositionRange());
m_set_info.resize(num_transactions);
m_reachable.resize(num_transactions);
size_t num_chunks = 0;
size_t num_deps = 0;
for (auto tx_idx : m_transaction_idxs) {
// Fill in transaction data.
auto& tx_data = m_tx_data[tx_idx];
@@ -1093,6 +1151,7 @@ public:
for (auto parent_idx : tx_data.parents) {
m_tx_data[parent_idx].children.Set(tx_idx);
}
num_deps += tx_data.parents.Count();
// Create a singleton chunk for it.
tx_data.chunk_idx = num_chunks;
m_set_info[num_chunks++] = SetInfo(depgraph, tx_idx);
@@ -1106,6 +1165,7 @@ public:
Assume(num_chunks == num_transactions);
// Mark all chunk sets as chunks.
m_chunk_idxs = SetType::Fill(num_chunks);
m_cost.InitializeEnd(/*num_txns=*/num_chunks, /*num_deps=*/num_deps);
}
/** Load an existing linearization. Must be called immediately after constructor. The result is
@@ -1127,6 +1187,7 @@ public:
/** Make state topological. Can be called after constructing, or after LoadLinearization. */
void MakeTopological() noexcept
{
m_cost.MakeTopologicalBegin();
Assume(m_suboptimal_chunks.empty());
/** What direction to initially merge chunks in; one of the two directions is enough. This
* is sufficient because if a non-topological inactive dependency exists between two
@@ -1147,7 +1208,10 @@ public:
std::swap(m_suboptimal_chunks.back(), m_suboptimal_chunks[j]);
}
}
unsigned chunks = m_chunk_idxs.Count();
unsigned steps = 0;
while (!m_suboptimal_chunks.empty()) {
++steps;
// Pop an entry from the potentially-suboptimal chunk queue.
SetIdx chunk_idx = m_suboptimal_chunks.front();
m_suboptimal_chunks.pop_front();
@@ -1187,11 +1251,13 @@ public:
}
}
}
m_cost.MakeTopologicalEnd(/*num_chunks=*/chunks, /*num_steps=*/steps);
}
/** Initialize the data structure for optimization. It must be topological already. */
void StartOptimizing() noexcept
{
m_cost.StartOptimizingBegin();
Assume(m_suboptimal_chunks.empty());
// Mark chunks suboptimal.
m_suboptimal_idxs = m_chunk_idxs;
@@ -1203,6 +1269,7 @@ public:
std::swap(m_suboptimal_chunks.back(), m_suboptimal_chunks[j]);
}
}
m_cost.StartOptimizingEnd(/*num_chunks=*/m_suboptimal_chunks.size());
}
/** Try to improve the forest. Returns false if it is optimal, true otherwise. */
@@ -1228,6 +1295,7 @@ public:
* to be optimal. OptimizeStep() cannot be called anymore afterwards. */
void StartMinimizing() noexcept
{
m_cost.StartMinimizingBegin();
m_nonminimal_chunks.clear();
m_nonminimal_chunks.reserve(m_transaction_idxs.Count());
// Gather all chunks, and for each, add it with a random pivot in it, and a random initial
@@ -1241,6 +1309,7 @@ public:
std::swap(m_nonminimal_chunks.back(), m_nonminimal_chunks[j]);
}
}
m_cost.StartMinimizingEnd(/*num_chunks=*/m_nonminimal_chunks.size());
}
/** Try to reduce a chunk's size. Returns false if all chunks are minimal, true otherwise. */
@@ -1248,6 +1317,7 @@ public:
{
// If the queue of potentially-non-minimal chunks is empty, we are done.
if (m_nonminimal_chunks.empty()) return false;
m_cost.MinimizeStepBegin();
// Pop an entry from the potentially-non-minimal chunk queue.
auto [chunk_idx, pivot_idx, flags] = m_nonminimal_chunks.front();
m_nonminimal_chunks.pop_front();
@@ -1283,6 +1353,7 @@ public:
}
}
}
m_cost.MinimizeStepMid(/*num_txns=*/chunk_info.transactions.Count());
// If no dependencies have equal top and bottom set feerate, this chunk is minimal.
if (!have_any) return true;
// If all found dependencies have the pivot in the wrong place, try moving it in the other
@@ -1308,6 +1379,7 @@ public:
// Re-insert the chunk into the queue, in the same direction. Note that the chunk_idx
// will have changed.
m_nonminimal_chunks.emplace_back(merged_chunk_idx, pivot_idx, flags);
m_cost.MinimizeStepEnd(/*split=*/false);
} else {
// No self-merge happens, and thus we have found a way to split the chunk. Create two
// smaller chunks, and add them to the queue. The one that contains the current pivot
@@ -1328,6 +1400,7 @@ public:
if (m_rng.randbool()) {
std::swap(m_nonminimal_chunks.back(), m_nonminimal_chunks[m_nonminimal_chunks.size() - 2]);
}
m_cost.MinimizeStepEnd(/*split=*/true);
}
return true;
}
@@ -1348,8 +1421,9 @@ public:
* - smallest tx size first
* - the lowest transaction, by fallback_order, first
*/
std::vector<DepGraphIndex> GetLinearization(const StrongComparator<DepGraphIndex> auto& fallback_order) const noexcept
std::vector<DepGraphIndex> GetLinearization(const StrongComparator<DepGraphIndex> auto& fallback_order) noexcept
{
m_cost.GetLinearizationBegin();
/** The output linearization. */
std::vector<DepGraphIndex> ret;
ret.reserve(m_set_info.size());
@@ -1367,9 +1441,11 @@ public:
* tx feerate (high to low), tx size (small to large), and fallback order. */
std::vector<TxIdx> ready_tx;
// Populate chunk_deps and tx_deps.
unsigned num_deps{0};
for (TxIdx chl_idx : m_transaction_idxs) {
const auto& chl_data = m_tx_data[chl_idx];
tx_deps[chl_idx] = chl_data.parents.Count();
num_deps += tx_deps[chl_idx];
auto chl_chunk_idx = chl_data.chunk_idx;
auto& chl_chunk_info = m_set_info[chl_chunk_idx];
chunk_deps[chl_chunk_idx] += (chl_data.parents - chl_chunk_info.transactions).Count();
@@ -1483,6 +1559,7 @@ public:
}
}
Assume(ret.size() == m_set_info.size());
m_cost.GetLinearizationEnd(/*num_txns=*/m_set_info.size(), /*num_deps=*/num_deps);
return ret;
}
@@ -1510,7 +1587,7 @@ public:
}
/** Determine how much work was performed so far. */
uint64_t GetCost() const noexcept { return m_cost; }
uint64_t GetCost() const noexcept { return m_cost.GetCost(); }
/** Verify internal consistency of the data structure. */
void SanityCheck() const