Skip to content

Commit

Permalink
clusterlin: improve rechunking in LinearizationChunking (optimization)
Browse files Browse the repository at this point in the history
When the transactions being marked done exactly match the first chunk of
what remains of the linearization, we can just remember to skip that
chunk instead of computing a full rechunking.

Further, chop off prefixes of the input linearization that are already done,
so they don't need to be reconsidered for further rechunkings.
  • Loading branch information
sipa committed Aug 1, 2024
1 parent 04d7a04 commit bbcee5a
Showing 1 changed file with 29 additions and 9 deletions.
38 changes: 29 additions & 9 deletions src/cluster_linearize.h
Original file line number Diff line number Diff line change
Expand Up @@ -310,22 +310,30 @@ class LinearizationChunking
/** The depgraph this linearization is for. */
const DepGraph<SetType>& m_depgraph;

/** The linearization we started from. */
/** The linearization we started from, possibly with removed prefix stripped. */
Span<const ClusterIndex> m_linearization;

/** Chunk sets and their feerates, of what remains of the linearization. */
std::vector<SetInfo<SetType>> m_chunks;

/** How large a prefix of m_chunks corresponds to removed transactions. */
ClusterIndex m_chunks_skip{0};

/** Which transactions remain in the linearization. */
SetType m_todo;

/** Fill the m_chunks variable. */
/** Fill the m_chunks variable, and remove the done prefix of m_linearization. */
void BuildChunks() noexcept
{
// Caller must clear m_chunks.
Assume(m_chunks.empty());

// Iterate over the entries in m_linearization. This is effectively the same
// Chop off the initial part of m_linearization that is already done.
while (!m_linearization.empty() && !m_todo[m_linearization.front()]) {
m_linearization = m_linearization.subspan(1);
}

// Iterate over the remaining entries in m_linearization. This is effectively the same
// algorithm as ChunkLinearization, but supports skipping parts of the linearization and
// keeps track of the sets themselves instead of just their feerates.
for (auto idx : m_linearization) {
Expand Down Expand Up @@ -355,13 +363,13 @@ class LinearizationChunking
}

/** Determine how many chunks remain in the linearization. */
ClusterIndex NumChunksLeft() const noexcept { return m_chunks.size(); }
ClusterIndex NumChunksLeft() const noexcept { return m_chunks.size() - m_chunks_skip; }

/** Access a chunk. Chunk 0 is the highest-feerate prefix of what remains. */
const SetInfo<SetType>& GetChunk(ClusterIndex n) const noexcept
{
Assume(n < m_chunks.size());
return m_chunks[n];
Assume(n + m_chunks_skip < m_chunks.size());
return m_chunks[n + m_chunks_skip];
}

/** Remove some subset of transactions from the linearization. */
Expand All @@ -370,9 +378,21 @@ class LinearizationChunking
Assume(subset.Any());
Assume(subset.IsSubsetOf(m_todo));
m_todo -= subset;
// Rechunk what remains of m_linearization.
m_chunks.clear();
BuildChunks();
if (GetChunk(0).transactions == subset) {
// If the newly done transactions exactly match the first chunk of the remainder of
// the linearization, we do not need to rechunk; just remember to skip one
// additional chunk.
++m_chunks_skip;
// With subset marked done, some prefix of m_linearization will be done now. How long
// that prefix is depends on how many done elements were interspersed with subset,
// but at least as many transactions as there are in subset.
m_linearization = m_linearization.subspan(subset.Count());
} else {
// Otherwise rechunk what remains of m_linearization.
m_chunks.clear();
m_chunks_skip = 0;
BuildChunks();
}
}

/** Find the shortest intersection between subset and the prefixes of remaining chunks
Expand Down

0 comments on commit bbcee5a

Please sign in to comment.