Skip to content

Commit 0606e66

Browse files
committedOct 7, 2024
clusterlin: add DepGraph::RemoveTransactions and support for holes in DepGraph
This commits introduces support in DepGraph for the transaction positions to be non-continuous. Specifically, it adds: * DepGraph::RemoveTransactions which removes 0 or more positions from a DepGraph. * DepGraph::Positions() to get a set of which positions are in use. * DepGraph::PositionRange() to get the highest used position in a DepGraph + 1. In addition, it extends the DepGraphFormatter format to support holes in a compatible way (it serializes non-holey DepGraphs identically to the old code, and deserializes them the same way)
1 parent 75b5d42 commit 0606e66

7 files changed

+267
-79
lines changed
 

‎src/cluster_linearize.h

+98-22
Original file line numberDiff line numberDiff line change
@@ -57,9 +57,20 @@ class DepGraph
5757
/** Data for each transaction, in the same order as the Cluster it was constructed from. */
5858
std::vector<Entry> entries;
5959

60+
/** Which positions are used. */
61+
SetType m_used;
62+
6063
public:
6164
/** Equality operator (primarily for testing purposes). */
62-
friend bool operator==(const DepGraph&, const DepGraph&) noexcept = default;
65+
friend bool operator==(const DepGraph& a, const DepGraph& b) noexcept
66+
{
67+
if (a.m_used != b.m_used) return false;
68+
// Only compare the used positions within the entries vector.
69+
for (auto idx : a.m_used) {
70+
if (a.entries[idx] != b.entries[idx]) return false;
71+
}
72+
return true;
73+
}
6374

6475
// Default constructors.
6576
DepGraph() noexcept = default;
@@ -80,6 +91,7 @@ class DepGraph
8091
entries[i].ancestors = SetType::Singleton(i);
8192
entries[i].descendants = SetType::Singleton(i);
8293
}
94+
m_used = SetType::Fill(ntx);
8395
}
8496

8597
/** Construct a DepGraph object given a cluster.
@@ -97,24 +109,50 @@ class DepGraph
97109
}
98110

99111
/** Construct a DepGraph object given another DepGraph and a mapping from old to new.
112+
*
113+
* @param depgraph The original DepGraph that is being remapped.
114+
*
115+
* @param mapping A Span such that mapping[i] gives the position in the new DepGraph
116+
* for position i in the old depgraph. Its size must be equal to
117+
* depgraph.PositionRange(). The value of mapping[i] is ignored if
118+
* position i is a hole in depgraph (i.e., if !depgraph.Positions()[i]).
119+
*
120+
* @param pos_range The PositionRange() for the new DepGraph. It must equal the largest
121+
* value in mapping for any used position in depgraph plus 1, or 0 if
122+
* depgraph.TxCount() == 0.
100123
*
101124
* Complexity: O(N^2) where N=depgraph.TxCount().
102125
*/
103-
DepGraph(const DepGraph<SetType>& depgraph, Span<const ClusterIndex> mapping) noexcept : DepGraph(depgraph.TxCount())
126+
DepGraph(const DepGraph<SetType>& depgraph, Span<const ClusterIndex> mapping, ClusterIndex pos_range) noexcept : entries(pos_range)
104127
{
105-
Assert(mapping.size() == depgraph.TxCount());
106-
for (ClusterIndex i = 0; i < depgraph.TxCount(); ++i) {
128+
Assume(mapping.size() == depgraph.PositionRange());
129+
Assume((pos_range == 0) == (depgraph.TxCount() == 0));
130+
for (ClusterIndex i : depgraph.Positions()) {
131+
auto new_idx = mapping[i];
132+
Assume(new_idx < pos_range);
133+
// Add transaction.
134+
entries[new_idx].ancestors = SetType::Singleton(new_idx);
135+
entries[new_idx].descendants = SetType::Singleton(new_idx);
136+
m_used.Set(new_idx);
107137
// Fill in fee and size.
108-
entries[mapping[i]].feerate = depgraph.entries[i].feerate;
138+
entries[new_idx].feerate = depgraph.entries[i].feerate;
139+
}
140+
for (ClusterIndex i : depgraph.Positions()) {
109141
// Fill in dependencies by mapping direct parents.
110142
SetType parents;
111143
for (auto j : depgraph.GetReducedParents(i)) parents.Set(mapping[j]);
112144
AddDependencies(parents, mapping[i]);
113145
}
146+
// Verify that the provided pos_range was correct (no unused positions at the end).
147+
Assume(m_used.None() ? (pos_range == 0) : (pos_range == m_used.Last() + 1));
114148
}
115149

150+
/** Get the set of transactions positions in use. Complexity: O(1). */
151+
const SetType& Positions() const noexcept { return m_used; }
152+
/** Get the range of positions in this DepGraph. All entries in Positions() are in [0, PositionRange() - 1]. */
153+
ClusterIndex PositionRange() const noexcept { return entries.size(); }
116154
/** Get the number of transactions in the graph. Complexity: O(1). */
117-
auto TxCount() const noexcept { return entries.size(); }
155+
auto TxCount() const noexcept { return m_used.Count(); }
118156
/** Get the feerate of a given transaction i. Complexity: O(1). */
119157
const FeeFrac& FeeRate(ClusterIndex i) const noexcept { return entries[i].feerate; }
120158
/** Get the mutable feerate of a given transaction i. Complexity: O(1). */
@@ -124,25 +162,59 @@ class DepGraph
124162
/** Get the descendants of a given transaction i. Complexity: O(1). */
125163
const SetType& Descendants(ClusterIndex i) const noexcept { return entries[i].descendants; }
126164

127-
/** Add a new unconnected transaction to this transaction graph (at the end), and return its
128-
* ClusterIndex.
165+
/** Add a new unconnected transaction to this transaction graph (in the first available
166+
* position), and return its ClusterIndex.
129167
*
130168
* Complexity: O(1) (amortized, due to resizing of backing vector).
131169
*/
132170
ClusterIndex AddTransaction(const FeeFrac& feefrac) noexcept
133171
{
134-
Assume(TxCount() < SetType::Size());
135-
ClusterIndex new_idx = TxCount();
136-
entries.emplace_back(feefrac, SetType::Singleton(new_idx), SetType::Singleton(new_idx));
172+
static constexpr auto ALL_POSITIONS = SetType::Fill(SetType::Size());
173+
auto available = ALL_POSITIONS - m_used;
174+
Assume(available.Any());
175+
ClusterIndex new_idx = available.First();
176+
if (new_idx == entries.size()) {
177+
entries.emplace_back(feefrac, SetType::Singleton(new_idx), SetType::Singleton(new_idx));
178+
} else {
179+
entries[new_idx] = Entry(feefrac, SetType::Singleton(new_idx), SetType::Singleton(new_idx));
180+
}
181+
m_used.Set(new_idx);
137182
return new_idx;
138183
}
139184

185+
/** Remove the specified positions from this DepGraph.
186+
*
187+
* The specified positions will no longer be part of Positions(), and dependencies with them are
188+
* removed. Note that due to DepGraph only tracking ancestors/descendants (and not direct
189+
* dependencies), if a parent is removed while a grandparent remains, the grandparent will
190+
* remain an ancestor.
191+
*
192+
* Complexity: O(N) where N=TxCount().
193+
*/
194+
void RemoveTransactions(const SetType& del) noexcept
195+
{
196+
m_used -= del;
197+
// Remove now-unused trailing entries.
198+
while (!entries.empty() && !m_used[entries.size() - 1]) {
199+
entries.pop_back();
200+
}
201+
// Remove the deleted transactions from ancestors/descendants of other transactions. Note
202+
// that the deleted positions will retain old feerate and dependency information. This does
203+
// not matter as they will be overwritten by AddTransaction if they get used again.
204+
for (auto& entry : entries) {
205+
entry.ancestors &= m_used;
206+
entry.descendants &= m_used;
207+
}
208+
}
209+
140210
/** Modify this transaction graph, adding multiple parents to a specified child.
141211
*
142212
* Complexity: O(N) where N=TxCount().
143213
*/
144214
void AddDependencies(const SetType& parents, ClusterIndex child) noexcept
145215
{
216+
Assume(m_used[child]);
217+
Assume(parents.IsSubsetOf(m_used));
146218
// Compute the ancestors of parents that are not already ancestors of child.
147219
SetType par_anc;
148220
for (auto par : parents - Ancestors(child)) {
@@ -257,7 +329,7 @@ class DepGraph
257329
*
258330
* Complexity: O(TxCount()).
259331
*/
260-
bool IsConnected() const noexcept { return IsConnected(SetType::Fill(TxCount())); }
332+
bool IsConnected() const noexcept { return IsConnected(m_used); }
261333

262334
/** Append the entries of select to list in a topologically valid order.
263335
*
@@ -507,11 +579,11 @@ class AncestorCandidateFinder
507579
*/
508580
AncestorCandidateFinder(const DepGraph<SetType>& depgraph LIFETIMEBOUND) noexcept :
509581
m_depgraph(depgraph),
510-
m_todo{SetType::Fill(depgraph.TxCount())},
511-
m_ancestor_set_feerates(depgraph.TxCount())
582+
m_todo{depgraph.Positions()},
583+
m_ancestor_set_feerates(depgraph.PositionRange())
512584
{
513585
// Precompute ancestor-set feerates.
514-
for (ClusterIndex i = 0; i < depgraph.TxCount(); ++i) {
586+
for (ClusterIndex i : m_depgraph.Positions()) {
515587
/** The remaining ancestors for transaction i. */
516588
SetType anc_to_add = m_depgraph.Ancestors(i);
517589
FeeFrac anc_feerate;
@@ -634,22 +706,26 @@ class SearchCandidateFinder
634706
SearchCandidateFinder(const DepGraph<SetType>& depgraph, uint64_t rng_seed) noexcept :
635707
m_rng(rng_seed),
636708
m_sorted_to_original(depgraph.TxCount()),
637-
m_original_to_sorted(depgraph.TxCount()),
638-
m_todo(SetType::Fill(depgraph.TxCount()))
709+
m_original_to_sorted(depgraph.PositionRange())
639710
{
640-
// Determine reordering mapping, by sorting by decreasing feerate.
641-
std::iota(m_sorted_to_original.begin(), m_sorted_to_original.end(), ClusterIndex{0});
711+
// Determine reordering mapping, by sorting by decreasing feerate. Unusued positions are
712+
// not included, as they will never be looked up anyway.
713+
ClusterIndex sorted_pos{0};
714+
for (auto i : depgraph.Positions()) {
715+
m_sorted_to_original[sorted_pos++] = i;
716+
}
642717
std::sort(m_sorted_to_original.begin(), m_sorted_to_original.end(), [&](auto a, auto b) {
643718
auto feerate_cmp = depgraph.FeeRate(a) <=> depgraph.FeeRate(b);
644719
if (feerate_cmp == 0) return a < b;
645720
return feerate_cmp > 0;
646721
});
647722
// Compute reverse mapping.
648-
for (ClusterIndex i = 0; i < depgraph.TxCount(); ++i) {
723+
for (ClusterIndex i = 0; i < m_sorted_to_original.size(); ++i) {
649724
m_original_to_sorted[m_sorted_to_original[i]] = i;
650725
}
651726
// Compute reordered dependency graph.
652-
m_sorted_depgraph = DepGraph(depgraph, m_original_to_sorted);
727+
m_sorted_depgraph = DepGraph(depgraph, m_original_to_sorted, m_sorted_to_original.size());
728+
m_todo = m_sorted_depgraph.Positions();
653729
}
654730

655731
/** Check whether any unlinearized transactions remain. */
@@ -1161,7 +1237,7 @@ void PostLinearize(const DepGraph<SetType>& depgraph, Span<ClusterIndex> lineari
11611237
// During an even pass, the diagram above would correspond to linearization [2,3,0,1], with
11621238
// groups [2] and [3,0,1].
11631239

1164-
std::vector<TxEntry> entries(linearization.size() + 1);
1240+
std::vector<TxEntry> entries(depgraph.PositionRange() + 1);
11651241

11661242
// Perform two passes over the linearization.
11671243
for (int pass = 0; pass < 2; ++pass) {

‎src/test/cluster_linearize_tests.cpp

+39
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,10 @@ using namespace cluster_linearize;
1818

1919
namespace {
2020

21+
/** Special magic value that indicates to TestDepGraphSerialization that a cluster entry represents
22+
* a hole. */
23+
constexpr std::pair<FeeFrac, TestBitSet> HOLE{FeeFrac{0, 0x3FFFFF}, {}};
24+
2125
template<typename SetType>
2226
void TestDepGraphSerialization(const Cluster<SetType>& cluster, const std::string& hexenc)
2327
{
@@ -26,6 +30,13 @@ void TestDepGraphSerialization(const Cluster<SetType>& cluster, const std::strin
2630
// Run normal sanity and correspondence checks, which includes a round-trip test.
2731
VerifyDepGraphFromCluster(cluster, depgraph);
2832

33+
// Remove holes (which are expected to be present as HOLE entries in cluster).
34+
SetType holes;
35+
for (ClusterIndex i = 0; i < cluster.size(); ++i) {
36+
if (cluster[i] == HOLE) holes.Set(i);
37+
}
38+
depgraph.RemoveTransactions(holes);
39+
2940
// There may be multiple serializations of the same graph, but DepGraphFormatter's serializer
3041
// only produces one of those. Verify that hexenc matches that canonical serialization.
3142
std::vector<unsigned char> encoding;
@@ -133,6 +144,34 @@ BOOST_AUTO_TEST_CASE(depgraph_ser_tests)
133144
skip insertion C): D,A,B,E,C */
134145
"00" /* end of graph */
135146
);
147+
148+
// Transactions: A(1,2), B(3,1), C(2,1), D(1,3), E(1,1). Deps: C->A, D->A, D->B, E->D.
149+
// In order: [_, D, _, _, A, _, B, _, _, _, E, _, _, C] (_ being holes). Internally serialized
150+
// in order A,B,C,D,E.
151+
TestDepGraphSerialization<TestBitSet>(
152+
{HOLE, {{1, 3}, {4, 6}}, HOLE, HOLE, {{1, 2}, {}}, HOLE, {{3, 1}, {}}, HOLE, HOLE, HOLE, {{1, 1}, {1}}, HOLE, HOLE, {{2, 1}, {4}}},
153+
"02" /* A size */
154+
"02" /* A fee */
155+
"03" /* A insertion position (3 holes): _, _, _, A */
156+
"01" /* B size */
157+
"06" /* B fee */
158+
"06" /* B insertion position (skip B->A dependency, skip 4 inserts, add 1 hole): _, _, _, A, _, B */
159+
"01" /* C size */
160+
"04" /* C fee */
161+
"01" /* C->A dependency (skip C->B dependency) */
162+
"0b" /* C insertion position (skip 6 inserts, add 5 holes): _, _, _, A, _, B, _, _, _, _, _, C */
163+
"03" /* D size */
164+
"02" /* D fee */
165+
"01" /* D->B dependency (skip D->C dependency) */
166+
"00" /* D->A dependency (no skips) */
167+
"0b" /* D insertion position (skip 11 inserts): _, D, _, _, A, _, B, _, _, _, _, _, C */
168+
"01" /* E size */
169+
"02" /* E fee */
170+
"00" /* E->D dependency (no skips) */
171+
"04" /* E insertion position (skip E->C dependency, E->B and E->A are implied, skip 3
172+
inserts): _, D, _, _, A, _, B, _, _, _, E, _, _, C */
173+
"00" /* end of graph */
174+
);
136175
}
137176

138177
BOOST_AUTO_TEST_SUITE_END()

‎src/test/feefrac_tests.cpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ BOOST_AUTO_TEST_CASE(feefrac_operators)
1515
FeeFrac sum{1500, 400};
1616
FeeFrac diff{500, -200};
1717
FeeFrac empty{0, 0};
18-
FeeFrac zero_fee{0, 1}; // zero-fee allowed
18+
[[maybe_unused]] FeeFrac zero_fee{0, 1}; // zero-fee allowed
1919

2020
BOOST_CHECK(empty == FeeFrac{}); // same as no-args
2121

0 commit comments

Comments
 (0)
Please sign in to comment.