Branch data Line data Source code
1 : : // Copyright (c) The Bitcoin Core developers
2 : : // Distributed under the MIT software license, see the accompanying
3 : : // file COPYING or http://www.opensource.org/licenses/mit-license.php.
4 : :
5 : : #include <cluster_linearize.h>
6 : : #include <random.h>
7 : : #include <serialize.h>
8 : : #include <streams.h>
9 : : #include <test/fuzz/fuzz.h>
10 : : #include <test/fuzz/FuzzedDataProvider.h>
11 : : #include <test/util/cluster_linearize.h>
12 : : #include <util/bitset.h>
13 : : #include <util/feefrac.h>
14 : :
15 : : #include <algorithm>
16 : : #include <stdint.h>
17 : : #include <vector>
18 : : #include <utility>
19 : :
20 : : using namespace cluster_linearize;
21 : :
22 : : namespace {
23 : :
24 : : /** A simple finder class for candidate sets.
25 : : *
26 : : * This class matches SearchCandidateFinder in interface and behavior, though with fewer
27 : : * optimizations.
28 : : */
29 : : template<typename SetType>
30 : : class SimpleCandidateFinder
31 : : {
32 : : /** Internal dependency graph. */
33 : : const DepGraph<SetType>& m_depgraph;
34 : : /** Which transactions are left to include. */
35 : : SetType m_todo;
36 : :
37 : : public:
38 : : /** Construct a SimpleCandidateFinder for a given graph. */
39 : 818 : SimpleCandidateFinder(const DepGraph<SetType>& depgraph LIFETIMEBOUND) noexcept :
40 : 818 : m_depgraph(depgraph), m_todo{depgraph.Positions()} {}
41 : :
42 : : /** Remove a set of transactions from the set of to-be-linearized ones. */
43 : 5833 : void MarkDone(SetType select) noexcept { m_todo -= select; }
44 : :
45 : : /** Determine whether unlinearized transactions remain. */
46 : 3687 : bool AllDone() const noexcept { return m_todo.None(); }
47 : :
48 : : /** Find a candidate set using at most max_iterations iterations, and return it together with
49 : : * the number of iterations actually performed. If that number is less than max_iterations, then the result is optimal.
50 : : *
51 : : * Complexity: O(N * M), where M is the number of connected topological subsets of the cluster.
52 : : * That number is bounded by M <= 2^(N-1).
53 : : */
54 : 4614 : std::pair<SetInfo<SetType>, uint64_t> FindCandidateSet(uint64_t max_iterations) const noexcept
55 : : {
56 : 4614 : uint64_t iterations_left = max_iterations;
57 : : // Queue of work units. Each consists of:
58 : : // - inc: set of transactions definitely included
59 : : // - und: set of transactions that can be added to inc still
60 : 4614 : std::vector<std::pair<SetType, SetType>> queue;
61 : : // Initially we have just one queue element, with the entire graph in und.
62 : 4614 : queue.emplace_back(SetType{}, m_todo);
63 : : // Best solution so far.
64 : 4614 : SetInfo best(m_depgraph, m_todo);
65 : : // Process the queue.
66 [ + + + + ]: 16067686 : while (!queue.empty() && iterations_left) {
67 : 16063072 : --iterations_left;
68 : : // Pop top element of the queue.
69 : 16063072 : auto [inc, und] = queue.back();
70 : 16063072 : queue.pop_back();
71 : : // Look for a transaction to consider adding/removing.
72 : 16063072 : bool inc_none = inc.None();
73 [ + + ]: 27669912 : for (auto split : und) {
74 : : // If inc is empty, consider any split transaction. Otherwise only consider
75 : : // transactions that share ancestry with inc so far (which means only connected
76 : : // sets will be considered).
77 [ + + + + ]: 19636265 : if (inc_none || inc.Overlaps(m_depgraph.Ancestors(split))) {
78 : : // Add a queue entry with split included.
79 : 8029425 : SetInfo new_inc(m_depgraph, inc | (m_todo & m_depgraph.Ancestors(split)));
80 : 8029425 : queue.emplace_back(new_inc.transactions, und - new_inc.transactions);
81 : : // Add a queue entry with split excluded.
82 : 8029425 : queue.emplace_back(inc, und - m_depgraph.Descendants(split));
83 : : // Update statistics to account for the candidate new_inc.
84 [ + + ]: 8029425 : if (new_inc.feerate > best.feerate) best = new_inc;
85 : : break;
86 : : }
87 : : }
88 : : }
89 : 4614 : return {std::move(best), max_iterations - iterations_left};
90 : 4614 : }
91 : : };
92 : :
93 : : /** A very simple finder class for optimal candidate sets, which tries every subset.
94 : : *
95 : : * It is even simpler than SimpleCandidateFinder, and is primarily included here to test the
96 : : * correctness of SimpleCandidateFinder, which is then used to test the correctness of
97 : : * SearchCandidateFinder.
98 : : */
99 : : template<typename SetType>
100 : : class ExhaustiveCandidateFinder
101 : : {
102 : : /** Internal dependency graph. */
103 : : const DepGraph<SetType>& m_depgraph;
104 : : /** Which transactions are left to include. */
105 : : SetType m_todo;
106 : :
107 : : public:
108 : : /** Construct an ExhaustiveCandidateFinder for a given graph. */
109 : 427 : ExhaustiveCandidateFinder(const DepGraph<SetType>& depgraph LIFETIMEBOUND) noexcept :
110 : 427 : m_depgraph(depgraph), m_todo{depgraph.Positions()} {}
111 : :
112 : : /** Remove a set of transactions from the set of to-be-linearized ones. */
113 : 3260 : void MarkDone(SetType select) noexcept { m_todo -= select; }
114 : :
115 : : /** Determine whether unlinearized transactions remain. */
116 : 3687 : bool AllDone() const noexcept { return m_todo.None(); }
117 : :
118 : : /** Find the optimal remaining candidate set.
119 : : *
120 : : * Complexity: O(N * 2^N).
121 : : */
122 : 1133 : SetInfo<SetType> FindCandidateSet() const noexcept
123 : : {
124 : : // Best solution so far.
125 : 1133 : SetInfo<SetType> best{m_todo, m_depgraph.FeeRate(m_todo)};
126 : : // The number of combinations to try.
127 : 1133 : uint64_t limit = (uint64_t{1} << m_todo.Count()) - 1;
128 : : // Try the transitive closure of every non-empty subset of m_todo.
129 [ + + ]: 479967 : for (uint64_t x = 1; x < limit; ++x) {
130 : : // If bit number b is set in x, then the remaining ancestors of the b'th remaining
131 : : // transaction in m_todo are included.
132 : 478834 : SetType txn;
133 : 478834 : auto x_shifted{x};
134 [ + - + + ]: 6139920 : for (auto i : m_todo) {
135 [ + + ]: 5182252 : if (x_shifted & 1) txn |= m_depgraph.Ancestors(i);
136 : 5182252 : x_shifted >>= 1;
137 : : }
138 : 478834 : SetInfo cur(m_depgraph, txn & m_todo);
139 [ + + ]: 478834 : if (cur.feerate > best.feerate) best = cur;
140 : : }
141 : 1133 : return best;
142 : : }
143 : : };
144 : :
145 : : /** A simple linearization algorithm.
146 : : *
147 : : * This matches Linearize() in interface and behavior, though with fewer optimizations, lacking
148 : : * the ability to pass in an existing linearization, and using just SimpleCandidateFinder rather
149 : : * than AncestorCandidateFinder and SearchCandidateFinder.
150 : : */
151 : : template<typename SetType>
152 : 391 : std::pair<std::vector<ClusterIndex>, bool> SimpleLinearize(const DepGraph<SetType>& depgraph, uint64_t max_iterations)
153 : : {
154 : 391 : std::vector<ClusterIndex> linearization;
155 : 391 : SimpleCandidateFinder finder(depgraph);
156 : 391 : SetType todo = depgraph.Positions();
157 : 391 : bool optimal = true;
158 [ + + ]: 2964 : while (todo.Any()) {
159 [ + + ]: 2573 : auto [candidate, iterations_done] = finder.FindCandidateSet(max_iterations);
160 [ + + ]: 2573 : if (iterations_done == max_iterations) optimal = false;
161 : 2573 : depgraph.AppendTopo(linearization, candidate.transactions);
162 : 2573 : todo -= candidate.transactions;
163 : 2573 : finder.MarkDone(candidate.transactions);
164 : 2573 : max_iterations -= iterations_done;
165 : : }
166 : 391 : return {std::move(linearization), optimal};
167 : 391 : }
168 : :
169 : : /** Stitch connected components together in a DepGraph, guaranteeing its corresponding cluster is connected. */
170 : : template<typename BS>
171 : 1135 : void MakeConnected(DepGraph<BS>& depgraph)
172 : : {
173 : 1135 : auto todo = depgraph.Positions();
174 : 1135 : auto comp = depgraph.FindConnectedComponent(todo);
175 : 1135 : Assume(depgraph.IsConnected(comp));
176 : 1135 : todo -= comp;
177 [ + + ]: 11351 : while (todo.Any()) {
178 : 10216 : auto nextcomp = depgraph.FindConnectedComponent(todo);
179 : 10216 : Assume(depgraph.IsConnected(nextcomp));
180 : 10216 : depgraph.AddDependencies(BS::Singleton(comp.Last()), nextcomp.First());
181 : 10216 : todo -= nextcomp;
182 : 10216 : comp = nextcomp;
183 : : }
184 : 1135 : }
185 : :
186 : : /** Given a dependency graph, and a todo set, read a topological subset of todo from reader. */
187 : : template<typename SetType>
188 : 9984 : SetType ReadTopologicalSet(const DepGraph<SetType>& depgraph, const SetType& todo, SpanReader& reader)
189 : : {
190 [ + + ]: 9984 : uint64_t mask{0};
191 : : try {
192 [ + + ]: 9984 : reader >> VARINT(mask);
193 [ - + ]: 5701 : } catch(const std::ios_base::failure&) {}
194 : 9984 : SetType ret;
195 [ + + + + ]: 148289 : for (auto i : todo) {
196 [ + + ]: 128328 : if (!ret[i]) {
197 [ + + ]: 124574 : if (mask & 1) ret |= depgraph.Ancestors(i);
198 : 124574 : mask >>= 1;
199 : : }
200 : : }
201 : 9984 : return ret & todo;
202 : : }
203 : :
204 : : /** Given a dependency graph, construct any valid linearization for it, reading from a SpanReader. */
205 : : template<typename BS>
206 : 1943 : std::vector<ClusterIndex> ReadLinearization(const DepGraph<BS>& depgraph, SpanReader& reader)
207 : : {
208 : 1943 : std::vector<ClusterIndex> linearization;
209 : 1943 : TestBitSet todo = depgraph.Positions();
210 : : // In every iteration one topologically-valid transaction is appended to linearization.
211 [ + + ]: 41254 : while (todo.Any()) {
212 : : // Compute the set of transactions with no not-yet-included ancestors.
213 : 37368 : TestBitSet potential_next;
214 [ + + ]: 553729 : for (auto j : todo) {
215 [ + + ]: 814912 : if ((depgraph.Ancestors(j) & todo) == TestBitSet::Singleton(j)) {
216 : 298551 : potential_next.Set(j);
217 : : }
218 : : }
219 : : // There must always be one (otherwise there is a cycle in the graph).
220 [ - + ]: 37368 : assert(potential_next.Any());
221 : : // Read a number from reader, and interpret it as index into potential_next.
222 [ + + ]: 37368 : uint64_t idx{0};
223 : : try {
224 [ + + + - ]: 74736 : reader >> VARINT(idx);
225 [ - + ]: 27555 : } catch (const std::ios_base::failure&) {}
226 : 37368 : idx %= potential_next.Count();
227 : : // Find out which transaction that corresponds to.
228 [ + - + - ]: 105269 : for (auto j : potential_next) {
229 [ + + ]: 67901 : if (idx == 0) {
230 : : // When found, add it to linearization and remove it from todo.
231 [ + - ]: 37368 : linearization.push_back(j);
232 [ - + ]: 37368 : assert(todo[j]);
233 : 37368 : todo.Reset(j);
234 : 37368 : break;
235 : : }
236 : 30533 : --idx;
237 : : }
238 : : }
239 : 1943 : return linearization;
240 : 0 : }
241 : :
242 : : } // namespace
243 : :
244 [ + - ]: 620 : FUZZ_TARGET(clusterlin_depgraph_sim)
245 : : {
246 : : // Simulation test to verify the full behavior of DepGraph.
247 : :
248 : 206 : FuzzedDataProvider provider(buffer.data(), buffer.size());
249 : :
250 : : /** Real DepGraph being tested. */
251 : 206 : DepGraph<TestBitSet> real;
252 : : /** Simulated DepGraph (sim[i] is std::nullopt if position i does not exist; otherwise,
253 : : * sim[i]->first is its individual feerate, and sim[i]->second is its set of ancestors). */
254 : 206 : std::array<std::optional<std::pair<FeeFrac, TestBitSet>>, TestBitSet::Size()> sim;
255 : : /** The number of non-nullopt positions in sim. */
256 : 206 : ClusterIndex num_tx_sim{0};
257 : :
258 : : /** Read a valid index of a transaction from the provider. */
259 : 13823 : auto idx_fn = [&]() {
260 : 13617 : auto offset = provider.ConsumeIntegralInRange<ClusterIndex>(0, num_tx_sim - 1);
261 [ + - ]: 155070 : for (ClusterIndex i = 0; i < sim.size(); ++i) {
262 [ + + ]: 155070 : if (!sim[i].has_value()) continue;
263 [ + + ]: 136268 : if (offset == 0) return i;
264 : 122651 : --offset;
265 : : }
266 : 0 : assert(false);
267 : : return ClusterIndex(-1);
268 : 206 : };
269 : :
270 : : /** Read a valid subset of the transactions from the provider. */
271 : 13823 : auto subset_fn = [&]() {
272 : 13617 : auto range = (uint64_t{1} << num_tx_sim) - 1;
273 : 13617 : const auto mask = provider.ConsumeIntegralInRange<uint64_t>(0, range);
274 : 13617 : auto mask_shifted = mask;
275 : 13617 : TestBitSet subset;
276 [ + + ]: 449361 : for (ClusterIndex i = 0; i < sim.size(); ++i) {
277 [ + + ]: 435744 : if (!sim[i].has_value()) continue;
278 [ + + ]: 258304 : if (mask_shifted & 1) {
279 : 106294 : subset.Set(i);
280 : : }
281 : 258304 : mask_shifted >>= 1;
282 : : }
283 [ - + ]: 13617 : assert(mask_shifted == 0);
284 : 13617 : return subset;
285 : 206 : };
286 : :
287 : : /** Read any set of transactions from the provider (including unused positions). */
288 : 7513 : auto set_fn = [&]() {
289 : 7307 : auto range = (uint64_t{1} << sim.size()) - 1;
290 : 7307 : const auto mask = provider.ConsumeIntegralInRange<uint64_t>(0, range);
291 : 7307 : TestBitSet set;
292 [ + + ]: 241131 : for (ClusterIndex i = 0; i < sim.size(); ++i) {
293 [ + + ]: 233824 : if ((mask >> i) & 1) {
294 : 86740 : set.Set(i);
295 : : }
296 : : }
297 : 7307 : return set;
298 : 206 : };
299 : :
300 : : /** Propagate ancestor information in sim. */
301 : 7719 : auto anc_update_fn = [&]() {
302 : 8156 : while (true) {
303 : 8156 : bool updates{false};
304 [ + + ]: 269148 : for (ClusterIndex chl = 0; chl < sim.size(); ++chl) {
305 [ + + ]: 260992 : if (!sim[chl].has_value()) continue;
306 [ + - + + ]: 418714 : for (auto par : sim[chl]->second) {
307 [ + + ]: 241636 : if (!sim[chl]->second.IsSupersetOf(sim[par]->second)) {
308 : 2569 : sim[chl]->second |= sim[par]->second;
309 : 2569 : updates = true;
310 : : }
311 : : }
312 : : }
313 [ + + ]: 8156 : if (!updates) break;
314 : : }
315 : 7719 : };
316 : :
317 : : /** Compare the state of transaction i in the simulation with the real one. */
318 : 93538 : auto check_fn = [&](ClusterIndex i) {
319 : : // Compare used positions.
320 [ - + ]: 93332 : assert(real.Positions()[i] == sim[i].has_value());
321 [ + + ]: 93332 : if (sim[i].has_value()) {
322 : : // Compare feerate.
323 [ + - ]: 10481 : assert(real.FeeRate(i) == sim[i]->first);
324 : : // Compare ancestors (note that SanityCheck verifies correspondence between ancestors
325 : : // and descendants, so we can restrict ourselves to ancestors here).
326 [ - + ]: 10481 : assert(real.Ancestors(i) == sim[i]->second);
327 : : }
328 : 93538 : };
329 : :
330 [ + + + + ]: 31611 : LIMITED_WHILE(provider.remaining_bytes() > 0, 1000) {
331 : 31405 : uint8_t command = provider.ConsumeIntegral<uint8_t>();
332 [ + + + + : 31405 : if (num_tx_sim == 0 || ((command % 3) <= 0 && num_tx_sim < TestBitSet::Size())) {
+ + ]
333 : : // AddTransaction.
334 : 10481 : auto fee = provider.ConsumeIntegralInRange<int64_t>(-0x8000000000000, 0x7ffffffffffff);
335 : 10481 : auto size = provider.ConsumeIntegralInRange<int32_t>(1, 0x3fffff);
336 : 10481 : FeeFrac feerate{fee, size};
337 : : // Apply to DepGraph.
338 : 10481 : auto idx = real.AddTransaction(feerate);
339 : : // Verify that the returned index is correct.
340 [ - + ]: 10481 : assert(!sim[idx].has_value());
341 [ + - ]: 137102 : for (ClusterIndex i = 0; i < TestBitSet::Size(); ++i) {
342 [ + + ]: 137102 : if (!sim[i].has_value()) {
343 [ - + ]: 10481 : assert(idx == i);
344 : : break;
345 : : }
346 : : }
347 : : // Update sim.
348 [ - + ]: 10481 : sim[idx] = {feerate, TestBitSet::Singleton(idx)};
349 : 10481 : ++num_tx_sim;
350 : 10481 : continue;
351 : 10481 : }
352 [ + + ]: 20924 : if ((command % 3) <= 1 && num_tx_sim > 0) {
353 : : // AddDependencies.
354 : 13617 : ClusterIndex child = idx_fn();
355 : 13617 : auto parents = subset_fn();
356 : : // Apply to DepGraph.
357 : 13617 : real.AddDependencies(parents, child);
358 : : // Apply to sim.
359 : 13617 : sim[child]->second |= parents;
360 : 13617 : continue;
361 : 13617 : }
362 : 7307 : if (num_tx_sim > 0) {
363 : : // Remove transactions.
364 : 7307 : auto del = set_fn();
365 : : // Propagate all ancestry information before deleting anything in the simulation (as
366 : : // intermediary transactions may be deleted which impact connectivity).
367 : 7307 : anc_update_fn();
368 : : // Compare the state of the transactions being deleted.
369 [ + + + + ]: 100710 : for (auto i : del) check_fn(i);
370 : : // Apply to DepGraph.
371 : 7307 : real.RemoveTransactions(del);
372 : : // Apply to sim.
373 [ + + ]: 241131 : for (ClusterIndex i = 0; i < sim.size(); ++i) {
374 [ + + ]: 233824 : if (sim[i].has_value()) {
375 [ + + ]: 71512 : if (del[i]) {
376 : 7428 : --num_tx_sim;
377 [ + - ]: 241252 : sim[i] = std::nullopt;
378 : : } else {
379 : 64084 : sim[i]->second -= del;
380 : : }
381 : : }
382 : : }
383 : 7307 : continue;
384 : 7307 : }
385 : : // This should be unreachable (one of the 3 above actions should always be possible).
386 : : assert(false);
387 : : }
388 : :
389 : : // Compare the real obtained depgraph against the simulation.
390 : 206 : anc_update_fn();
391 [ + + ]: 6798 : for (ClusterIndex i = 0; i < sim.size(); ++i) check_fn(i);
392 [ - + ]: 206 : assert(real.TxCount() == num_tx_sim);
393 : : // Sanity check the result (which includes round-tripping serialization, if applicable).
394 [ + - ]: 206 : SanityCheck(real);
395 : 206 : }
396 : :
397 [ + - ]: 639 : FUZZ_TARGET(clusterlin_depgraph_serialization)
398 : : {
399 : : // Verify that any deserialized depgraph is acyclic and roundtrips to an identical depgraph.
400 : :
401 : : // Construct a graph by deserializing.
402 [ + - ]: 225 : SpanReader reader(buffer);
403 : 225 : DepGraph<TestBitSet> depgraph;
404 : 225 : try {
405 [ + - ]: 225 : reader >> Using<DepGraphFormatter>(depgraph);
406 [ - - ]: 0 : } catch (const std::ios_base::failure&) {}
407 [ + - ]: 225 : SanityCheck(depgraph);
408 : :
409 : : // Verify the graph is a DAG.
410 [ - + ]: 225 : assert(IsAcyclic(depgraph));
411 : 225 : }
412 : :
413 [ + - ]: 544 : FUZZ_TARGET(clusterlin_components)
414 : : {
415 : : // Verify the behavior of DepGraph's FindConnectedComponent and IsConnected functions.
416 : :
417 : : // Construct a depgraph.
418 [ + - ]: 130 : SpanReader reader(buffer);
419 : 130 : DepGraph<TestBitSet> depgraph;
420 : 130 : try {
421 [ + - ]: 130 : reader >> Using<DepGraphFormatter>(depgraph);
422 [ - - ]: 0 : } catch (const std::ios_base::failure&) {}
423 : :
424 : 130 : TestBitSet todo = depgraph.Positions();
425 [ + + ]: 1668 : while (todo.Any()) {
426 : : // Find a connected component inside todo.
427 : 1538 : auto component = depgraph.FindConnectedComponent(todo);
428 : :
429 : : // The component must be a subset of todo and non-empty.
430 [ - + ]: 1538 : assert(component.IsSubsetOf(todo));
431 [ - + ]: 1538 : assert(component.Any());
432 : :
433 : : // If todo is the entire graph, and the entire graph is connected, then the component must
434 : : // be the entire graph.
435 [ + + ]: 1538 : if (todo == depgraph.Positions()) {
436 [ + + - + ]: 206 : assert((component == todo) == depgraph.IsConnected());
437 : : }
438 : :
439 : : // If todo is connected, then component must match todo.
440 [ + + - + ]: 2602 : assert((component == todo) == depgraph.IsConnected(todo));
441 : :
442 : : // The component cannot have any ancestors or descendants outside of component but in todo.
443 [ + + ]: 11406 : for (auto i : component) {
444 [ - + ]: 9868 : assert((depgraph.Ancestors(i) & todo).IsSubsetOf(component));
445 [ - + ]: 9868 : assert((depgraph.Descendants(i) & todo).IsSubsetOf(component));
446 : : }
447 : :
448 : : // Starting from any component element, we must be able to reach every element.
449 [ + + ]: 11406 : for (auto i : component) {
450 : : // Start with just i as reachable.
451 : 9868 : TestBitSet reachable = TestBitSet::Singleton(i);
452 : : // Add in-todo descendants and ancestors to reachable until it does not change anymore.
453 : 72834 : while (true) {
454 : 41351 : TestBitSet new_reachable = reachable;
455 [ + - + + ]: 510988 : for (auto j : new_reachable) {
456 : 428286 : new_reachable |= depgraph.Ancestors(j) & todo;
457 : 428286 : new_reachable |= depgraph.Descendants(j) & todo;
458 : : }
459 [ + + ]: 41351 : if (new_reachable == reachable) break;
460 : 31483 : reachable = new_reachable;
461 : 31483 : }
462 : : // Verify that the result is the entire component.
463 [ - + ]: 9868 : assert(component == reachable);
464 : : }
465 : :
466 : : // Construct an arbitrary subset of todo.
467 : 1538 : uint64_t subset_bits{0};
468 : 1538 : try {
469 [ + + ]: 1538 : reader >> VARINT(subset_bits);
470 [ - + ]: 1253 : } catch (const std::ios_base::failure&) {}
471 : 1538 : TestBitSet subset;
472 [ + - + + ]: 37871 : for (ClusterIndex i : depgraph.Positions()) {
473 [ + + ]: 34795 : if (todo[i]) {
474 [ + + ]: 17876 : if (subset_bits & 1) subset.Set(i);
475 : 17876 : subset_bits >>= 1;
476 : : }
477 : : }
478 : : // Which must be non-empty.
479 [ + + ]: 1538 : if (subset.None()) subset = TestBitSet::Singleton(todo.First());
480 : : // Remove it from todo.
481 : 1538 : todo -= subset;
482 : : }
483 : :
484 : : // No components can be found in an empty subset.
485 [ - + ]: 130 : assert(depgraph.FindConnectedComponent(todo).None());
486 : 130 : }
487 : :
488 [ + - ]: 655 : FUZZ_TARGET(clusterlin_make_connected)
489 : : {
490 : : // Verify that MakeConnected makes graphs connected.
491 : :
492 [ + - ]: 241 : SpanReader reader(buffer);
493 : 241 : DepGraph<TestBitSet> depgraph;
494 : 241 : try {
495 [ + - ]: 241 : reader >> Using<DepGraphFormatter>(depgraph);
496 [ - - ]: 0 : } catch (const std::ios_base::failure&) {}
497 [ + - ]: 241 : MakeConnected(depgraph);
498 [ + - ]: 241 : SanityCheck(depgraph);
499 [ - + ]: 241 : assert(depgraph.IsConnected());
500 : 241 : }
501 : :
502 [ + - ]: 536 : FUZZ_TARGET(clusterlin_chunking)
503 : : {
504 : : // Verify the correctness of the ChunkLinearization function.
505 : :
506 : : // Construct a graph by deserializing.
507 [ + - ]: 122 : SpanReader reader(buffer);
508 : 122 : DepGraph<TestBitSet> depgraph;
509 : 122 : try {
510 [ + - ]: 122 : reader >> Using<DepGraphFormatter>(depgraph);
511 [ - - ]: 0 : } catch (const std::ios_base::failure&) {}
512 : :
513 : : // Read a valid linearization for depgraph.
514 [ + - ]: 122 : auto linearization = ReadLinearization(depgraph, reader);
515 : :
516 : : // Invoke the chunking function.
517 : 122 : auto chunking = ChunkLinearization(depgraph, linearization);
518 : :
519 : : // Verify that chunk feerates are monotonically non-increasing.
520 [ + + ]: 520 : for (size_t i = 1; i < chunking.size(); ++i) {
521 [ - + ]: 398 : assert(!(chunking[i] >> chunking[i - 1]));
522 : : }
523 : :
524 : : // Naively recompute the chunks (each is the highest-feerate prefix of what remains).
525 : 122 : auto todo = depgraph.Positions();
526 [ + + ]: 634 : for (const auto& chunk_feerate : chunking) {
527 [ - + ]: 512 : assert(todo.Any());
528 : 512 : SetInfo<TestBitSet> accumulator, best;
529 [ + + ]: 11800 : for (ClusterIndex idx : linearization) {
530 [ + + ]: 11288 : if (todo[idx]) {
531 : 6015 : accumulator.Set(depgraph, idx);
532 [ + + + + ]: 6015 : if (best.feerate.IsEmpty() || accumulator.feerate >> best.feerate) {
533 : 1109 : best = accumulator;
534 : : }
535 : : }
536 : : }
537 [ + - ]: 512 : assert(chunk_feerate == best.feerate);
538 [ - + ]: 512 : assert(best.transactions.IsSubsetOf(todo));
539 : 512 : todo -= best.transactions;
540 : : }
541 [ - + ]: 122 : assert(todo.None());
542 : 122 : }
543 : :
544 [ + - ]: 552 : FUZZ_TARGET(clusterlin_ancestor_finder)
545 : : {
546 : : // Verify that AncestorCandidateFinder works as expected.
547 : :
548 : : // Retrieve a depgraph from the fuzz input.
549 [ + - ]: 138 : SpanReader reader(buffer);
550 : 138 : DepGraph<TestBitSet> depgraph;
551 : 138 : try {
552 [ + - ]: 138 : reader >> Using<DepGraphFormatter>(depgraph);
553 [ - - ]: 0 : } catch (const std::ios_base::failure&) {}
554 : :
555 : 138 : AncestorCandidateFinder anc_finder(depgraph);
556 : 138 : auto todo = depgraph.Positions();
557 [ + + ]: 1418 : while (todo.Any()) {
558 : : // Call the ancestor finder's FindCandidateSet for what remains of the graph.
559 [ - + ]: 1280 : assert(!anc_finder.AllDone());
560 [ - + ]: 1280 : assert(todo.Count() == anc_finder.NumRemaining());
561 : 1280 : auto best_anc = anc_finder.FindCandidateSet();
562 : : // Sanity check the result.
563 [ - + ]: 1280 : assert(best_anc.transactions.Any());
564 [ - + ]: 1280 : assert(best_anc.transactions.IsSubsetOf(todo));
565 [ + - ]: 1280 : assert(depgraph.FeeRate(best_anc.transactions) == best_anc.feerate);
566 [ - + ]: 1280 : assert(depgraph.IsConnected(best_anc.transactions));
567 : : // Check that it is topologically valid.
568 [ + - + + ]: 5024 : for (auto i : best_anc.transactions) {
569 [ - + ]: 2464 : assert((depgraph.Ancestors(i) & todo).IsSubsetOf(best_anc.transactions));
570 : : }
571 : :
572 : : // Compute all remaining ancestor sets.
573 : 1280 : std::optional<SetInfo<TestBitSet>> real_best_anc;
574 [ + - + + ]: 17840 : for (auto i : todo) {
575 : 15280 : SetInfo info(depgraph, todo & depgraph.Ancestors(i));
576 [ + + + + ]: 15280 : if (!real_best_anc.has_value() || info.feerate > real_best_anc->feerate) {
577 [ + + ]: 18489 : real_best_anc = info;
578 : : }
579 : : }
580 : : // The set returned by anc_finder must equal the real best ancestor set.
581 [ - + ]: 1280 : assert(real_best_anc.has_value());
582 [ + - ]: 1280 : assert(*real_best_anc == best_anc);
583 : :
584 : : // Find a topologically valid subset of transactions to remove from the graph.
585 [ + - ]: 1280 : auto del_set = ReadTopologicalSet(depgraph, todo, reader);
586 : : // If we did not find anything, use best_anc itself, because we should remove something.
587 [ + + ]: 1280 : if (del_set.None()) del_set = best_anc.transactions;
588 : 1280 : todo -= del_set;
589 : 1280 : anc_finder.MarkDone(del_set);
590 : : }
591 [ - + ]: 138 : assert(anc_finder.AllDone());
592 [ - + ]: 138 : assert(anc_finder.NumRemaining() == 0);
593 : 138 : }
594 : :
595 : : static constexpr auto MAX_SIMPLE_ITERATIONS = 300000;
596 : :
597 [ + - ]: 841 : FUZZ_TARGET(clusterlin_search_finder)
598 : : {
599 : : // Verify that SearchCandidateFinder works as expected by sanity checking the results
600 : : // and comparing with the results from SimpleCandidateFinder, ExhaustiveCandidateFinder, and
601 : : // AncestorCandidateFinder.
602 : :
603 : : // Retrieve an RNG seed, a depgraph, and whether to make it connected, from the fuzz input.
604 [ + - ]: 427 : SpanReader reader(buffer);
605 : 427 : DepGraph<TestBitSet> depgraph;
606 : 427 : uint64_t rng_seed{0};
607 : 427 : uint8_t make_connected{1};
608 : 427 : try {
609 [ + - + + : 427 : reader >> Using<DepGraphFormatter>(depgraph) >> rng_seed >> make_connected;
+ + ]
610 [ - + ]: 151 : } catch (const std::ios_base::failure&) {}
611 : : // The most complicated graphs are connected ones (other ones just split up). Optionally force
612 : : // the graph to be connected.
613 [ + + + - ]: 427 : if (make_connected) MakeConnected(depgraph);
614 : :
615 : : // Instantiate ALL the candidate finders.
616 : 427 : SearchCandidateFinder src_finder(depgraph, rng_seed);
617 : 427 : SimpleCandidateFinder smp_finder(depgraph);
618 : 427 : ExhaustiveCandidateFinder exh_finder(depgraph);
619 : 427 : AncestorCandidateFinder anc_finder(depgraph);
620 : :
621 : 427 : auto todo = depgraph.Positions();
622 [ + + ]: 3687 : while (todo.Any()) {
623 [ - + ]: 3260 : assert(!src_finder.AllDone());
624 [ - + ]: 3260 : assert(!smp_finder.AllDone());
625 [ - + ]: 3260 : assert(!exh_finder.AllDone());
626 [ - + ]: 3260 : assert(!anc_finder.AllDone());
627 [ - + ]: 3260 : assert(anc_finder.NumRemaining() == todo.Count());
628 : :
629 : : // For each iteration, read an iteration count limit from the fuzz input.
630 : 3260 : uint64_t max_iterations = 1;
631 : 3260 : try {
632 [ + + ]: 3260 : reader >> VARINT(max_iterations);
633 [ - + ]: 1401 : } catch (const std::ios_base::failure&) {}
634 : 3260 : max_iterations &= 0xfffff;
635 : :
636 : : // Read an initial subset from the fuzz input.
637 [ + - ]: 3260 : SetInfo init_best(depgraph, ReadTopologicalSet(depgraph, todo, reader));
638 : :
639 : : // Call the search finder's FindCandidateSet for what remains of the graph.
640 [ - + ]: 3260 : auto [found, iterations_done] = src_finder.FindCandidateSet(max_iterations, init_best);
641 : :
642 : : // Sanity check the result.
643 [ - + ]: 3260 : assert(iterations_done <= max_iterations);
644 [ - + ]: 3260 : assert(found.transactions.Any());
645 [ - + ]: 3260 : assert(found.transactions.IsSubsetOf(todo));
646 [ + - ]: 3260 : assert(depgraph.FeeRate(found.transactions) == found.feerate);
647 [ + + - + ]: 3260 : if (!init_best.feerate.IsEmpty()) assert(found.feerate >= init_best.feerate);
648 : : // Check that it is topologically valid.
649 [ + - + + ]: 15545 : for (auto i : found.transactions) {
650 [ - + ]: 9025 : assert(found.transactions.IsSupersetOf(depgraph.Ancestors(i) & todo));
651 : : }
652 : :
653 : : // At most 2^(N-1) iterations can be required: the maximum number of non-empty topological
654 : : // subsets a (connected) cluster with N transactions can have. Even when the cluster is no
655 : : // longer connected after removing certain transactions, this holds, because the connected
656 : : // components are searched separately.
657 [ - + ]: 3260 : assert(iterations_done <= (uint64_t{1} << (todo.Count() - 1)));
658 : : // Additionally, test that no more than sqrt(2^N)+1 iterations are required. This is just
659 : : // an empirical bound that seems to hold, without proof. Still, add a test for it so we
660 : : // can learn about counterexamples if they exist.
661 [ + + + - ]: 3260 : if (iterations_done >= 1 && todo.Count() <= 63) {
662 [ + - ]: 2238 : Assume((iterations_done - 1) * (iterations_done - 1) <= uint64_t{1} << todo.Count());
663 : : }
664 : :
665 : : // Perform quality checks only if SearchCandidateFinder claims an optimal result.
666 [ + + ]: 3260 : if (iterations_done < max_iterations) {
667 : : // Optimal sets are always connected.
668 [ - + ]: 2041 : assert(depgraph.IsConnected(found.transactions));
669 : :
670 : : // Compare with SimpleCandidateFinder.
671 [ - + ]: 2041 : auto [simple, simple_iters] = smp_finder.FindCandidateSet(MAX_SIMPLE_ITERATIONS);
672 [ - + ]: 2041 : assert(found.feerate >= simple.feerate);
673 [ + + ]: 2041 : if (simple_iters < MAX_SIMPLE_ITERATIONS) {
674 [ + - ]: 2011 : assert(found.feerate == simple.feerate);
675 : : }
676 : :
677 : : // Compare with AncestorCandidateFinder.
678 : 2041 : auto anc = anc_finder.FindCandidateSet();
679 [ - + ]: 2041 : assert(found.feerate >= anc.feerate);
680 : :
681 : : // Compare with ExhaustiveCandidateFinder. This quickly gets computationally expensive
682 : : // for large clusters (O(2^n)), so only do it for sufficiently small ones.
683 [ + + ]: 2041 : if (todo.Count() <= 12) {
684 : 1133 : auto exhaustive = exh_finder.FindCandidateSet();
685 [ + - ]: 1133 : assert(exhaustive.feerate == found.feerate);
686 : : // Also compare ExhaustiveCandidateFinder with SimpleCandidateFinder (this is
687 : : // primarily a test for SimpleCandidateFinder's correctness).
688 [ - + ]: 1133 : assert(exhaustive.feerate >= simple.feerate);
689 [ + - ]: 1133 : if (simple_iters < MAX_SIMPLE_ITERATIONS) {
690 [ + - ]: 1133 : assert(exhaustive.feerate == simple.feerate);
691 : : }
692 : : }
693 : : }
694 : :
695 : : // Find a topologically valid subset of transactions to remove from the graph.
696 [ + - ]: 3260 : auto del_set = ReadTopologicalSet(depgraph, todo, reader);
697 : : // If we did not find anything, use found itself, because we should remove something.
698 [ + + ]: 3260 : if (del_set.None()) del_set = found.transactions;
699 : 3260 : todo -= del_set;
700 : 3260 : src_finder.MarkDone(del_set);
701 : 3260 : smp_finder.MarkDone(del_set);
702 : 3260 : exh_finder.MarkDone(del_set);
703 : 3260 : anc_finder.MarkDone(del_set);
704 : : }
705 : :
706 [ - + ]: 427 : assert(src_finder.AllDone());
707 [ - + ]: 427 : assert(smp_finder.AllDone());
708 [ - + ]: 427 : assert(exh_finder.AllDone());
709 [ - + ]: 427 : assert(anc_finder.AllDone());
710 [ - + ]: 427 : assert(anc_finder.NumRemaining() == 0);
711 : 427 : }
712 : :
713 [ + - ]: 600 : FUZZ_TARGET(clusterlin_linearization_chunking)
714 : : {
715 : : // Verify the behavior of LinearizationChunking.
716 : :
717 : : // Retrieve a depgraph from the fuzz input.
718 [ + - ]: 186 : SpanReader reader(buffer);
719 : 186 : DepGraph<TestBitSet> depgraph;
720 : 186 : try {
721 [ + - ]: 186 : reader >> Using<DepGraphFormatter>(depgraph);
722 [ - - ]: 0 : } catch (const std::ios_base::failure&) {}
723 : :
724 : : // Retrieve a topologically-valid subset of depgraph.
725 : 186 : auto todo = depgraph.Positions();
726 [ + - ]: 186 : auto subset = SetInfo(depgraph, ReadTopologicalSet(depgraph, todo, reader));
727 : :
728 : : // Retrieve a valid linearization for depgraph.
729 [ + - ]: 186 : auto linearization = ReadLinearization(depgraph, reader);
730 : :
731 : : // Construct a LinearizationChunking object, initially for the whole linearization.
732 : 186 : LinearizationChunking chunking(depgraph, linearization);
733 : :
734 : : // Incrementally remove transactions from the chunking object, and check various properties at
735 : : // every step.
736 [ + + ]: 2370 : while (todo.Any()) {
737 [ - + ]: 1998 : assert(chunking.NumChunksLeft() > 0);
738 : :
739 : : // Construct linearization with just todo.
740 : 1998 : std::vector<ClusterIndex> linearization_left;
741 [ + + ]: 49606 : for (auto i : linearization) {
742 [ + + + - ]: 47608 : if (todo[i]) linearization_left.push_back(i);
743 : : }
744 : :
745 : : // Compute the chunking for linearization_left.
746 : 1998 : auto chunking_left = ChunkLinearization(depgraph, linearization_left);
747 : :
748 : : // Verify that it matches the feerates of the chunks of chunking.
749 [ - + ]: 1998 : assert(chunking.NumChunksLeft() == chunking_left.size());
750 [ + + ]: 12243 : for (ClusterIndex i = 0; i < chunking.NumChunksLeft(); ++i) {
751 [ + - ]: 20490 : assert(chunking.GetChunk(i).feerate == chunking_left[i]);
752 : : }
753 : :
754 : : // Check consistency of chunking.
755 : 1998 : TestBitSet combined;
756 [ + + ]: 12243 : for (ClusterIndex i = 0; i < chunking.NumChunksLeft(); ++i) {
757 : 10245 : const auto& chunk_info = chunking.GetChunk(i);
758 : : // Chunks must be non-empty.
759 [ - + ]: 10245 : assert(chunk_info.transactions.Any());
760 : : // Chunk feerates must be monotonically non-increasing.
761 [ + + - + ]: 10245 : if (i > 0) assert(!(chunk_info.feerate >> chunking.GetChunk(i - 1).feerate));
762 : : // Chunks must be a subset of what is left of the linearization.
763 [ - + ]: 10245 : assert(chunk_info.transactions.IsSubsetOf(todo));
764 : : // Chunks' claimed feerates must match their transactions' aggregate feerate.
765 [ + - ]: 10245 : assert(depgraph.FeeRate(chunk_info.transactions) == chunk_info.feerate);
766 : : // Chunks must be the highest-feerate remaining prefix.
767 : 10245 : SetInfo<TestBitSet> accumulator, best;
768 [ + + ]: 288843 : for (auto j : linearization) {
769 [ + + + + ]: 278598 : if (todo[j] && !combined[j]) {
770 : 94881 : accumulator.Set(depgraph, j);
771 [ + + + + ]: 94881 : if (best.feerate.IsEmpty() || accumulator.feerate > best.feerate) {
772 : 18685 : best = accumulator;
773 : : }
774 : : }
775 : : }
776 [ - + ]: 10245 : assert(best.transactions == chunk_info.transactions);
777 [ + - ]: 10245 : assert(best.feerate == chunk_info.feerate);
778 : : // Chunks cannot overlap.
779 [ - + ]: 10245 : assert(!chunk_info.transactions.Overlaps(combined));
780 [ + - ]: 10245 : combined |= chunk_info.transactions;
781 : : // Chunks must be topological.
782 [ + - + + ]: 44262 : for (auto idx : chunk_info.transactions) {
783 [ - + ]: 23772 : assert((depgraph.Ancestors(idx) & todo).IsSubsetOf(combined));
784 : : }
785 : : }
786 [ - + ]: 1998 : assert(combined == todo);
787 : :
788 : : // Verify the expected properties of LinearizationChunking::IntersectPrefixes:
789 : 1998 : auto intersect = chunking.IntersectPrefixes(subset);
790 : : // - Intersecting again doesn't change the result.
791 [ + - ]: 1998 : assert(chunking.IntersectPrefixes(intersect) == intersect);
792 : : // - The intersection is topological.
793 : 1998 : TestBitSet intersect_anc;
794 [ + + + + ]: 7477 : for (auto idx : intersect.transactions) {
795 : 4348 : intersect_anc |= (depgraph.Ancestors(idx) & todo);
796 : : }
797 [ - + ]: 1998 : assert(intersect.transactions == intersect_anc);
798 : : // - The claimed intersection feerate matches its transactions.
799 [ + - ]: 1998 : assert(intersect.feerate == depgraph.FeeRate(intersect.transactions));
800 : : // - The intersection may only be empty if its input is empty.
801 [ - + ]: 1998 : assert(intersect.transactions.Any() == subset.transactions.Any());
802 : : // - The intersection feerate must be as high as the input.
803 [ - + ]: 1998 : assert(intersect.feerate >= subset.feerate);
804 : : // - No non-empty intersection between the intersection and a prefix of the chunks of the
805 : : // remainder of the linearization may be better than the intersection.
806 : 1998 : TestBitSet prefix;
807 [ + + ]: 12243 : for (ClusterIndex i = 0; i < chunking.NumChunksLeft(); ++i) {
808 : 10245 : prefix |= chunking.GetChunk(i).transactions;
809 : 10245 : auto reintersect = SetInfo(depgraph, prefix & intersect.transactions);
810 [ + + ]: 10245 : if (!reintersect.feerate.IsEmpty()) {
811 [ - + ]: 5749 : assert(reintersect.feerate <= intersect.feerate);
812 : : }
813 : : }
814 : :
815 : : // Find a subset to remove from linearization.
816 [ + - ]: 1998 : auto done = ReadTopologicalSet(depgraph, todo, reader);
817 [ + + ]: 1998 : if (done.None()) {
818 : : // We need to remove a non-empty subset, so fall back to the unlinearized ancestors of
819 : : // the first transaction in todo if done is empty.
820 : 1727 : done = depgraph.Ancestors(todo.First()) & todo;
821 : : }
822 : 1998 : todo -= done;
823 : 1998 : chunking.MarkDone(done);
824 : 1998 : subset = SetInfo(depgraph, subset.transactions - done);
825 : 1998 : }
826 : :
827 [ - + ]: 186 : assert(chunking.NumChunksLeft() == 0);
828 : 186 : }
829 : :
830 [ + - ]: 967 : FUZZ_TARGET(clusterlin_linearize)
831 : : {
832 : : // Verify the behavior of Linearize().
833 : :
834 : : // Retrieve an RNG seed, an iteration count, a depgraph, and whether to make it connected from
835 : : // the fuzz input.
836 [ + + ]: 553 : SpanReader reader(buffer);
837 : 553 : DepGraph<TestBitSet> depgraph;
838 : 553 : uint64_t rng_seed{0};
839 : 553 : uint64_t iter_count{0};
840 : 553 : uint8_t make_connected{1};
841 : 553 : try {
842 [ + + + - : 553 : reader >> VARINT(iter_count) >> Using<DepGraphFormatter>(depgraph) >> rng_seed >> make_connected;
+ + + + ]
843 [ - + ]: 377 : } catch (const std::ios_base::failure&) {}
844 : : // The most complicated graphs are connected ones (other ones just split up). Optionally force
845 : : // the graph to be connected.
846 [ + + + - ]: 553 : if (make_connected) MakeConnected(depgraph);
847 : :
848 : : // Optionally construct an old linearization for it.
849 : 553 : std::vector<ClusterIndex> old_linearization;
850 : 553 : {
851 : 553 : uint8_t have_old_linearization{0};
852 : 553 : try {
853 [ + + ]: 553 : reader >> have_old_linearization;
854 [ - + ]: 251 : } catch(const std::ios_base::failure&) {}
855 [ + + ]: 553 : if (have_old_linearization & 1) {
856 [ + - ]: 430 : old_linearization = ReadLinearization(depgraph, reader);
857 : 215 : SanityCheck(depgraph, old_linearization);
858 : : }
859 : : }
860 : :
861 : : // Invoke Linearize().
862 : 553 : iter_count &= 0x7ffff;
863 : 553 : auto [linearization, optimal] = Linearize(depgraph, iter_count, rng_seed, old_linearization);
864 : 553 : SanityCheck(depgraph, linearization);
865 : 553 : auto chunking = ChunkLinearization(depgraph, linearization);
866 : :
867 : : // Linearization must always be as good as the old one, if provided.
868 [ + + ]: 553 : if (!old_linearization.empty()) {
869 : 213 : auto old_chunking = ChunkLinearization(depgraph, old_linearization);
870 [ + - ]: 213 : auto cmp = CompareChunks(chunking, old_chunking);
871 [ - + ]: 213 : assert(cmp >= 0);
872 : 213 : }
873 : :
874 : : // If the iteration count is sufficiently high, an optimal linearization must be found.
875 : : // Each linearization step can use up to 2^(k-1) iterations, with steps k=1..n. That sum is
876 : : // 2^n - 1.
877 [ + + ]: 553 : const uint64_t n = depgraph.TxCount();
878 [ + + + + ]: 553 : if (n <= 19 && iter_count > (uint64_t{1} << n)) {
879 [ - + ]: 81 : assert(optimal);
880 : : }
881 : : // Additionally, if the assumption of sqrt(2^k)+1 iterations per step holds, plus ceil(k/4)
882 : : // start-up cost per step, plus ceil(n^2/64) start-up cost overall, we can compute the upper
883 : : // bound for a whole linearization (summing for k=1..n) using the Python expression
884 : : // [sum((k+3)//4 + int(math.sqrt(2**k)) + 1 for k in range(1, n + 1)) + (n**2 + 63) // 64 for n in range(0, 35)]:
885 : 553 : static constexpr uint64_t MAX_OPTIMAL_ITERS[] = {
886 : : 0, 4, 8, 12, 18, 26, 37, 51, 70, 97, 133, 182, 251, 346, 480, 666, 927, 1296, 1815, 2545,
887 : : 3576, 5031, 7087, 9991, 14094, 19895, 28096, 39690, 56083, 79263, 112041, 158391, 223936,
888 : : 316629, 447712
889 : : };
890 [ + - + + ]: 553 : if (n < std::size(MAX_OPTIMAL_ITERS) && iter_count >= MAX_OPTIMAL_ITERS[n]) {
891 [ + - ]: 180 : Assume(optimal);
892 : : }
893 : :
894 : : // If Linearize claims optimal result, run quality tests.
895 [ + + ]: 553 : if (optimal) {
896 : : // It must be as good as SimpleLinearize.
897 : 391 : auto [simple_linearization, simple_optimal] = SimpleLinearize(depgraph, MAX_SIMPLE_ITERATIONS);
898 : 391 : SanityCheck(depgraph, simple_linearization);
899 : 391 : auto simple_chunking = ChunkLinearization(depgraph, simple_linearization);
900 [ + - ]: 391 : auto cmp = CompareChunks(chunking, simple_chunking);
901 [ - + ]: 391 : assert(cmp >= 0);
902 : : // If SimpleLinearize finds the optimal result too, they must be equal (if not,
903 : : // SimpleLinearize is broken).
904 [ + + - + ]: 391 : if (simple_optimal) assert(cmp == 0);
905 : :
906 : : // Only for very small clusters, test every topologically-valid permutation.
907 [ + + ]: 391 : if (depgraph.TxCount() <= 7) {
908 : 92 : std::vector<ClusterIndex> perm_linearization;
909 [ + + + - : 537 : for (ClusterIndex i : depgraph.Positions()) perm_linearization.push_back(i);
+ + ]
910 : : // Iterate over all valid permutations.
911 : 113828 : do {
912 : : // Determine whether perm_linearization is topological.
913 : 113828 : TestBitSet perm_done;
914 : 113828 : bool perm_is_topo{true};
915 [ + + ]: 193353 : for (auto i : perm_linearization) {
916 : 190858 : perm_done.Set(i);
917 [ + + ]: 190858 : if (!depgraph.Ancestors(i).IsSubsetOf(perm_done)) {
918 : : perm_is_topo = false;
919 : : break;
920 : : }
921 : : }
922 : : // If so, verify that the obtained linearization is as good as the permutation.
923 [ + + ]: 113828 : if (perm_is_topo) {
924 : 2495 : auto perm_chunking = ChunkLinearization(depgraph, perm_linearization);
925 [ + - ]: 2495 : auto cmp = CompareChunks(chunking, perm_chunking);
926 [ - + ]: 2495 : assert(cmp >= 0);
927 : 2495 : }
928 [ + + ]: 113828 : } while(std::next_permutation(perm_linearization.begin(), perm_linearization.end()));
929 : 92 : }
930 : 391 : }
931 : 553 : }
932 : :
933 [ + - ]: 550 : FUZZ_TARGET(clusterlin_postlinearize)
934 : : {
935 : : // Verify expected properties of PostLinearize() on arbitrary linearizations.
936 : :
937 : : // Retrieve a depgraph from the fuzz input.
938 [ + - ]: 136 : SpanReader reader(buffer);
939 : 136 : DepGraph<TestBitSet> depgraph;
940 : 136 : try {
941 [ + - ]: 136 : reader >> Using<DepGraphFormatter>(depgraph);
942 [ - - ]: 0 : } catch (const std::ios_base::failure&) {}
943 : :
944 : : // Retrieve a linearization from the fuzz input.
945 : 136 : std::vector<ClusterIndex> linearization;
946 [ + - ]: 272 : linearization = ReadLinearization(depgraph, reader);
947 : 136 : SanityCheck(depgraph, linearization);
948 : :
949 : : // Produce a post-processed version.
950 [ + - ]: 136 : auto post_linearization = linearization;
951 [ + - ]: 136 : PostLinearize(depgraph, post_linearization);
952 : 136 : SanityCheck(depgraph, post_linearization);
953 : :
954 : : // Compare diagrams: post-linearization cannot worsen anywhere.
955 : 136 : auto chunking = ChunkLinearization(depgraph, linearization);
956 : 136 : auto post_chunking = ChunkLinearization(depgraph, post_linearization);
957 [ + - ]: 136 : auto cmp = CompareChunks(post_chunking, chunking);
958 [ - + ]: 136 : assert(cmp >= 0);
959 : :
960 : : // Run again, things can keep improving (and never get worse)
961 [ + - ]: 136 : auto post_post_linearization = post_linearization;
962 [ + - ]: 136 : PostLinearize(depgraph, post_post_linearization);
963 : 136 : SanityCheck(depgraph, post_post_linearization);
964 : 136 : auto post_post_chunking = ChunkLinearization(depgraph, post_post_linearization);
965 [ + - ]: 136 : cmp = CompareChunks(post_post_chunking, post_chunking);
966 [ - + ]: 136 : assert(cmp >= 0);
967 : :
968 : : // The chunks that come out of postlinearizing are always connected.
969 : 136 : LinearizationChunking linchunking(depgraph, post_linearization);
970 [ + + ]: 1410 : while (linchunking.NumChunksLeft()) {
971 [ - + ]: 1138 : assert(depgraph.IsConnected(linchunking.GetChunk(0).transactions));
972 : 1138 : linchunking.MarkDone(linchunking.GetChunk(0).transactions);
973 : : }
974 : 136 : }
975 : :
976 [ + - ]: 876 : FUZZ_TARGET(clusterlin_postlinearize_tree)
977 : : {
978 : : // Verify expected properties of PostLinearize() on linearizations of graphs that form either
979 : : // an upright or reverse tree structure.
980 : :
981 : : // Construct a direction, RNG seed, and an arbitrary graph from the fuzz input.
982 [ + - ]: 462 : SpanReader reader(buffer);
983 : 462 : uint64_t rng_seed{0};
984 : 462 : DepGraph<TestBitSet> depgraph_gen;
985 : 462 : uint8_t direction{0};
986 : 462 : try {
987 [ + - + + : 462 : reader >> direction >> rng_seed >> Using<DepGraphFormatter>(depgraph_gen);
+ - ]
988 [ - + ]: 2 : } catch (const std::ios_base::failure&) {}
989 : :
990 : : // Now construct a new graph, copying the nodes, but leaving only the first parent (even
991 : : // direction) or the first child (odd direction).
992 : 462 : DepGraph<TestBitSet> depgraph_tree;
993 [ + + ]: 13940 : for (ClusterIndex i = 0; i < depgraph_gen.PositionRange(); ++i) {
994 [ + + ]: 13478 : if (depgraph_gen.Positions()[i]) {
995 : 10881 : depgraph_tree.AddTransaction(depgraph_gen.FeeRate(i));
996 : : } else {
997 : : // For holes, add a dummy transaction which is deleted below, so that non-hole
998 : : // transactions retain their position.
999 : 2597 : depgraph_tree.AddTransaction(FeeFrac{});
1000 : : }
1001 : : }
1002 : 462 : depgraph_tree.RemoveTransactions(TestBitSet::Fill(depgraph_gen.PositionRange()) - depgraph_gen.Positions());
1003 : :
1004 [ + + ]: 462 : if (direction & 1) {
1005 [ + + ]: 7330 : for (ClusterIndex i = 0; i < depgraph_gen.TxCount(); ++i) {
1006 : 7042 : auto children = depgraph_gen.GetReducedChildren(i);
1007 [ + + ]: 7042 : if (children.Any()) {
1008 : 4835 : depgraph_tree.AddDependencies(TestBitSet::Singleton(i), children.First());
1009 : : }
1010 : : }
1011 : : } else {
1012 [ + + ]: 4013 : for (ClusterIndex i = 0; i < depgraph_gen.TxCount(); ++i) {
1013 : 3839 : auto parents = depgraph_gen.GetReducedParents(i);
1014 [ + + ]: 3839 : if (parents.Any()) {
1015 : 1637 : depgraph_tree.AddDependencies(TestBitSet::Singleton(parents.First()), i);
1016 : : }
1017 : : }
1018 : : }
1019 : :
1020 : : // Retrieve a linearization from the fuzz input.
1021 : 462 : std::vector<ClusterIndex> linearization;
1022 [ + - ]: 924 : linearization = ReadLinearization(depgraph_tree, reader);
1023 : 462 : SanityCheck(depgraph_tree, linearization);
1024 : :
1025 : : // Produce a postlinearized version.
1026 [ + - ]: 462 : auto post_linearization = linearization;
1027 [ + - ]: 462 : PostLinearize(depgraph_tree, post_linearization);
1028 : 462 : SanityCheck(depgraph_tree, post_linearization);
1029 : :
1030 : : // Compare diagrams.
1031 : 462 : auto chunking = ChunkLinearization(depgraph_tree, linearization);
1032 : 462 : auto post_chunking = ChunkLinearization(depgraph_tree, post_linearization);
1033 [ + - ]: 462 : auto cmp = CompareChunks(post_chunking, chunking);
1034 [ - + ]: 462 : assert(cmp >= 0);
1035 : :
1036 : : // Verify that post-linearizing again does not change the diagram. The result must be identical
1037 : : // as post_linearization ought to be optimal already with a tree-structured graph.
1038 [ + - ]: 462 : auto post_post_linearization = post_linearization;
1039 [ + - ]: 462 : PostLinearize(depgraph_tree, post_linearization);
1040 : 462 : SanityCheck(depgraph_tree, post_linearization);
1041 : 462 : auto post_post_chunking = ChunkLinearization(depgraph_tree, post_post_linearization);
1042 [ + - ]: 462 : auto cmp_post = CompareChunks(post_post_chunking, post_chunking);
1043 [ - + ]: 462 : assert(cmp_post == 0);
1044 : :
1045 : : // Try to find an even better linearization directly. This must not change the diagram for the
1046 : : // same reason.
1047 : 462 : auto [opt_linearization, _optimal] = Linearize(depgraph_tree, 100000, rng_seed, post_linearization);
1048 : 462 : auto opt_chunking = ChunkLinearization(depgraph_tree, opt_linearization);
1049 [ + - ]: 462 : auto cmp_opt = CompareChunks(opt_chunking, post_chunking);
1050 [ - + ]: 462 : assert(cmp_opt == 0);
1051 : 462 : }
1052 : :
1053 [ + - ]: 556 : FUZZ_TARGET(clusterlin_postlinearize_moved_leaf)
1054 : : {
1055 : : // Verify that taking an existing linearization, and moving a leaf to the back, potentially
1056 : : // increasing its fee, and then post-linearizing, results in something as good as the
1057 : : // original. This guarantees that in an RBF that replaces a transaction with one of the same
1058 : : // size but higher fee, applying the "remove conflicts, append new transaction, postlinearize"
1059 : : // process will never worsen linearization quality.
1060 : :
1061 : : // Construct an arbitrary graph and a fee from the fuzz input.
1062 [ + - ]: 142 : SpanReader reader(buffer);
1063 : 142 : DepGraph<TestBitSet> depgraph;
1064 : 142 : int32_t fee_inc{0};
1065 : 142 : try {
1066 : 142 : uint64_t fee_inc_code;
1067 [ + - + + ]: 142 : reader >> Using<DepGraphFormatter>(depgraph) >> VARINT(fee_inc_code);
1068 : 58 : fee_inc = fee_inc_code & 0x3ffff;
1069 [ - + ]: 84 : } catch (const std::ios_base::failure&) {}
1070 [ + + ]: 142 : if (depgraph.TxCount() == 0) return;
1071 : :
1072 : : // Retrieve two linearizations from the fuzz input.
1073 [ + - ]: 133 : auto lin = ReadLinearization(depgraph, reader);
1074 [ + - ]: 133 : auto lin_leaf = ReadLinearization(depgraph, reader);
1075 : :
1076 : : // Construct a linearization identical to lin, but with the tail end of lin_leaf moved to the
1077 : : // back.
1078 : 133 : std::vector<ClusterIndex> lin_moved;
1079 [ + + ]: 1997 : for (auto i : lin) {
1080 [ + + + - ]: 1864 : if (i != lin_leaf.back()) lin_moved.push_back(i);
1081 : : }
1082 [ + - ]: 133 : lin_moved.push_back(lin_leaf.back());
1083 : :
1084 : : // Postlinearize lin_moved.
1085 [ + - ]: 133 : PostLinearize(depgraph, lin_moved);
1086 : 133 : SanityCheck(depgraph, lin_moved);
1087 : :
1088 : : // Compare diagrams (applying the fee delta after computing the old one).
1089 : 133 : auto old_chunking = ChunkLinearization(depgraph, lin);
1090 : 133 : depgraph.FeeRate(lin_leaf.back()).fee += fee_inc;
1091 : 133 : auto new_chunking = ChunkLinearization(depgraph, lin_moved);
1092 [ + - ]: 133 : auto cmp = CompareChunks(new_chunking, old_chunking);
1093 [ - + ]: 133 : assert(cmp >= 0);
1094 : 142 : }
1095 : :
1096 [ + - ]: 692 : FUZZ_TARGET(clusterlin_merge)
1097 : : {
1098 : : // Construct an arbitrary graph from the fuzz input.
1099 [ + - ]: 278 : SpanReader reader(buffer);
1100 : 278 : DepGraph<TestBitSet> depgraph;
1101 : 278 : try {
1102 [ + - ]: 278 : reader >> Using<DepGraphFormatter>(depgraph);
1103 [ - - ]: 0 : } catch (const std::ios_base::failure&) {}
1104 : :
1105 : : // Retrieve two linearizations from the fuzz input.
1106 [ + - ]: 278 : auto lin1 = ReadLinearization(depgraph, reader);
1107 [ + - ]: 278 : auto lin2 = ReadLinearization(depgraph, reader);
1108 : :
1109 : : // Merge the two.
1110 [ + - ]: 278 : auto lin_merged = MergeLinearizations(depgraph, lin1, lin2);
1111 : :
1112 : : // Compute chunkings and compare.
1113 : 278 : auto chunking1 = ChunkLinearization(depgraph, lin1);
1114 : 278 : auto chunking2 = ChunkLinearization(depgraph, lin2);
1115 : 278 : auto chunking_merged = ChunkLinearization(depgraph, lin_merged);
1116 [ + - ]: 278 : auto cmp1 = CompareChunks(chunking_merged, chunking1);
1117 [ - + ]: 278 : assert(cmp1 >= 0);
1118 [ + - ]: 278 : auto cmp2 = CompareChunks(chunking_merged, chunking2);
1119 [ - + ]: 278 : assert(cmp2 >= 0);
1120 : 278 : }
|