Line data Source code
1 : #include "fd_poh.h"
2 :
3 : /* The PoH implementation is at its core a state machine ...
4 :
5 : +--------+
6 : | UNINIT |
7 : +--------+
8 : |
9 : +---------+ | +---------+
10 : | v v v |
11 : +-------------------+ +----------+ +------------------+
12 : | WAITING_FOR_SLOT |<----| FOLLOWER |----->| WAITING_FOR_BANK |
13 : +-------------------+ +----------+ +------------------+
14 : | ^ |
15 : | | |
16 : | +----------+ |
17 : |------>| LEADER |<--------+
18 : +----------+
19 :
20 : The state machine starts UNINIT, but once a snapshot is loaded it
21 : will transition to follower.
22 :
23 : The state machine is in a resting the state when FOLLOWER, in this
24 : state it knows a `next_leader_slot` and will continually hash to
25 : advance towards that slot. When it reaches the `next_leader_slot`
26 : it will transition to the WAITING_FOR_BANK state, where it waits for
27 : the replay stage to tell it some information relevant to that leader
28 : slot, so that it can start doing mixins and hashing towards the end
29 : of the block. When the block ends, the state transitions back to
30 : follower, even if the next slot is the leader, as we need the replay
31 : stage to tell us about the new leader slot.
32 :
33 : Sometimes it might happen that we have received the bank from replay
34 : stage before we have reached the `next_leader_slot`, in which case
35 : we transition to the WAITING_FOR_SLOT state, where we wait for the
36 : hash count to reach the leader slot.
37 :
38 : At any time, during any state except UNINIT, we can be suddenly
39 : "reset" by the replay tile. Such reset actions may move the reset
40 : slot backwards or forwards, or set it back to something we have
41 : already seen before. BUT, the `next_leader_slot` must always
42 : advance forward.
43 :
44 : If the PoH machine successfully completes a leader slot, by hashing
45 : it until the end, then the a completion message is sent back to
46 : replay with the final blockhash, after which the state machine enters
47 : the follower state once again, and waits for further instructions
48 : from replay. */
49 :
50 0 : #define STATE_UNINIT (0)
51 0 : #define STATE_FOLLOWER (1)
52 0 : #define STATE_WAITING_FOR_BANK (2)
53 0 : #define STATE_WAITING_FOR_SLOT (3)
54 0 : #define STATE_LEADER (4)
55 0 : #define STATE_WAITING_FOR_RESET (5)
56 :
57 : FD_FN_CONST ulong
58 0 : fd_poh_align( void ) {
59 0 : return FD_POH_ALIGN;
60 0 : }
61 :
62 : FD_FN_CONST ulong
63 0 : fd_poh_footprint( void ) {
64 0 : return FD_POH_FOOTPRINT;
65 0 : }
66 :
67 : void *
68 0 : fd_poh_new( void * shmem ) {
69 0 : fd_poh_t * poh = (fd_poh_t *)shmem;
70 :
71 0 : if( FD_UNLIKELY( !poh ) ) {
72 0 : FD_LOG_WARNING(( "NULL shmem" ));
73 0 : return NULL;
74 0 : }
75 :
76 0 : if( FD_UNLIKELY( !fd_ulong_is_aligned( (ulong)poh, fd_poh_align() ) ) ) {
77 0 : FD_LOG_WARNING(( "misaligned shmem" ));
78 0 : return NULL;
79 0 : }
80 :
81 0 : poh->hashcnt_per_tick = ULONG_MAX;
82 0 : poh->state = STATE_UNINIT;
83 :
84 0 : FD_COMPILER_MFENCE();
85 0 : FD_VOLATILE( poh->magic ) = FD_POH_MAGIC;
86 0 : FD_COMPILER_MFENCE();
87 :
88 0 : return (void *)poh;
89 0 : }
90 :
91 : fd_poh_t *
92 : fd_poh_join( void * shpoh,
93 : fd_poh_out_t * shred_out,
94 0 : fd_poh_out_t * replay_out ) {
95 0 : if( FD_UNLIKELY( !shpoh ) ) {
96 0 : FD_LOG_WARNING(( "NULL shpoh" ));
97 0 : return NULL;
98 0 : }
99 :
100 0 : if( FD_UNLIKELY( !fd_ulong_is_aligned( (ulong)shpoh, fd_poh_align() ) ) ) {
101 0 : FD_LOG_WARNING(( "misaligned shpoh" ));
102 0 : return NULL;
103 0 : }
104 :
105 0 : fd_poh_t * poh = (fd_poh_t *)shpoh;
106 :
107 0 : if( FD_UNLIKELY( poh->magic!=FD_POH_MAGIC ) ) {
108 0 : FD_LOG_WARNING(( "bad magic" ));
109 0 : return NULL;
110 0 : }
111 :
112 0 : *poh->shred_out = *shred_out;
113 0 : *poh->replay_out = *replay_out;
114 :
115 0 : return poh;
116 0 : }
117 :
118 : static void
119 : transition_to_follower( fd_poh_t * poh,
120 : fd_stem_context_t * stem,
121 0 : int completed_leader_slot ) {
122 0 : FD_TEST( poh->state==STATE_LEADER || poh->state==STATE_WAITING_FOR_BANK || poh->state==STATE_WAITING_FOR_SLOT || poh->state==STATE_WAITING_FOR_RESET );
123 :
124 0 : if( FD_LIKELY( completed_leader_slot ) ) FD_TEST( poh->state==STATE_LEADER );
125 :
126 0 : if( FD_LIKELY( poh->state==STATE_LEADER || poh->state==STATE_WAITING_FOR_SLOT ) ) {
127 0 : fd_poh_leader_slot_ended_t * dst = fd_chunk_to_laddr( poh->replay_out->mem, poh->replay_out->chunk );
128 0 : dst->completed = completed_leader_slot;
129 0 : dst->slot = poh->slot-1UL;
130 0 : fd_memcpy( dst->blockhash, poh->hash, 32UL );
131 0 : ulong tspub = (ulong)fd_frag_meta_ts_comp( fd_tickcount() );
132 0 : fd_stem_publish( stem, poh->replay_out->idx, 0UL, poh->replay_out->chunk, sizeof(fd_poh_leader_slot_ended_t), 0UL, 0UL, tspub );
133 0 : poh->replay_out->chunk = fd_dcache_compact_next( poh->replay_out->chunk, sizeof(fd_poh_leader_slot_ended_t), poh->replay_out->chunk0, poh->replay_out->wmark );
134 0 : }
135 :
136 0 : poh->state = STATE_FOLLOWER;
137 0 : }
138 :
139 : static void
140 : update_hashes_per_tick( fd_poh_t * poh,
141 0 : ulong hashcnt_per_tick ) {
142 0 : if( FD_UNLIKELY( poh->hashcnt_per_tick!=hashcnt_per_tick ) ) {
143 0 : if( FD_UNLIKELY( poh->hashcnt_per_tick!=ULONG_MAX ) ) {
144 0 : FD_LOG_WARNING(( "hashes per tick changed from %lu to %lu", poh->hashcnt_per_tick, hashcnt_per_tick ));
145 0 : }
146 :
147 : /* Recompute derived information about the clock. */
148 0 : poh->hashcnt_duration_ns = (double)poh->tick_duration_ns/(double)hashcnt_per_tick;
149 0 : poh->hashcnt_per_slot = poh->ticks_per_slot*hashcnt_per_tick;
150 0 : poh->hashcnt_per_tick = hashcnt_per_tick;
151 :
152 : /* Discard any ticks we might have done in the interim. They will
153 : have the wrong number of hashes per tick. We can just catch back
154 : up quickly if not too many slots were skipped and hopefully
155 : publish on time. Note that tick production and verification of
156 : skipped slots is done for the eventual bank that publishes a
157 : slot, for example:
158 :
159 : Reset Slot: 998
160 : Epoch Transition Slot: 1000
161 : Leader Slot: 1002
162 :
163 : In this case, if a feature changing the hashcnt_per_tick is
164 : activated in slot 1000, and we are publishing empty ticks for
165 : slots 998, 999, 1000, and 1001, they should all have the new
166 : hashes_per_tick number of hashes, rather than the older one, or
167 : some combination. */
168 :
169 0 : FD_TEST( poh->last_slot==poh->reset_slot );
170 0 : FD_TEST( !poh->last_hashcnt );
171 0 : poh->slot = poh->reset_slot;
172 0 : poh->hashcnt = 0UL;
173 0 : }
174 0 : }
175 :
176 : void
177 : fd_poh_reset( fd_poh_t * poh,
178 : fd_stem_context_t * stem,
179 : long timestamp, /* The local timestamp when the reset is occurring */
180 : ulong hashcnt_per_tick, /* The hashcnt per tick of the bank that completed */
181 : ulong ticks_per_slot,
182 : ulong tick_duration_ns,
183 : ulong completed_slot, /* The slot that successfully produced a block */
184 : uchar const * completed_blockhash, /* The hash of the last tick in the produced block */
185 : ulong next_leader_slot, /* The next slot where this node will be leader */
186 : ulong max_microblocks_in_slot, /* The maximum number of microblocks that may appear in a slot */
187 0 : uchar const * completed_block_id /* The block id of the completed block */) {
188 0 : memcpy( poh->reset_hash, completed_blockhash, 32UL );
189 0 : memcpy( poh->hash, completed_blockhash, 32UL );
190 0 : memcpy( poh->completed_block_id, completed_block_id, 32UL );
191 0 : poh->slot = completed_slot+1UL;
192 0 : poh->hashcnt = 0UL;
193 0 : poh->last_slot = poh->slot;
194 0 : poh->last_hashcnt = 0UL;
195 0 : poh->reset_slot = poh->slot;
196 0 : poh->next_leader_slot = next_leader_slot;
197 0 : poh->max_microblocks_per_slot = max_microblocks_in_slot;
198 0 : poh->reset_slot_start_ns = timestamp;
199 :
200 0 : if( FD_UNLIKELY( poh->state==STATE_UNINIT ) ) {
201 0 : poh->tick_duration_ns = tick_duration_ns;
202 0 : poh->ticks_per_slot = ticks_per_slot;
203 0 : poh->state = STATE_FOLLOWER;
204 0 : } else {
205 0 : FD_TEST( tick_duration_ns==poh->tick_duration_ns );
206 0 : FD_TEST( ticks_per_slot==poh->ticks_per_slot );
207 0 : }
208 0 : update_hashes_per_tick( poh, hashcnt_per_tick );
209 :
210 : /* When we reset, we need to allow PoH to tick freely again rather
211 : than being constrained. If we are leader after the reset, this
212 : is OK because we won't tick until we get a bank, and the lower
213 : bound will be reset with the value from the bank. */
214 0 : poh->microblocks_lower_bound = poh->max_microblocks_per_slot;
215 :
216 0 : if( FD_UNLIKELY( poh->state!=STATE_FOLLOWER ) ) transition_to_follower( poh, stem, 0 );
217 0 : if( FD_UNLIKELY( poh->slot==poh->next_leader_slot ) ) poh->state = STATE_WAITING_FOR_BANK;
218 0 : }
219 :
220 : void
221 : fd_poh_begin_leader( fd_poh_t * poh,
222 : ulong slot,
223 : ulong hashcnt_per_tick,
224 : ulong ticks_per_slot,
225 : ulong tick_duration_ns,
226 0 : ulong max_microblocks_in_slot ) {
227 0 : FD_TEST( poh->state==STATE_FOLLOWER || poh->state==STATE_WAITING_FOR_BANK );
228 0 : FD_TEST( slot==poh->next_leader_slot );
229 :
230 : /* PoH ends the slot once it "ticks" through all of the hashes, but we
231 : only want that to happen if we have received a done packing message
232 : from pack, so we always reserve an empty microblock at the end so
233 : the tick advance will not end the slot without being told. */
234 0 : poh->max_microblocks_per_slot = max_microblocks_in_slot+1UL;
235 :
236 0 : FD_TEST( tick_duration_ns==poh->tick_duration_ns );
237 0 : FD_TEST( ticks_per_slot==poh->ticks_per_slot );
238 0 : update_hashes_per_tick( poh, hashcnt_per_tick );
239 :
240 0 : if( FD_LIKELY( poh->state==STATE_FOLLOWER ) ) poh->state = STATE_WAITING_FOR_SLOT;
241 0 : else poh->state = STATE_LEADER;
242 :
243 0 : poh->microblocks_lower_bound = 0UL;
244 :
245 0 : FD_LOG_INFO(( "begin_leader(slot=%lu, last_slot=%lu, last_hashcnt=%lu)", slot, poh->last_slot, poh->last_hashcnt ));
246 0 : }
247 :
248 : int
249 0 : fd_poh_have_leader_bank( fd_poh_t const * poh ) {
250 0 : return poh->state==STATE_WAITING_FOR_SLOT || poh->state==STATE_LEADER;
251 0 : }
252 :
253 : int
254 0 : fd_poh_hashing_to_leader_slot( fd_poh_t const * poh ) {
255 0 : int hashing = poh->state==STATE_WAITING_FOR_SLOT || poh->state==STATE_LEADER;
256 0 : return hashing && poh->slot<poh->next_leader_slot;
257 0 : }
258 :
259 : void
260 : fd_poh_done_packing( fd_poh_t * poh,
261 0 : ulong microblocks_in_slot ) {
262 0 : FD_TEST( poh->state==STATE_LEADER );
263 0 : FD_LOG_INFO(( "done_packing(slot=%lu,seen_microblocks=%lu,microblocks_in_slot=%lu)",
264 0 : poh->slot,
265 0 : poh->microblocks_lower_bound,
266 0 : microblocks_in_slot ));
267 0 : FD_TEST( poh->microblocks_lower_bound==microblocks_in_slot );
268 0 : FD_TEST( poh->microblocks_lower_bound<=poh->max_microblocks_per_slot );
269 0 : poh->microblocks_lower_bound += poh->max_microblocks_per_slot - microblocks_in_slot;
270 0 : FD_TEST( poh->microblocks_lower_bound==poh->max_microblocks_per_slot );
271 0 : }
272 :
273 : static void
274 : publish_tick( fd_poh_t * poh,
275 : fd_stem_context_t * stem,
276 : uchar hash[ static 32 ],
277 0 : int is_skipped ) {
278 0 : ulong hashcnt = poh->hashcnt_per_tick*(1UL+(poh->last_hashcnt/poh->hashcnt_per_tick));
279 :
280 0 : uchar * dst = (uchar *)fd_chunk_to_laddr( poh->shred_out->mem, poh->shred_out->chunk );
281 :
282 0 : FD_TEST( poh->last_slot>=poh->reset_slot );
283 0 : fd_entry_batch_meta_t * meta = (fd_entry_batch_meta_t *)dst;
284 0 : if( FD_UNLIKELY( is_skipped ) ) {
285 : /* We are publishing ticks for a skipped slot, the reference tick
286 : and block complete flags should always be zero. */
287 0 : meta->reference_tick = 0UL;
288 0 : meta->block_complete = 0;
289 0 : } else {
290 0 : meta->reference_tick = hashcnt/poh->hashcnt_per_tick;
291 0 : meta->block_complete = hashcnt==poh->hashcnt_per_slot;
292 0 : }
293 :
294 0 : meta->parent_block_id_valid = 1;
295 0 : fd_memcpy( meta->parent_block_id, poh->completed_block_id, 32UL );
296 :
297 0 : ulong slot = fd_ulong_if( meta->block_complete, poh->slot-1UL, poh->slot );
298 0 : meta->parent_offset = 1UL+slot-poh->reset_slot;
299 :
300 0 : FD_TEST( hashcnt>poh->last_hashcnt );
301 0 : ulong hash_delta = hashcnt-poh->last_hashcnt;
302 :
303 0 : dst += sizeof(fd_entry_batch_meta_t);
304 0 : fd_entry_batch_header_t * tick = (fd_entry_batch_header_t *)dst;
305 0 : tick->hashcnt_delta = hash_delta;
306 0 : fd_memcpy( tick->hash, hash, 32UL );
307 0 : tick->txn_cnt = 0UL;
308 :
309 0 : ulong tspub = (ulong)fd_frag_meta_ts_comp( fd_tickcount() );
310 0 : ulong sz = sizeof(fd_entry_batch_meta_t)+sizeof(fd_entry_batch_header_t);
311 0 : ulong sig = fd_disco_poh_sig( slot, POH_PKT_TYPE_MICROBLOCK, 0UL );
312 0 : fd_stem_publish( stem, poh->shred_out->idx, sig, poh->shred_out->chunk, sz, 0UL, 0UL, tspub );
313 0 : poh->shred_out->chunk = fd_dcache_compact_next( poh->shred_out->chunk, sz, poh->shred_out->chunk0, poh->shred_out->wmark );
314 :
315 0 : if( FD_UNLIKELY( hashcnt==poh->hashcnt_per_slot ) ) {
316 0 : poh->last_slot++;
317 0 : poh->last_hashcnt = 0UL;
318 0 : } else {
319 0 : poh->last_hashcnt = hashcnt;
320 0 : }
321 0 : }
322 :
323 : void
324 : fd_poh_advance( fd_poh_t * poh,
325 : fd_stem_context_t * stem,
326 : int * opt_poll_in,
327 0 : int * charge_busy ) {
328 0 : if( FD_UNLIKELY( poh->state==STATE_UNINIT || poh->state==STATE_WAITING_FOR_RESET ) ) return;
329 0 : if( FD_UNLIKELY( poh->state==STATE_WAITING_FOR_BANK ) ) {
330 : /* If we are the leader, but we didn't yet learn what the leader
331 : bank object is from the replay tile, do not do any hashing. */
332 0 : return;
333 0 : }
334 :
335 : /* If we have skipped ticks pending because we skipped some slots to
336 : become leader, register them now one at a time. */
337 0 : if( FD_UNLIKELY( poh->state==STATE_LEADER && poh->last_slot<poh->slot ) ) {
338 0 : ulong publish_hashcnt = poh->last_hashcnt+poh->hashcnt_per_tick;
339 0 : ulong tick_idx = (poh->last_slot*poh->ticks_per_slot+publish_hashcnt/poh->hashcnt_per_tick)%MAX_SKIPPED_TICKS;
340 :
341 0 : publish_tick( poh, stem, poh->skipped_tick_hashes[ tick_idx ], 1 );
342 :
343 : /* If we are catching up now and publishing a bunch of skipped
344 : ticks, we do not want to process any incoming microblocks until
345 : all the skipped ticks have been published out; otherwise we would
346 : intersperse skipped tick messages with microblocks. */
347 0 : *opt_poll_in = 0;
348 0 : *charge_busy = 1;
349 0 : return;
350 0 : }
351 :
352 0 : int low_power_mode = poh->hashcnt_per_tick==1UL;
353 :
354 : /* If we are the leader, always leave enough capacity in the slot so
355 : that we can mixin any potential microblocks still coming from the
356 : pack tile for this slot. */
357 0 : ulong max_remaining_microblocks = poh->max_microblocks_per_slot - poh->microblocks_lower_bound;
358 :
359 : /* With hashcnt_per_tick hashes per tick, we actually get
360 : hashcnt_per_tick-1 chances to mixin a microblock. For each tick
361 : span that we need to reserve, we also need to reserve the hashcnt
362 : for the tick, hence the +
363 : max_remaining_microblocks/(hashcnt_per_tick-1) rounded up.
364 :
365 : However, if hashcnt_per_tick is 1 because we're in low power mode,
366 : this should probably just be max_remaining_microblocks. */
367 0 : ulong max_remaining_ticks_or_microblocks = max_remaining_microblocks;
368 0 : if( FD_LIKELY( !low_power_mode ) ) max_remaining_ticks_or_microblocks += (max_remaining_microblocks+poh->hashcnt_per_tick-2UL)/(poh->hashcnt_per_tick-1UL);
369 :
370 0 : ulong restricted_hashcnt = fd_ulong_if( poh->hashcnt_per_slot>=max_remaining_ticks_or_microblocks, poh->hashcnt_per_slot-max_remaining_ticks_or_microblocks, 0UL );
371 :
372 0 : ulong min_hashcnt = poh->hashcnt;
373 :
374 0 : if( FD_LIKELY( !low_power_mode ) ) {
375 : /* Recall that there are two kinds of events that will get published
376 : to the shredder,
377 :
378 : (a) Ticks. These occur every 62,500 (hashcnt_per_tick) hashcnts,
379 : and there will be 64 (ticks_per_slot) of them in each slot.
380 :
381 : Ticks must not have any transactions mixed into the hash.
382 : This is not strictly needed in theory, but is required by the
383 : current consensus protocol. They get published here in
384 : after_credit.
385 :
386 : (b) Microblocks. These can occur at any other hashcnt, as long
387 : as it is not a tick. Microblocks cannot be empty, and must
388 : have at least one transactions mixed in. These get
389 : published in after_frag.
390 :
391 : If hashcnt_per_tick is 1, then we are in low power mode and the
392 : following does not apply, since we can mix in transactions at any
393 : time.
394 :
395 : In the normal, non-low-power mode, though, we have to be careful
396 : to make sure that we do not publish microblocks on tick
397 : boundaries. To do that, we need to obey two rules:
398 : (i) after_credit must not leave hashcnt one before a tick
399 : boundary
400 : (ii) if after_credit begins one before a tick boundary, it must
401 : advance hashcnt and publish the tick
402 :
403 : There's some interplay between min_hashcnt and restricted_hashcnt
404 : here, and we need to show that there's always a value of
405 : target_hashcnt we can pick such that
406 : min_hashcnt <= target_hashcnt <= restricted_hashcnt.
407 : We'll prove this by induction for current_slot==0 and
408 : is_leader==true, since all other slots should be the same.
409 :
410 : Let m_j and r_j be the min_hashcnt and restricted_hashcnt
411 : (respectively) for the jth call to after_credit in a slot. We
412 : want to show that for all values of j, it's possible to pick a
413 : value h_j, the value of target_hashcnt for the jth call to
414 : after_credit (which is also the value of hashcnt after
415 : after_credit has completed) such that m_j<=h_j<=r_j.
416 :
417 : Additionally, let T be hashcnt_per_tick and N be ticks_per_slot.
418 :
419 : Starting with the base case, j==0. m_j=0, and
420 : r_0 = N*T - max_microblocks_per_slot
421 : - ceil(max_microblocks_per_slot/(T-1)).
422 :
423 : This is monotonic decreasing in max_microblocks_per_slot, so it
424 : achieves its minimum when max_microblocks_per_slot is its
425 : maximum.
426 : r_0 >= N*T - N*(T-1) - ceil( (N*(T-1))/(T-1))
427 : = N*T - N*(T-1)-N = 0.
428 : Thus, m_0 <= r_0, as desired.
429 :
430 :
431 :
432 : Then, for the inductive step, assume there exists h_j such that
433 : m_j<=h_j<=r_j, and we want to show that there exists h_{j+1},
434 : which is the same as showing m_{j+1}<=r_{j+1}.
435 :
436 : Let a_j be 1 if we had a microblock immediately following the jth
437 : call to after_credit, and 0 otherwise. Then hashcnt at the start
438 : of the (j+1)th call to after_frag is h_j+a_j.
439 : Also, set b_{j+1}=1 if we are in the case covered by rule (ii)
440 : above during the (j+1)th call to after_credit, i.e. if
441 : (h_j+a_j)%T==T-1. Thus, m_{j+1} = h_j + a_j + b_{j+1}.
442 :
443 : If we received an additional microblock, then
444 : max_remaining_microblocks goes down by 1, and
445 : max_remaining_ticks_or_microblocks goes down by either 1 or 2,
446 : which means restricted_hashcnt goes up by either 1 or 2. In
447 : particular, it goes up by 2 if the new value of
448 : max_remaining_microblocks (at the start of the (j+1)th call to
449 : after_credit) is congruent to 0 mod T-1. Let b'_{j+1} be 1 if
450 : this condition is met and 0 otherwise. If we receive a
451 : done_packing message, restricted_hashcnt can go up by more, but
452 : we can ignore that case, since it is less restrictive.
453 : Thus, r_{j+1}=r_j+a_j+b'_{j+1}.
454 :
455 : If h_j < r_j (strictly less), then h_j+a_j < r_j+a_j. And thus,
456 : since b_{j+1}<=b'_{j+1}+1, just by virtue of them both being
457 : binary,
458 : h_j + a_j + b_{j+1} < r_j + a_j + b'_{j+1} + 1,
459 : which is the same (for integers) as
460 : h_j + a_j + b_{j+1} <= r_j + a_j + b'_{j+1},
461 : m_{j+1} <= r_{j+1}
462 :
463 : On the other hand, if h_j==r_j, this is easy unless b_{j+1}==1,
464 : which can also only happen if a_j==1. Then (h_j+a_j)%T==T-1,
465 : which means there's an integer k such that
466 :
467 : h_j+a_j==(ticks_per_slot-k)*T-1
468 : h_j ==ticks_per_slot*T - k*(T-1)-1 - k-1
469 : ==ticks_per_slot*T - (k*(T-1)+1) - ceil( (k*(T-1)+1)/(T-1) )
470 :
471 : Since h_j==r_j in this case, and
472 : r_j==(ticks_per_slot*T) - max_remaining_microblocks_j - ceil(max_remaining_microblocks_j/(T-1)),
473 : we can see that the value of max_remaining_microblocks at the
474 : start of the jth call to after_credit is k*(T-1)+1. Again, since
475 : a_j==1, then the value of max_remaining_microblocks at the start
476 : of the j+1th call to after_credit decreases by 1 to k*(T-1),
477 : which means b'_{j+1}=1.
478 :
479 : Thus, h_j + a_j + b_{j+1} == r_j + a_j + b'_{j+1}, so, in
480 : particular, h_{j+1}<=r_{j+1} as desired. */
481 0 : min_hashcnt += (ulong)(min_hashcnt%poh->hashcnt_per_tick == (poh->hashcnt_per_tick-1UL)); /* add b_{j+1}, enforcing rule (ii) */
482 0 : }
483 : /* Now figure out how many hashes are needed to "catch up" the hash
484 : count to the current system clock, and clamp it to the allowed
485 : range. */
486 0 : long now = fd_log_wallclock();
487 0 : ulong target_hashcnt;
488 0 : if( FD_LIKELY( poh->state==STATE_FOLLOWER ||poh->state==STATE_WAITING_FOR_SLOT ) ) {
489 0 : target_hashcnt = (ulong)((double)(now - poh->reset_slot_start_ns) / poh->hashcnt_duration_ns) - (poh->slot-poh->reset_slot)*poh->hashcnt_per_slot;
490 0 : } else {
491 0 : FD_TEST( poh->state==STATE_LEADER );
492 0 : target_hashcnt = (ulong)((double)(now - poh->leader_slot_start_ns) / poh->hashcnt_duration_ns);
493 0 : }
494 : /* Clamp to [min_hashcnt, restricted_hashcnt] as above */
495 0 : target_hashcnt = fd_ulong_max( fd_ulong_min( target_hashcnt, restricted_hashcnt ), min_hashcnt );
496 :
497 : /* The above proof showed that it was always possible to pick a value
498 : of target_hashcnt, but we still have a lot of freedom in how to
499 : pick it. It simplifies the code a lot if we don't keep going after
500 : a tick in this function. In particular, we want to publish at most
501 : 1 tick in this call, since otherwise we could consume infinite
502 : credits to publish here. The credits are set so that we should
503 : only ever publish one tick during this loop. Also, all the extra
504 : stuff (leader transitions, publishing ticks, etc.) we have to do
505 : happens at tick boundaries, so this lets us consolidate all those
506 : cases.
507 :
508 : Mathematically, since the current value of hashcnt is h_j+a_j, the
509 : next tick (advancing a full tick if we're currently at a tick) is
510 : t_{j+1} = T*(floor( (h_j+a_j)/T )+1). We need to show that if we set
511 : h'_{j+1} = min( h_{j+1}, t_{j+1} ), it is still valid.
512 :
513 : First, h'_{j+1} <= h_{j+1} <= r_{j+1}, so we're okay in that
514 : direction.
515 :
516 : Next, observe that t_{j+1}>=h_j + a_j + 1, and recall that b_{j+1}
517 : is 0 or 1. So then,
518 : t_{j+1} >= h_j+a_j+b_{j+1} = m_{j+1}.
519 :
520 : We know h_{j+1) >= m_{j+1} from before, so then h'_{j+1} >=
521 : m_{j+1}, as desired. */
522 :
523 0 : ulong next_tick_hashcnt = poh->hashcnt_per_tick * (1UL+(poh->hashcnt/poh->hashcnt_per_tick));
524 0 : target_hashcnt = fd_ulong_min( target_hashcnt, next_tick_hashcnt );
525 :
526 : /* We still need to enforce rule (i). We know that min_hashcnt%T !=
527 : T-1 because of rule (ii). That means that if target_hashcnt%T ==
528 : T-1 at this point, target_hashcnt > min_hashcnt (notice the
529 : strict), so target_hashcnt-1 >= min_hashcnt and is thus still a
530 : valid choice for target_hashcnt. */
531 0 : target_hashcnt -= (ulong)( (!low_power_mode) & ((target_hashcnt%poh->hashcnt_per_tick)==(poh->hashcnt_per_tick-1UL)) );
532 :
533 0 : FD_TEST( target_hashcnt >= poh->hashcnt );
534 0 : FD_TEST( target_hashcnt >= min_hashcnt );
535 0 : FD_TEST( target_hashcnt <= restricted_hashcnt );
536 :
537 0 : if( FD_UNLIKELY( poh->hashcnt==target_hashcnt ) ) return; /* Nothing to do, don't publish a tick twice */
538 :
539 0 : *charge_busy = 1;
540 :
541 0 : if( FD_LIKELY( poh->hashcnt<target_hashcnt ) ) {
542 0 : fd_sha256_hash_32_repeated( poh->hash, poh->hash, target_hashcnt-poh->hashcnt );
543 0 : poh->hashcnt = target_hashcnt;
544 0 : }
545 :
546 0 : if( FD_UNLIKELY( poh->hashcnt==poh->hashcnt_per_slot ) ) {
547 0 : poh->slot++;
548 0 : poh->hashcnt = 0UL;
549 0 : }
550 :
551 0 : switch( poh->state ) {
552 0 : case STATE_LEADER: {
553 0 : if( FD_UNLIKELY( !(poh->hashcnt%poh->hashcnt_per_tick) ) ) {
554 : /* We ticked while leader... send an empty microblock (a tick)
555 : to the shred tile. */
556 0 : publish_tick( poh, stem, poh->hash, 0 );
557 0 : }
558 0 : if( FD_UNLIKELY( poh->slot>poh->next_leader_slot ) ) {
559 : /* We ticked while leader and are no longer leader... transition
560 : the state machine. */
561 0 : FD_TEST( !max_remaining_microblocks );
562 0 : FD_LOG_INFO(( "fd_poh_ticked_outof_leader(slot=%lu)", poh->slot-1UL ));
563 0 : transition_to_follower( poh, stem, 1 );
564 0 : poh->state = STATE_WAITING_FOR_RESET;
565 0 : }
566 0 : break;
567 0 : }
568 0 : case STATE_WAITING_FOR_SLOT:
569 0 : case STATE_FOLLOWER: {
570 0 : if( FD_UNLIKELY( !(poh->hashcnt%poh->hashcnt_per_tick ) ) ) {
571 : /* We finished a tick while not leader... save the current hash
572 : so it can be played back into the bank when we become the
573 : leader. */
574 0 : ulong tick_idx = (poh->slot*poh->ticks_per_slot+poh->hashcnt/poh->hashcnt_per_tick)%MAX_SKIPPED_TICKS;
575 0 : fd_memcpy( poh->skipped_tick_hashes[ tick_idx ], poh->hash, 32UL );
576 :
577 0 : ulong initial_tick_idx = (poh->last_slot*poh->ticks_per_slot+poh->last_hashcnt/poh->hashcnt_per_tick)%MAX_SKIPPED_TICKS;
578 0 : if( FD_UNLIKELY( tick_idx==initial_tick_idx ) ) FD_LOG_ERR(( "Too many skipped ticks from slot %lu to slot %lu, chain must halt", poh->last_slot, poh->slot ));
579 0 : }
580 :
581 0 : FD_TEST( poh->slot<=poh->next_leader_slot );
582 0 : if( FD_UNLIKELY( poh->slot==poh->next_leader_slot ) ) {
583 : /* We ticked while not leader and are now leader... transition
584 : the state machine. */
585 0 : if( FD_LIKELY( poh->state==STATE_FOLLOWER ) ) poh->state = STATE_WAITING_FOR_BANK;
586 0 : else poh->state = STATE_LEADER;
587 0 : }
588 0 : break;
589 0 : }
590 0 : default: {
591 0 : break;
592 0 : }
593 0 : }
594 0 : }
595 :
596 : static void
597 : publish_microblock( fd_poh_t * poh,
598 : fd_stem_context_t * stem,
599 : ulong slot,
600 : ulong hashcnt_delta,
601 : ulong txn_cnt,
602 0 : fd_txn_p_t const * txns ) {
603 0 : uchar * dst = (uchar *)fd_chunk_to_laddr( poh->shred_out->mem, poh->shred_out->chunk );
604 0 : FD_TEST( slot>=poh->reset_slot );
605 0 : fd_entry_batch_meta_t * meta = (fd_entry_batch_meta_t *)dst;
606 0 : meta->parent_offset = 1UL+slot-poh->reset_slot;
607 0 : meta->reference_tick = (poh->hashcnt/poh->hashcnt_per_tick) % poh->ticks_per_slot;
608 0 : meta->block_complete = !poh->hashcnt;
609 :
610 0 : meta->parent_block_id_valid = 1;
611 0 : fd_memcpy( meta->parent_block_id, poh->completed_block_id, 32UL );
612 :
613 0 : dst += sizeof(fd_entry_batch_meta_t);
614 0 : fd_entry_batch_header_t * header = (fd_entry_batch_header_t *)dst;
615 0 : header->hashcnt_delta = hashcnt_delta;
616 0 : fd_memcpy( header->hash, poh->hash, 32UL );
617 :
618 0 : dst += sizeof(fd_entry_batch_header_t);
619 0 : ulong payload_sz = 0UL;
620 0 : ulong included_txn_cnt = 0UL;
621 0 : for( ulong i=0UL; i<txn_cnt; i++ ) {
622 0 : fd_txn_p_t const * txn = txns + i;
623 0 : if( FD_UNLIKELY( !(txn->flags & FD_TXN_P_FLAGS_EXECUTE_SUCCESS) ) ) continue;
624 :
625 0 : fd_memcpy( dst, txn->payload, txn->payload_sz );
626 0 : payload_sz += txn->payload_sz;
627 0 : dst += txn->payload_sz;
628 0 : included_txn_cnt++;
629 0 : }
630 0 : header->txn_cnt = included_txn_cnt;
631 :
632 : /* We always have credits to publish here, because we have a burst
633 : value of 3 credits, and at most we will publish_tick() once and
634 : then publish_became_leader() once, leaving one credit here to
635 : publish the microblock. */
636 0 : ulong tspub = (ulong)fd_frag_meta_ts_comp( fd_tickcount() );
637 0 : ulong sz = sizeof(fd_entry_batch_meta_t)+sizeof(fd_entry_batch_header_t)+payload_sz;
638 0 : ulong new_sig = fd_disco_poh_sig( slot, POH_PKT_TYPE_MICROBLOCK, 0UL );
639 0 : fd_stem_publish( stem, poh->shred_out->idx, new_sig, poh->shred_out->chunk, sz, 0UL, 0UL, tspub );
640 0 : poh->shred_out->chunk = fd_dcache_compact_next( poh->shred_out->chunk, sz, poh->shred_out->chunk0, poh->shred_out->wmark );
641 0 : }
642 :
643 : void
644 : fd_poh1_mixin( fd_poh_t * poh,
645 : fd_stem_context_t * stem,
646 : ulong slot,
647 : uchar const * hash,
648 : ulong txn_cnt,
649 0 : fd_txn_p_t const * txns ) {
650 0 : if( FD_UNLIKELY( slot!=poh->next_leader_slot || slot!=poh->slot ) ) {
651 0 : FD_LOG_ERR(( "packed too early or late slot=%lu, current_slot=%lu", slot, poh->slot ));
652 0 : }
653 :
654 0 : FD_TEST( poh->state==STATE_LEADER );
655 0 : FD_TEST( poh->microblocks_lower_bound<poh->max_microblocks_per_slot );
656 0 : poh->microblocks_lower_bound += 1UL;
657 :
658 0 : ulong executed_txn_cnt = 0UL;
659 0 : for( ulong i=0UL; i<txn_cnt; i++ ) {
660 : /* It's important that we check if a transaction is included in the
661 : block with FD_TXN_P_FLAGS_EXECUTE_SUCCESS since
662 : actual_consumed_cus may have a nonzero value for excluded
663 : transactions used for monitoring purposes */
664 0 : if( FD_LIKELY( txns[ i ].flags & FD_TXN_P_FLAGS_EXECUTE_SUCCESS ) ) {
665 0 : executed_txn_cnt++;
666 0 : }
667 0 : }
668 :
669 : /* We don't publish transactions that fail to execute. If all the
670 : transactions failed to execute, the microblock would be empty,
671 : causing agave to think it's a tick and complain. Instead, we just
672 : skip the microblock and don't hash or update the hashcnt. */
673 0 : if( FD_UNLIKELY( !executed_txn_cnt ) ) return;
674 :
675 0 : uchar data[ 64 ];
676 0 : fd_memcpy( data, poh->hash, 32UL );
677 0 : fd_memcpy( data+32UL, hash, 32UL );
678 0 : fd_sha256_hash( data, 64UL, poh->hash );
679 :
680 0 : poh->hashcnt++;
681 0 : FD_TEST( poh->hashcnt>poh->last_hashcnt );
682 0 : ulong hashcnt_delta = poh->hashcnt - poh->last_hashcnt;
683 :
684 : /* The hashing loop above will never leave us exactly one away from
685 : crossing a tick boundary, so this increment will never cause the
686 : current tick (or the slot) to change, except in low power mode
687 : for development, in which case we do need to register the tick
688 : with the leader bank. We don't need to publish the tick since
689 : sending the microblock below is the publishing action. */
690 0 : if( FD_UNLIKELY( !(poh->hashcnt%poh->hashcnt_per_slot ) ) ) {
691 0 : poh->slot++;
692 0 : poh->hashcnt = 0UL;
693 0 : }
694 :
695 0 : poh->last_slot = poh->slot;
696 0 : poh->last_hashcnt = poh->hashcnt;
697 :
698 0 : if( FD_UNLIKELY( !(poh->hashcnt%poh->hashcnt_per_tick ) ) ) {
699 0 : if( FD_UNLIKELY( poh->slot>poh->next_leader_slot ) ) {
700 : /* We ticked while leader and are no longer leader... transition
701 : the state machine. */
702 0 : transition_to_follower( poh, stem, 1 );
703 0 : poh->state = STATE_WAITING_FOR_RESET;
704 0 : }
705 0 : }
706 :
707 0 : publish_microblock( poh, stem, slot, hashcnt_delta, txn_cnt, txns );
708 0 : }
|