LCOV - code coverage report
Current view: top level - disco/dedup - fd_dedup_tile.c (source / functions) Hit Total Coverage
Test: cov.lcov Lines: 0 155 0.0 %
Date: 2025-09-18 04:41:32 Functions: 0 9 0.0 %

          Line data    Source code
       1             : #include "../tiles.h"
       2             : 
       3             : #include "generated/fd_dedup_tile_seccomp.h"
       4             : 
       5             : #include "../verify/fd_verify_tile.h"
       6             : #include "../metrics/fd_metrics.h"
       7             : 
       8             : #include <linux/unistd.h>
       9             : 
      10             : /* fd_dedup provides services to deduplicate multiple streams of input
      11             :    fragments and present them to a mix of reliable and unreliable
      12             :    consumers as though they were generated by a single multi-stream
      13             :    producer. */
      14             : 
      15           0 : #define IN_KIND_GOSSIP       (0UL)
      16           0 : #define IN_KIND_VERIFY       (1UL)
      17           0 : #define IN_KIND_EXECUTED_TXN (2UL)
      18             : 
      19             : /* fd_dedup_in_ctx_t is a context object for each in (producer) mcache
      20             :    connected to the dedup tile. */
      21             : 
      22             : typedef struct {
      23             :   fd_wksp_t * mem;
      24             :   ulong       chunk0;
      25             :   ulong       wmark;
      26             :   ulong       mtu;
      27             : } fd_dedup_in_ctx_t;
      28             : 
      29             : /* fd_dedup_ctx_t is the context object provided to callbacks from
      30             :    fd_stem, and contains all state needed to progress the tile. */
      31             : 
      32             : typedef struct {
      33             :   ulong   tcache_depth;   /* == fd_tcache_depth( tcache ), depth of this dedups's tcache (const) */
      34             :   ulong   tcache_map_cnt; /* == fd_tcache_map_cnt( tcache ), number of slots to use for tcache map (const) */
      35             :   ulong * tcache_sync;    /* == fd_tcache_oldest_laddr( tcache ), local join to the oldest key in the tcache */
      36             :   ulong * tcache_ring;
      37             :   ulong * tcache_map;
      38             : 
      39             :   ulong             in_kind[ 64UL ];
      40             :   fd_dedup_in_ctx_t in[ 64UL ];
      41             : 
      42             :   int   bundle_failed;
      43             :   ulong bundle_id;
      44             :   ulong bundle_idx;
      45             :   uchar bundle_signatures[ 4UL ][ 64UL ];
      46             : 
      47             :   fd_wksp_t * out_mem;
      48             :   ulong       out_chunk0;
      49             :   ulong       out_wmark;
      50             :   ulong       out_chunk;
      51             : 
      52             :   ulong       hashmap_seed;
      53             : 
      54             :   struct {
      55             :     ulong bundle_peer_failure_cnt;
      56             :     ulong dedup_fail_cnt;
      57             :   } metrics;
      58             : } fd_dedup_ctx_t;
      59             : 
      60             : FD_FN_CONST static inline ulong
      61           0 : scratch_align( void ) {
      62           0 :   return alignof( fd_dedup_ctx_t );
      63           0 : }
      64             : 
      65             : FD_FN_PURE static inline ulong
      66           0 : scratch_footprint( fd_topo_tile_t const * tile ) {
      67           0 :   ulong l = FD_LAYOUT_INIT;
      68           0 :   l = FD_LAYOUT_APPEND( l, alignof( fd_dedup_ctx_t ), sizeof( fd_dedup_ctx_t ) );
      69           0 :   l = FD_LAYOUT_APPEND( l, fd_tcache_align(), fd_tcache_footprint( tile->dedup.tcache_depth, 0UL ) );
      70           0 :   return FD_LAYOUT_FINI( l, scratch_align() );
      71           0 : }
      72             : 
      73             : static inline void
      74           0 : metrics_write( fd_dedup_ctx_t * ctx ) {
      75           0 :   FD_MCNT_SET( DEDUP, TRANSACTION_BUNDLE_PEER_FAILURE, ctx->metrics.bundle_peer_failure_cnt );
      76           0 :   FD_MCNT_SET( DEDUP, TRANSACTION_DEDUP_FAILURE,       ctx->metrics.dedup_fail_cnt );
      77           0 : }
      78             : 
      79             : /* during_frag is called between pairs for sequence number checks, as
      80             :    we are reading incoming frags.  We don't actually need to copy the
      81             :    fragment here, flow control prevents it getting overrun, and
      82             :    downstream consumers could reuse the same chunk and workspace to
      83             :    improve performance.
      84             : 
      85             :    The bounds checking and copying here are defensive measures,
      86             : 
      87             :     * In a functioning system, the bounds checking should never fail,
      88             :       but we want to prevent an attacker with code execution on a producer
      89             :       tile from trivially being able to jump to a consumer tile with
      90             :       out of bounds chunks.
      91             : 
      92             :     * For security reasons, we have chosen to isolate all workspaces from
      93             :       one another, so for example, if the QUIC tile is compromised with
      94             :       RCE, it cannot wait until the sigverify tile has verified a transaction,
      95             :       and then overwrite the transaction while it's being processed by the
      96             :       banking stage. */
      97             : 
      98             : static inline void
      99             : during_frag( fd_dedup_ctx_t * ctx,
     100             :              ulong            in_idx,
     101             :              ulong            seq FD_PARAM_UNUSED,
     102             :              ulong            sig FD_PARAM_UNUSED,
     103             :              ulong            chunk,
     104             :              ulong            sz,
     105           0 :              ulong            ctl FD_PARAM_UNUSED ) {
     106             : 
     107           0 :   if( FD_UNLIKELY( chunk<ctx->in[ in_idx ].chunk0 || chunk>ctx->in[ in_idx ].wmark || sz>ctx->in[ in_idx ].mtu ) )
     108           0 :     FD_LOG_ERR(( "chunk %lu %lu corrupt, not in range [%lu,%lu]", chunk, sz, ctx->in[ in_idx ].chunk0, ctx->in[ in_idx ].wmark ));
     109             : 
     110           0 :   uchar * src = (uchar *)fd_chunk_to_laddr( ctx->in[ in_idx ].mem, chunk );
     111           0 :   uchar * dst = (uchar *)fd_chunk_to_laddr( ctx->out_mem, ctx->out_chunk );
     112             : 
     113           0 :   if( FD_UNLIKELY( ctx->in_kind[ in_idx ]==IN_KIND_GOSSIP ) ) {
     114           0 :     if( FD_UNLIKELY( sz>FD_TPU_RAW_MTU ) ) FD_LOG_ERR(( "received a gossip transaction that was too large" ));
     115           0 :     fd_memcpy( dst, src, sz );
     116             : 
     117           0 :     fd_txn_m_t const * txnm = (fd_txn_m_t const *)dst;
     118           0 :     if( FD_UNLIKELY( txnm->payload_sz>FD_TPU_MTU ) ) {
     119           0 :       FD_LOG_ERR(( "vote txn payload size %hu exceeds max %lu", txnm->payload_sz, FD_TPU_MTU ));
     120           0 :     }
     121           0 :   } else if( FD_UNLIKELY( ctx->in_kind[ in_idx ]==IN_KIND_EXECUTED_TXN ) ) {
     122           0 :     if( FD_UNLIKELY( sz!=FD_TXN_SIGNATURE_SZ ) ) FD_LOG_ERR(( "received an executed transaction signature message with the wrong size %lu", sz ));
     123             :     /* Executed txns just have their signature inserted into the tcache
     124             :        so we can dedup them easily. */
     125           0 :     ulong ha_dedup_tag = fd_hash( ctx->hashmap_seed, src+FD_TXN_SIGNATURE_SZ, FD_TXN_SIGNATURE_SZ );
     126           0 :     int _is_dup;
     127           0 :     FD_TCACHE_INSERT( _is_dup, *ctx->tcache_sync, ctx->tcache_ring, ctx->tcache_depth, ctx->tcache_map, ctx->tcache_map_cnt, ha_dedup_tag );
     128           0 :     (void)_is_dup;
     129           0 :   } else {
     130           0 :     fd_memcpy( dst, src, sz );
     131           0 :   }
     132           0 : }
     133             : 
     134             : /* After the transaction has been fully received, and we know we were
     135             :    not overrun while reading it, check if it's a duplicate of a prior
     136             :    transaction.
     137             : 
     138             :    If the transaction came in from the gossip link, then it hasn't been
     139             :    parsed by us.  So parse it here if necessary. */
     140             : 
     141             : static inline void
     142             : after_frag( fd_dedup_ctx_t *    ctx,
     143             :             ulong               in_idx,
     144             :             ulong               seq,
     145             :             ulong               sig,
     146             :             ulong               sz,
     147             :             ulong               tsorig,
     148             :             ulong               _tspub,
     149           0 :             fd_stem_context_t * stem ) {
     150           0 :   (void)seq;
     151           0 :   (void)sig;
     152           0 :   (void)sz;
     153           0 :   (void)_tspub;
     154             : 
     155           0 :   if( FD_UNLIKELY( ctx->in_kind[ in_idx ]==IN_KIND_EXECUTED_TXN ) ) return;
     156             : 
     157           0 :   fd_txn_m_t * txnm = (fd_txn_m_t *)fd_chunk_to_laddr( ctx->out_mem, ctx->out_chunk );
     158           0 :   FD_TEST( txnm->payload_sz<=FD_TPU_MTU );
     159           0 :   fd_txn_t * txn = fd_txn_m_txn_t( txnm );
     160             : 
     161           0 :   if( FD_UNLIKELY( txnm->block_engine.bundle_id && (txnm->block_engine.bundle_id!=ctx->bundle_id) ) ) {
     162           0 :     ctx->bundle_failed = 0;
     163           0 :     ctx->bundle_id     = txnm->block_engine.bundle_id;
     164           0 :     ctx->bundle_idx    = 0UL;
     165           0 :   }
     166             : 
     167           0 :   if( FD_UNLIKELY( txnm->block_engine.bundle_id && ctx->bundle_failed ) ) {
     168           0 :     ctx->metrics.bundle_peer_failure_cnt++;
     169           0 :     return;
     170           0 :   }
     171             : 
     172           0 :   if( FD_UNLIKELY( ctx->in_kind[ in_idx ]==IN_KIND_GOSSIP ) ) {
     173             :     /* Transactions coming in from these links are not parsed.
     174             : 
     175             :        We'll need to parse it so it's ready for downstream consumers.
     176             :        Equally importantly, we need to parse to extract the signature
     177             :        for dedup.  Just parse it right into the output dcache. */
     178           0 :     txnm->txn_t_sz = (ushort)fd_txn_parse( fd_txn_m_payload( txnm ), txnm->payload_sz, txn, NULL );
     179           0 :     if( FD_UNLIKELY( !txnm->txn_t_sz ) ) FD_LOG_ERR(( "fd_txn_parse failed for vote transactions that should have been sigverified" ));
     180             : 
     181           0 :     FD_MCNT_INC( DEDUP, GOSSIPED_VOTES_RECEIVED, 1UL );
     182           0 :   }
     183             : 
     184           0 :   int is_dup = 0;
     185           0 :   if( FD_LIKELY( !txnm->block_engine.bundle_id ) ) {
     186             :     /* Compute fd_hash(signature) for dedup. */
     187           0 :     ulong ha_dedup_tag = fd_hash( ctx->hashmap_seed, fd_txn_m_payload( txnm )+txn->signature_off, 64UL );
     188             : 
     189           0 :     FD_TCACHE_INSERT( is_dup, *ctx->tcache_sync, ctx->tcache_ring, ctx->tcache_depth, ctx->tcache_map, ctx->tcache_map_cnt, ha_dedup_tag );
     190           0 :   } else {
     191             :     /* Make sure bundles don't contain a duplicate transaction inside
     192             :        the bundle, which would not be valid. */
     193             : 
     194           0 :     if( FD_UNLIKELY( ctx->bundle_idx>4UL ) ) FD_LOG_ERR(( "bundle_idx %lu > 4", ctx->bundle_idx ));
     195             : 
     196           0 :     for( ulong i=0UL; i<ctx->bundle_idx; i++ ) {
     197           0 :       if( !memcmp( ctx->bundle_signatures[ i ], fd_txn_m_payload( txnm )+txn->signature_off, 64UL ) ) {
     198           0 :         is_dup = 1;
     199           0 :         break;
     200           0 :       }
     201           0 :     }
     202             : 
     203           0 :     if( FD_UNLIKELY( ctx->bundle_idx==4UL ) ) ctx->bundle_idx++;
     204           0 :     else fd_memcpy( ctx->bundle_signatures[ ctx->bundle_idx++ ], fd_txn_m_payload( txnm )+txn->signature_off, 64UL );
     205           0 :   }
     206             : 
     207           0 :   if( FD_LIKELY( is_dup ) ) {
     208           0 :     if( FD_UNLIKELY( txnm->block_engine.bundle_id ) ) ctx->bundle_failed = 1;
     209             : 
     210           0 :     ctx->metrics.dedup_fail_cnt++;
     211           0 :   } else {
     212           0 :     ulong realized_sz = fd_txn_m_realized_footprint( txnm, 1, 0 );
     213           0 :     ulong tspub = (ulong)fd_frag_meta_ts_comp( fd_tickcount() );
     214           0 :     fd_stem_publish( stem, 0UL, 0, ctx->out_chunk, realized_sz, 0UL, tsorig, tspub );
     215           0 :     ctx->out_chunk = fd_dcache_compact_next( ctx->out_chunk, realized_sz, ctx->out_chunk0, ctx->out_wmark );
     216           0 :   }
     217           0 : }
     218             : 
     219             : static void
     220             : privileged_init( fd_topo_t *      topo,
     221           0 :                  fd_topo_tile_t * tile ) {
     222           0 :   void * scratch = fd_topo_obj_laddr( topo, tile->tile_obj_id );
     223             : 
     224           0 :   FD_SCRATCH_ALLOC_INIT( l, scratch );
     225           0 :   fd_dedup_ctx_t * ctx = FD_SCRATCH_ALLOC_APPEND( l, alignof( fd_dedup_ctx_t ), sizeof( fd_dedup_ctx_t ) );
     226           0 :   FD_TEST( fd_rng_secure( &ctx->hashmap_seed, 8U ) );
     227           0 : }
     228             : 
     229             : static void
     230             : unprivileged_init( fd_topo_t *      topo,
     231           0 :                    fd_topo_tile_t * tile ) {
     232           0 :   void * scratch = fd_topo_obj_laddr( topo, tile->tile_obj_id );
     233             : 
     234           0 :   FD_SCRATCH_ALLOC_INIT( l, scratch );
     235           0 :   fd_dedup_ctx_t * ctx = FD_SCRATCH_ALLOC_APPEND( l, alignof( fd_dedup_ctx_t ), sizeof( fd_dedup_ctx_t ) );
     236           0 :   fd_tcache_t * tcache = fd_tcache_join( fd_tcache_new( FD_SCRATCH_ALLOC_APPEND( l, fd_tcache_align(), fd_tcache_footprint( tile->dedup.tcache_depth, 0) ), tile->dedup.tcache_depth, 0 ) );
     237           0 :   if( FD_UNLIKELY( !tcache ) ) FD_LOG_ERR(( "fd_tcache_new failed" ));
     238             : 
     239           0 :   ctx->bundle_failed = 0;
     240           0 :   ctx->bundle_id     = 0UL;
     241           0 :   ctx->bundle_idx    = 0UL;
     242             : 
     243           0 :   memset( &ctx->metrics, 0, sizeof( ctx->metrics ) );
     244             : 
     245           0 :   ctx->tcache_depth   = fd_tcache_depth       ( tcache );
     246           0 :   ctx->tcache_map_cnt = fd_tcache_map_cnt     ( tcache );
     247           0 :   ctx->tcache_sync    = fd_tcache_oldest_laddr( tcache );
     248           0 :   ctx->tcache_ring    = fd_tcache_ring_laddr  ( tcache );
     249           0 :   ctx->tcache_map     = fd_tcache_map_laddr   ( tcache );
     250             : 
     251           0 :   FD_TEST( tile->in_cnt<=sizeof( ctx->in )/sizeof( ctx->in[ 0 ] ) );
     252           0 :   for( ulong i=0UL; i<tile->in_cnt; i++ ) {
     253           0 :     fd_topo_link_t * link = &topo->links[ tile->in_link_id[ i ] ];
     254           0 :     fd_topo_wksp_t * link_wksp = &topo->workspaces[ topo->objs[ link->dcache_obj_id ].wksp_id ];
     255             : 
     256           0 :     ctx->in[i].mem    = link_wksp->wksp;
     257           0 :     ctx->in[i].mtu    = link->mtu;
     258           0 :     ctx->in[i].chunk0 = fd_dcache_compact_chunk0( ctx->in[i].mem, link->dcache );
     259           0 :     ctx->in[i].wmark  = fd_dcache_compact_wmark ( ctx->in[i].mem, link->dcache, link->mtu );
     260             : 
     261           0 :     if( !strcmp( link->name, "gossip_dedup" ) ) {
     262           0 :       ctx->in_kind[ i ] = IN_KIND_GOSSIP;
     263           0 :     } else if( !strcmp( link->name, "verify_dedup" ) ) {
     264           0 :       ctx->in_kind[ i ] = IN_KIND_VERIFY;
     265           0 :     } else if( !strcmp( link->name, "executed_txn" ) ) {
     266           0 :       ctx->in_kind[ i ] = IN_KIND_EXECUTED_TXN;
     267           0 :     } else {
     268           0 :       FD_LOG_ERR(( "unexpected link name %s", link->name ));
     269           0 :     }
     270           0 :   }
     271             : 
     272           0 :   ctx->out_mem    = topo->workspaces[ topo->objs[ topo->links[ tile->out_link_id[ 0 ] ].dcache_obj_id ].wksp_id ].wksp;
     273           0 :   ctx->out_chunk0 = fd_dcache_compact_chunk0( ctx->out_mem, topo->links[ tile->out_link_id[ 0 ] ].dcache );
     274           0 :   ctx->out_wmark  = fd_dcache_compact_wmark ( ctx->out_mem, topo->links[ tile->out_link_id[ 0 ] ].dcache, topo->links[ tile->out_link_id[ 0 ] ].mtu );
     275           0 :   ctx->out_chunk  = ctx->out_chunk0;
     276             : 
     277           0 :   ulong scratch_top = FD_SCRATCH_ALLOC_FINI( l, 1UL );
     278           0 :   if( FD_UNLIKELY( scratch_top > (ulong)scratch + scratch_footprint( tile ) ) )
     279           0 :     FD_LOG_ERR(( "scratch overflow %lu %lu %lu", scratch_top - (ulong)scratch - scratch_footprint( tile ), scratch_top, (ulong)scratch + scratch_footprint( tile ) ));
     280           0 : }
     281             : 
     282             : static ulong
     283             : populate_allowed_seccomp( fd_topo_t const *      topo,
     284             :                           fd_topo_tile_t const * tile,
     285             :                           ulong                  out_cnt,
     286           0 :                           struct sock_filter *   out ) {
     287           0 :   (void)topo;
     288           0 :   (void)tile;
     289             : 
     290           0 :   populate_sock_filter_policy_fd_dedup_tile( out_cnt, out, (uint)fd_log_private_logfile_fd() );
     291           0 :   return sock_filter_policy_fd_dedup_tile_instr_cnt;
     292           0 : }
     293             : 
     294             : static ulong
     295             : populate_allowed_fds( fd_topo_t const *      topo,
     296             :                       fd_topo_tile_t const * tile,
     297             :                       ulong                  out_fds_cnt,
     298           0 :                       int *                  out_fds ) {
     299           0 :   (void)topo;
     300           0 :   (void)tile;
     301             : 
     302           0 :   if( FD_UNLIKELY( out_fds_cnt<2UL ) ) FD_LOG_ERR(( "out_fds_cnt %lu", out_fds_cnt ));
     303             : 
     304           0 :   ulong out_cnt = 0UL;
     305           0 :   out_fds[ out_cnt++ ] = 2; /* stderr */
     306           0 :   if( FD_LIKELY( -1!=fd_log_private_logfile_fd() ) )
     307           0 :     out_fds[ out_cnt++ ] = fd_log_private_logfile_fd(); /* logfile */
     308           0 :   return out_cnt;
     309           0 : }
     310             : 
     311           0 : #define STEM_BURST (1UL)
     312             : 
     313           0 : #define STEM_CALLBACK_CONTEXT_TYPE  fd_dedup_ctx_t
     314           0 : #define STEM_CALLBACK_CONTEXT_ALIGN alignof(fd_dedup_ctx_t)
     315             : 
     316           0 : #define STEM_CALLBACK_METRICS_WRITE metrics_write
     317           0 : #define STEM_CALLBACK_DURING_FRAG   during_frag
     318           0 : #define STEM_CALLBACK_AFTER_FRAG    after_frag
     319             : 
     320             : #include "../stem/fd_stem.c"
     321             : 
     322             : fd_topo_run_tile_t fd_tile_dedup = {
     323             :   .name                     = "dedup",
     324             :   .populate_allowed_seccomp = populate_allowed_seccomp,
     325             :   .populate_allowed_fds     = populate_allowed_fds,
     326             :   .scratch_align            = scratch_align,
     327             :   .scratch_footprint        = scratch_footprint,
     328             :   .privileged_init          = privileged_init,
     329             :   .unprivileged_init        = unprivileged_init,
     330             :   .run                      = stem_run,
     331             : };

Generated by: LCOV version 1.14