Skip to content

Commit bea22e2

Browse files
authored
Reapply "str-288: parallel encoding with Rayon threadpool and plugin lifecycle management (#661)"
This reverts commit 04c54df. Fix: attach parallel encoding to all broadcast_tx.send() paths.
1 parent 30f4a51 commit bea22e2

8 files changed

Lines changed: 272 additions & 7 deletions

File tree

Cargo.lock

Lines changed: 1 addition & 0 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

Cargo.toml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -54,6 +54,7 @@ prost = "0.14.0"
5454
prost-types = "0.14.0"
5555
prost_011 = { package = "prost", version = "0.11.9" }
5656
protoc-bin-vendored = "3.2.0"
57+
rayon = "1.11.0"
5758
serde = "1.0.145"
5859
serde_json = "1.0.86"
5960
smallvec = "1.15.1"

yellowstone-grpc-geyser/Cargo.toml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -39,6 +39,7 @@ pin-project = { workspace = true }
3939
prometheus = { workspace = true }
4040
prost = { workspace = true }
4141
prost-types = { workspace = true }
42+
rayon = { workspace = true }
4243
serde = { workspace = true }
4344
serde_json = { workspace = true }
4445
thiserror = { workspace = true }

yellowstone-grpc-geyser/src/config.rs

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -200,6 +200,12 @@ pub struct ConfigGrpc {
200200
deserialize_with = "deserialize_int_str"
201201
)]
202202
pub replay_stored_slots: u64,
203+
/// Number of threads for parallel encoding
204+
#[serde(
205+
default = "ConfigGrpc::encoder_threads_default",
206+
deserialize_with = "deserialize_int_str"
207+
)]
208+
pub encoder_threads: usize,
203209
#[serde(default)]
204210
pub server_http2_adaptive_window: Option<bool>,
205211
#[serde(default, with = "humantime_serde")]
@@ -255,6 +261,10 @@ impl ConfigGrpc {
255261
const fn default_replay_stored_slots() -> u64 {
256262
0
257263
}
264+
265+
/// Default worker-thread count for the parallel encoder's rayon pool,
/// used when `encoder_threads` is absent from the gRPC config section.
const fn encoder_threads_default() -> usize {
    4
}
258268
}
259269

260270
#[derive(Debug, Clone, Deserialize)]

yellowstone-grpc-geyser/src/grpc.rs

Lines changed: 14 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,9 @@ use {
44
metered::MeteredLayer,
55
metrics::{
66
self, incr_grpc_method_call_count, set_subscriber_queue_size, DebugClientMessage,
7+
GEYSER_BATCH_SIZE,
78
},
9+
parallel::ParallelEncoder,
810
plugin::{
911
filter::{
1012
limits::FilterLimits,
@@ -495,6 +497,7 @@ impl GrpcService {
495497
is_reload: bool,
496498
service_cancellation_token: CancellationToken,
497499
task_tracker: TaskTracker,
500+
parallel_encoder: ParallelEncoder,
498501
) -> anyhow::Result<(
499502
Option<crossbeam_channel::Sender<Box<Message>>>,
500503
mpsc::UnboundedSender<Message>,
@@ -613,6 +616,7 @@ impl GrpcService {
613616
replay_stored_slots_rx,
614617
replay_first_available_slot,
615618
config.replay_stored_slots,
619+
parallel_encoder,
616620
)
617621
.await;
618622
});
@@ -655,6 +659,7 @@ impl GrpcService {
655659
replay_stored_slots_rx: Option<mpsc::Receiver<ReplayStoredSlotsRequest>>,
656660
replay_first_available_slot: Option<Arc<AtomicU64>>,
657661
replay_stored_slots: u64,
662+
parallel_encoder: ParallelEncoder,
658663
) {
659664
const PROCESSED_MESSAGES_MAX: usize = 31;
660665
const PROCESSED_MESSAGES_SLEEP: Duration = Duration::from_millis(10);
@@ -899,8 +904,10 @@ impl GrpcService {
899904

900905
// processed
901906
processed_messages.push(message.clone());
907+
GEYSER_BATCH_SIZE.observe(processed_messages.len() as f64);
908+
let encoded = parallel_encoder.encode(processed_messages).await;
902909
let _ =
903-
broadcast_tx.send((CommitmentLevel::Processed, processed_messages.into()));
910+
broadcast_tx.send((CommitmentLevel::Processed, encoded.into()));
904911
processed_messages = Vec::with_capacity(PROCESSED_MESSAGES_MAX);
905912
processed_sleep
906913
.as_mut()
@@ -938,8 +945,10 @@ impl GrpcService {
938945
|| !confirmed_messages.is_empty()
939946
|| !finalized_messages.is_empty()
940947
{
948+
GEYSER_BATCH_SIZE.observe(processed_messages.len() as f64);
949+
let encoded = parallel_encoder.encode(processed_messages).await;
941950
let _ = broadcast_tx
942-
.send((CommitmentLevel::Processed, processed_messages.into()));
951+
.send((CommitmentLevel::Processed, encoded.into()));
943952
processed_messages = Vec::with_capacity(PROCESSED_MESSAGES_MAX);
944953
processed_sleep
945954
.as_mut()
@@ -960,7 +969,9 @@ impl GrpcService {
960969
}
961970
() = &mut processed_sleep => {
962971
if !processed_messages.is_empty() {
963-
let _ = broadcast_tx.send((CommitmentLevel::Processed, processed_messages.into()));
972+
GEYSER_BATCH_SIZE.observe(processed_messages.len() as f64);
973+
let encoded = parallel_encoder.encode(processed_messages).await;
974+
let _ = broadcast_tx.send((CommitmentLevel::Processed, encoded.into()));
964975
processed_messages = Vec::with_capacity(PROCESSED_MESSAGES_MAX);
965976
}
966977
processed_sleep.as_mut().reset(Instant::now() + PROCESSED_MESSAGES_SLEEP);

yellowstone-grpc-geyser/src/lib.rs

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,7 @@ pub mod config;
22
pub mod grpc;
33
pub mod metered;
44
pub mod metrics;
5+
pub mod parallel;
56
pub mod plugin;
67
pub mod transport;
78
pub(crate) mod util;
Lines changed: 223 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,223 @@
1+
use {
2+
crate::plugin::{
3+
filter::encoder::{AccountEncoder, TransactionEncoder},
4+
message::Message,
5+
},
6+
rayon::{ThreadPool, ThreadPoolBuilder},
7+
tokio::sync::{mpsc, oneshot},
8+
};
9+
10+
/// Handle for submitting message batches to a dedicated rayon thread pool
/// for pre-encoding. It is only a channel sender, so it is cheap to move
/// into the async task that drives the broadcast loop.
pub struct ParallelEncoder {
    // Requests are forwarded to the bridge thread spawned in `new`; the
    // bridge loop exits once this sender is dropped.
    tx: mpsc::UnboundedSender<EncodeRequest>,
}
13+
14+
/// One unit of work for the encoder bridge: a batch of messages to
/// pre-encode, plus the channel on which the batch is handed back.
struct EncodeRequest {
    // Messages paired with caller-assigned ids; the ids are passed
    // through untouched by the encoder.
    batch: Vec<(u64, Message)>,
    // Fires exactly once, when the bridge has finished encoding; the
    // receiving half lives in `ParallelEncoder::encode`.
    response: oneshot::Sender<Vec<(u64, Message)>>,
}
18+
19+
impl ParallelEncoder {
20+
pub fn new(num_threads: usize) -> (Self, std::thread::JoinHandle<()>) {
21+
let pool = ThreadPoolBuilder::new()
22+
.num_threads(num_threads)
23+
.thread_name(|i| format!("geyser-encoder-{i}"))
24+
.build()
25+
.expect("failed to create rayon pool");
26+
27+
let (tx, rx) = mpsc::unbounded_channel();
28+
29+
let handle = std::thread::Builder::new()
30+
.name("geyser-encoder-bridge".into())
31+
.spawn(move || Self::bridge_loop(rx, pool))
32+
.expect("failed to spawn encoder bridge");
33+
34+
(Self { tx }, handle)
35+
}
36+
37+
fn bridge_loop(mut rx: mpsc::UnboundedReceiver<EncodeRequest>, pool: ThreadPool) {
38+
use rayon::prelude::*;
39+
40+
while let Some(req) = rx.blocking_recv() {
41+
let EncodeRequest {
42+
mut batch,
43+
response,
44+
} = req;
45+
46+
pool.install(|| {
47+
batch.par_iter_mut().for_each(|(_msgid, msg)| {
48+
Self::encode_message(msg);
49+
});
50+
});
51+
52+
let _ = response.send(batch);
53+
}
54+
55+
log::info!("exiting encoder bridge loop");
56+
}
57+
58+
fn encode_message(msg: &Message) {
59+
match msg {
60+
Message::Transaction(tx) => {
61+
if tx.transaction.pre_encoded.get().is_none() {
62+
TransactionEncoder::pre_encode(&tx.transaction);
63+
}
64+
}
65+
Message::Account(acc) => {
66+
if acc.account.pre_encoded.get().is_none() {
67+
AccountEncoder::pre_encode(&acc.account);
68+
}
69+
}
70+
_ => {}
71+
}
72+
}
73+
74+
pub async fn encode(&self, batch: Vec<(u64, Message)>) -> Vec<(u64, Message)> {
75+
if batch.len() < 4 {
76+
return Self::encode_sync(batch);
77+
}
78+
79+
let (tx, rx) = oneshot::channel();
80+
81+
// move batch, don't clone
82+
if self
83+
.tx
84+
.send(EncodeRequest {
85+
batch,
86+
response: tx,
87+
})
88+
.is_err()
89+
{
90+
// channel closed - this shouldn't happen in normal operation
91+
panic!("encoder channel closed");
92+
}
93+
94+
rx.await.expect("encoder response failed")
95+
}
96+
97+
fn encode_sync(mut batch: Vec<(u64, Message)>) -> Vec<(u64, Message)> {
98+
for (_msgid, msg) in &mut batch {
99+
Self::encode_message(msg);
100+
}
101+
batch
102+
}
103+
}
104+
105+
#[cfg(test)]
mod tests {
    use {
        super::*,
        crate::plugin::message::{
            MessageAccount, MessageAccountInfo, MessageTransaction, MessageTransactionInfo,
        },
        bytes::Bytes,
        prost_types::Timestamp,
        solana_pubkey::Pubkey,
        solana_signature::Signature,
        std::{
            sync::{Arc, OnceLock},
            time::SystemTime,
        },
    };

    /// Fixture: a non-vote transaction message whose `pre_encoded` slot is empty.
    fn create_test_transaction() -> Message {
        let info = MessageTransactionInfo {
            signature: Signature::from([1u8; 64]),
            is_vote: false,
            transaction: Default::default(),
            meta: Default::default(),
            index: 0,
            account_keys: Default::default(),
            pre_encoded: OnceLock::new(),
        };
        Message::Transaction(MessageTransaction {
            transaction: Arc::new(info),
            slot: 100,
            created_at: Timestamp::from(SystemTime::now()),
        })
    }

    /// Fixture: an account update message whose `pre_encoded` slot is empty.
    fn create_test_account() -> Message {
        let info = MessageAccountInfo {
            pubkey: Pubkey::new_unique(),
            lamports: 1000,
            owner: Pubkey::new_unique(),
            executable: false,
            rent_epoch: 0,
            data: Bytes::from(vec![1, 2, 3]),
            write_version: 1,
            txn_signature: None,
            pre_encoded: OnceLock::new(),
        };
        Message::Account(MessageAccount {
            account: Arc::new(info),
            slot: 100,
            is_startup: false,
            created_at: Timestamp::from(SystemTime::now()),
        })
    }

    #[tokio::test]
    async fn test_parallel_encoder_transactions() {
        let (encoder, _handle) = ParallelEncoder::new(2);

        let batch = (0..10)
            .map(|i| (i, create_test_transaction()))
            .collect::<Vec<(u64, Message)>>();

        let encoded = encoder.encode(batch).await;
        assert_eq!(encoded.len(), 10);

        for (_msgid, msg) in &encoded {
            if let Message::Transaction(tx) = msg {
                assert!(
                    tx.transaction.pre_encoded.get().is_some(),
                    "transaction should be encoded"
                );
            }
        }
    }

    #[tokio::test]
    async fn test_parallel_encoder_accounts() {
        let (encoder, _handle) = ParallelEncoder::new(2);

        let batch = (0..10)
            .map(|i| (i, create_test_account()))
            .collect::<Vec<(u64, Message)>>();

        let encoded = encoder.encode(batch).await;
        assert_eq!(encoded.len(), 10);

        for (_msgid, msg) in &encoded {
            if let Message::Account(acc) = msg {
                assert!(
                    acc.account.pre_encoded.get().is_some(),
                    "account should be encoded"
                );
            }
        }
    }

    #[tokio::test]
    async fn test_small_batch_uses_sync() {
        let (encoder, _handle) = ParallelEncoder::new(2);

        // Batches below the parallel threshold take the synchronous path.
        let batch = (0..2)
            .map(|i| (i, create_test_transaction()))
            .collect::<Vec<(u64, Message)>>();

        assert_eq!(encoder.encode(batch).await.len(), 2);
    }

    #[tokio::test]
    async fn test_mixed_batch() {
        let (encoder, _handle) = ParallelEncoder::new(2);

        // Interleave transactions and accounts with even/odd ids.
        let batch: Vec<(u64, Message)> = (0..5)
            .flat_map(|i| {
                [
                    (i * 2, create_test_transaction()),
                    (i * 2 + 1, create_test_account()),
                ]
            })
            .collect();

        assert_eq!(encoder.encode(batch).await.len(), 10);
    }
}

0 commit comments

Comments
 (0)