flatten transaction sending (untested)

Bryan Stitt 2022-05-28 04:26:24 +00:00
parent 4335d2120e
commit 588a6c7924
5 changed files with 101 additions and 108 deletions
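
In short: instead of spawning a task for the private-rpc fan-out and taking whatever lands on a flume channel first, the caller now awaits a single method that returns the most common response. A condensed sketch of the shape change, using names from the diff below (illustrative only, not compilable against the real crate):

// before: spawn + bounded channel, first response wins
// let (tx, rx) = flume::bounded(1);
// task::spawn(async move {
//     connections.try_send_parallel_requests(handles, method, params, tx).await
// });
// let first_response = rx.recv_async().await?;

// after: one awaited call, most common response wins
// return self.private_rpcs.try_send_all_upstream_servers(request).await;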

View File

@@ -15,6 +15,7 @@ pub struct RedisCellClient {
 impl RedisCellClient {
     // todo: seems like this could be derived
+    // TODO: take something generic for conn
     pub fn new(
         conn: MultiplexedConnection,
         key: String,

View File

@@ -1,5 +1,7 @@
 mod client;
 
 pub use client::RedisCellClient;
+pub use redis;
+// TODO: don't hard code MultiplexedConnection
 pub use redis::aio::MultiplexedConnection;
 pub use redis::Client;
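
The TODOs here and in the client.rs hunk above point at the same change: stop hard-coding MultiplexedConnection. A minimal sketch of one way to do it, assuming redis-rs's async redis::aio::ConnectionLike trait as the bound; the fields mirror the client struct shown earlier, everything else is hypothetical:

use redis::aio::ConnectionLike;

// generic over any async redis connection instead of MultiplexedConnection
pub struct RedisCellClient<C: ConnectionLike> {
    conn: C,
    key: String,
}

impl<C: ConnectionLike> RedisCellClient<C> {
    pub fn new(conn: C, key: String) -> Self {
        Self { conn, key }
    }
}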

View File

@@ -1,3 +1,4 @@
+# A redis server with the libredis_cell module installed
 FROM rust:1-bullseye as builder
 
 WORKDIR /usr/src/redis-cell

View File

@@ -242,65 +242,14 @@ impl Web3ProxyApp {
         for _i in 0..10usize {
             // // TODO: add more to this span
             // let span = info_span!("i", ?i);
-            // let _enter = span.enter();
+            // let _enter = span.enter(); // DO NOT ENTER! we can't use enter across awaits! (clippy lint soon)
             if request.method == "eth_sendRawTransaction" {
                 // there are private rpcs configured and the request is eth_sendSignedTransaction. send to all private rpcs
                 // TODO: think more about this lock. i think it won't actually help the herd. it probably makes it worse if we have a tight lag_limit
-                match self.private_rpcs.get_upstream_servers().await {
-                    Ok(active_request_handles) => {
-                        // TODO: refactor this to block until it has responses from all and also to return the most common success response
-                        // TODO: i don't think we need to spawn it if we do that.
-                        let (tx, rx) = flume::bounded(1);
-
-                        let connections = self.private_rpcs.clone();
-                        let method = request.method.clone();
-                        let params = request.params.clone();
-
-                        // TODO: benchmark this compared to waiting on unbounded futures
-                        // TODO: do something with this handle?
-                        // TODO:
-                        task::Builder::default()
-                            .name("try_send_parallel_requests")
-                            .spawn(async move {
-                                connections
-                                    .try_send_parallel_requests(
-                                        active_request_handles,
-                                        method,
-                                        params,
-                                        tx,
-                                    )
-                                    .await
-                            });
-
-                        // wait for the first response
-                        // TODO: we don't want the first response. we want the quorum response
-                        let backend_response = rx.recv_async().await?;
-
-                        if let Ok(backend_response) = backend_response {
-                            // TODO: i think we
-                            let response = JsonRpcForwardedResponse {
-                                jsonrpc: "2.0".to_string(),
-                                id: request.id,
-                                result: Some(backend_response),
-                                error: None,
-                            };
-                            return Ok(response);
-                        }
-                    }
-                    Err(None) => {
-                        // TODO: return a 502?
-                        // TODO: i don't think this will ever happen
-                        return Err(anyhow::anyhow!("no private rpcs!"));
-                    }
-                    Err(Some(retry_after)) => {
-                        // TODO: move this to a helper function
-                        // sleep (TODO: with a lock?) until our rate limits should be available
-                        // TODO: if a server catches up sync while we are waiting, we could stop waiting
-                        sleep(retry_after).await;
-
-                        warn!("All rate limits exceeded. Sleeping");
-                    }
-                };
+                return self
+                    .private_rpcs
+                    .try_send_all_upstream_servers(request)
+                    .await;
             } else {
                 // this is not a private transaction (or no private relays are configured)

@@ -353,6 +302,7 @@ impl Web3ProxyApp {
             }
         }
 
+        // TODO: move this whole match to a function on self.balanced_rpcs
         match self.balanced_rpcs.next_upstream_server().await {
             Ok(active_request_handle) => {
                 let response = active_request_handle
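
The new "DO NOT ENTER" comment above is a real tracing footgun: a span.enter() guard held across an .await can attach events to the wrong span once the task yields. A minimal sketch of the bug and the idiomatic fix with tracing::Instrument (do_work is a hypothetical helper):

use tracing::{info_span, Instrument};

async fn do_work() {}

async fn buggy() {
    let span = info_span!("request");
    let _enter = span.enter(); // guard held across the await below: events can land in the wrong span
    do_work().await;
}

async fn fixed() {
    let span = info_span!("request");
    // the span is entered only while the future is actually polled
    do_work().instrument(span).await;
}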

View File

@@ -1,7 +1,8 @@
 ///! Load balanced communication with a group of web3 providers
 use arc_swap::ArcSwap;
+use counter::Counter;
 use derive_more::From;
-use ethers::prelude::H256;
+use ethers::prelude::{ProviderError, H256};
 use futures::future::join_all;
 use futures::stream::FuturesUnordered;
 use futures::StreamExt;
@@ -15,11 +16,13 @@ use std::fmt;
 use std::sync::Arc;
 use std::time::Duration;
 use tokio::task;
+use tokio::time::sleep;
 use tracing::Instrument;
 use tracing::{debug, info, info_span, instrument, trace, warn};
 
 use crate::config::Web3ConnectionConfig;
 use crate::connection::{ActiveRequestHandle, Web3Connection};
+use crate::jsonrpc::{JsonRpcForwardedResponse, JsonRpcRequest};
 
 // Serialize so we can print it on our debug endpoint
 #[derive(Clone, Default, Serialize)]
@@ -155,70 +158,61 @@ impl Web3Connections {
         *self.synced_connections.load().get_head_block_hash()
     }
 
-    /// Send the same request to all the handles. Returning the fastest successful result.
+    /// Send the same request to all the handles. Returning the most common success or most common error.
     #[instrument(skip_all)]
     pub async fn try_send_parallel_requests(
-        self: Arc<Self>,
+        &self,
         active_request_handles: Vec<ActiveRequestHandle>,
-        method: String,
-        params: Option<Box<RawValue>>,
-        response_sender: flume::Sender<anyhow::Result<Box<RawValue>>>,
-    ) -> anyhow::Result<()> {
+        method: &str,
+        // TODO: remove this box once i figure out how to do the options
+        params: Option<&RawValue>,
+    ) -> Result<Box<RawValue>, ProviderError> {
         // TODO: if only 1 active_request_handles, do self.try_send_request
-        let mut unordered_futures = FuturesUnordered::new();
-
-        for active_request_handle in active_request_handles {
-            // clone things so we can pass them to a future
-            let method = method.clone();
-            let params = params.clone();
-            let response_sender = response_sender.clone();
-
-            let handle = task::Builder::default()
-                .name("send_request")
-                .spawn(async move {
-                    let response: Box<RawValue> =
-                        active_request_handle.request(&method, &params).await?;
-
-                    // send the first good response to a one shot channel. that way we respond quickly
-                    // drop the result because errors are expected after the first send
-                    response_sender
-                        .send_async(Ok(response))
-                        .await
-                        .map_err(Into::into)
-                });
-
-            unordered_futures.push(handle);
-        }
-
-        // TODO: use iterators instead of pushing into a vec?
-        let mut errs = vec![];
-        if let Some(x) = unordered_futures.next().await {
-            match x.unwrap() {
-                Ok(_) => {}
-                Err(e) => {
-                    // TODO: better errors
-                    warn!("Got an error sending request: {}", e);
-                    errs.push(e);
-                }
-            }
-        }
-
-        // get the first error (if any)
-        // TODO: why collect multiple errors if we only pop one?
-        let e = if !errs.is_empty() {
-            Err(errs.pop().unwrap())
-        } else {
-            Err(anyhow::anyhow!("no successful responses"))
-        };
-
-        // send the error to the channel
-        if response_sender.send_async(e).await.is_ok() {
-            // if we were able to send an error, then we never sent a success
-            return Err(anyhow::anyhow!("no successful responses"));
-        } else {
-            // if sending the error failed. the other side must be closed (which means we sent a success earlier)
-            Ok(())
-        }
+        let responses = active_request_handles
+            .into_iter()
+            .map(|active_request_handle| async move {
+                let result: Result<Box<RawValue>, _> =
+                    active_request_handle.request(method, params).await;
+                result
+            })
+            .collect::<FuturesUnordered<_>>()
+            .collect::<Vec<Result<Box<RawValue>, ProviderError>>>()
+            .await;
+
+        // TODO: Strings are not great keys, but we can't use RawValue or ProviderError as keys
+        let mut count_map: HashMap<String, Result<Box<RawValue>, ProviderError>> = HashMap::new();
+        let mut counts: Counter<String> = Counter::new();
+        let mut any_ok = false;
+        for response in responses {
+            let s = format!("{:?}", response);
+
+            if count_map.get(&s).is_none() {
+                if response.is_ok() {
+                    any_ok = true;
+                }
+
+                count_map.insert(s.clone(), response);
+            }
+
+            counts.update([s].into_iter());
+        }
+
+        for (most_common, _) in counts.most_common_ordered() {
+            // TODO: how do we take this?
+            let most_common = count_map.remove(&most_common).unwrap();
+
+            if any_ok && most_common.is_err() {
+                // errors were more common, but we are going to skip them because we got an okay
+                continue;
+            } else {
+                // return the most common
+                return most_common;
+            }
+        }
+
+        // TODO: what should we do if we get here? i don't think we will
+        panic!("i don't think this is possible")
     }
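
The counting scheme above leans on the counter crate this commit imports. A small standalone sketch of the same idea, with stringified responses standing in for Debug-formatted backend results:

use counter::Counter;

fn main() {
    // pretend these are Debug-formatted backend responses
    let responses = ["0x1", "0x1", "0x2"];

    let mut counts: Counter<String> = Counter::new();
    for r in responses {
        counts.update([r.to_string()].into_iter());
    }

    // most_common_ordered() yields (value, count) pairs, highest count first
    for (response, count) in counts.most_common_ordered() {
        println!("{response} seen {count} times");
    }
}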
     /// TODO: possible dead lock here. investigate more. probably refactor

@@ -440,4 +434,49 @@ impl Web3Connections {
         // return the earliest retry_after (if no rpcs are synced, this will be None)
         Err(earliest_retry_after)
     }
+
+    pub async fn try_send_all_upstream_servers(
+        &self,
+        request: JsonRpcRequest,
+    ) -> anyhow::Result<JsonRpcForwardedResponse> {
+        // TODO: timeout on this loop
+        loop {
+            match self.get_upstream_servers().await {
+                Ok(active_request_handles) => {
+                    // TODO: benchmark this compared to waiting on unbounded futures
+                    // TODO: do something with this handle?
+                    // TODO: this is not working right. simplify
+                    let quorum_response = self
+                        .try_send_parallel_requests(
+                            active_request_handles,
+                            request.method.as_ref(),
+                            request.params.as_deref(),
+                        )
+                        .await?;
+
+                    let response = JsonRpcForwardedResponse {
+                        jsonrpc: "2.0".to_string(),
+                        id: request.id,
+                        result: Some(quorum_response),
+                        error: None,
+                    };
+
+                    return Ok(response);
+                }
+                Err(None) => {
+                    // TODO: return a 502?
+                    // TODO: i don't think this will ever happen
+                    return Err(anyhow::anyhow!("no private rpcs!"));
+                }
+                Err(Some(retry_after)) => {
+                    // TODO: move this to a helper function
+                    // sleep (TODO: with a lock?) until our rate limits should be available
+                    // TODO: if a server catches up sync while we are waiting, we could stop waiting
+                    sleep(retry_after).await;
+
+                    warn!("All rate limits exceeded. Sleeping");
+                }
+            }
+        }
+    }
 }
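
On the "TODO: timeout on this loop" in the new method: one option is bounding the whole retry loop with tokio::time::timeout at the call site. A sketch under that assumption; the one-second budget and the stand-in future are illustrative only:

use std::time::Duration;
use tokio::time::{sleep, timeout};

// stand-in for try_send_all_upstream_servers: retries forever while rate limited
async fn retry_forever() -> anyhow::Result<String> {
    loop {
        sleep(Duration::from_millis(100)).await;
    }
}

#[tokio::main]
async fn main() -> anyhow::Result<()> {
    match timeout(Duration::from_secs(1), retry_forever()).await {
        Ok(response) => println!("sent: {}", response?),
        // Err fires when the deadline elapses before the inner future completes
        Err(_elapsed) => println!("gave up: rate limits never cleared"),
    }
    Ok(())
}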