web3-proxy/web3-proxy/src/connections.rs

//! Load balanced communication with a group of web3 providers
use arc_swap::ArcSwap;
use derive_more::From;
use ethers::prelude::H256;
use futures::future::join_all;
use futures::stream::FuturesUnordered;
use futures::StreamExt;
use governor::clock::{QuantaClock, QuantaInstant};
use governor::NotUntil;
use hashbrown::HashMap;
use serde_json::value::RawValue;
use std::cmp;
use std::fmt;
use std::sync::Arc;
use tokio::task;
use tracing::Instrument;
use tracing::{info, info_span, instrument, trace, warn};

use crate::config::Web3ConnectionConfig;
use crate::connection::{ActiveRequestHandle, Web3Connection};

/// The current head block and the rpcs that have reported it.
#[derive(Clone)]
struct SyncedConnections {
    /// Number of the newest block seen so far. Starts at 0.
    head_block_num: u64,
    /// Hash of the block at `head_block_num`. Starts as the default hash.
    head_block_hash: H256,
    /// Ids of the rpcs that reported the head block.
    /// The ids are used as indexes into `Web3Connections::inner`.
    inner: Vec<usize>,
}

impl fmt::Debug for SyncedConnections {
    /// Print only the struct name; every field is deliberately left out.
    fn fmt(&self, formatter: &mut fmt::Formatter<'_>) -> fmt::Result {
        // TODO: the default formatter takes forever to write. this is too quiet though
        let mut builder = formatter.debug_struct("SyncedConnections");

        builder.finish_non_exhaustive()
    }
}

impl SyncedConnections {
    fn new(max_connections: usize) -> Self {
        Self {
            head_block_num: 0,
            head_block_hash: Default::default(),
            inner: Vec::with_capacity(max_connections),
        }
    }

    pub fn get_head_block_hash(&self) -> &H256 {
        &self.head_block_hash
    }
}

/// A collection of web3 connections. Sends requests to either the current best server or all servers.
#[derive(From)]
pub struct Web3Connections {
    /// Every connection that was built successfully. An rpc's id is its index in this list.
    inner: Vec<Arc<Web3Connection>>,
    /// The most recently published head block together with the ids of the rpcs that reported it.
    synced_connections: ArcSwap<SyncedConnections>,
}

impl fmt::Debug for Web3Connections {
    /// Print the struct name and the `inner` connections; other fields are left out.
    fn fmt(&self, formatter: &mut fmt::Formatter<'_>) -> fmt::Result {
        // TODO: the default formatter takes forever to write. this is too quiet though
        let mut builder = formatter.debug_struct("Web3Connections");
        builder.field("inner", &self.inner);

        builder.finish_non_exhaustive()
    }
}

impl Web3Connections {
    // #[instrument(name = "try_new_Web3Connections", skip_all)]
    /// Build a connection for every server config and wrap them in a shared `Web3Connections`.
    ///
    /// Servers that fail to build are logged with `warn!` and skipped.
    ///
    /// # Errors
    ///
    /// Returns an error when fewer than 2 connections could be built.
    pub async fn try_new(
        chain_id: usize,
        servers: Vec<Web3ConnectionConfig>,
        http_client: Option<reqwest::Client>,
        clock: &QuantaClock,
    ) -> anyhow::Result<Arc<Self>> {
        let num_connections = servers.len();

        // turn configs into connections, keeping only the ones that worked
        let mut built = Vec::with_capacity(num_connections);
        for server_config in servers {
            let attempt = server_config
                .try_build(clock, chain_id, http_client.clone())
                .await;

            match attempt {
                Err(e) => warn!("Unable to connect to a server! {:?}", e),
                Ok(connection) => built.push(connection),
            }
        }

        // TODO: less than 3? what should we do here?
        if built.len() < 2 {
            return Err(anyhow::anyhow!(
                "need at least 2 connections when subscribing to heads!"
            ));
        }

        // capacity is sized from the number of configured servers, not the number that connected
        let synced_connections = ArcSwap::new(Arc::new(SyncedConnections::new(num_connections)));

        Ok(Arc::new(Self {
            inner: built,
            synced_connections,
        }))
    }

    pub async fn subscribe_heads(self: &Arc<Self>) {
        let (block_sender, block_receiver) = flume::unbounded();

        let mut handles = vec![];

        for (rpc_id, connection) in self.inner.iter().enumerate() {
            // subscribe to new heads in a spawned future
            // TODO: channel instead. then we can have one future with write access to a left-right?
            let connection = Arc::clone(connection);
            let block_sender = block_sender.clone();

            // let url = connection.url().to_string();

            let handle = task::Builder::default()
                .name("subscribe_new_heads")
                .spawn(async move {
                    // loop to automatically reconnect
                    // TODO: make this cancellable?
                    // TODO: instead of passing Some(connections), pass Some(channel_sender). Then listen on the receiver below to keep local heads up-to-date
                    // TODO: proper spann
                    connection
                        .subscribe_new_heads(rpc_id, block_sender.clone(), true)
                        .instrument(tracing::info_span!("url"))
                        .await
                });

            handles.push(handle);
        }

        let connections = Arc::clone(self);
        let handle = task::Builder::default()
            .name("update_synced_rpcs")
            .spawn(async move { connections.update_synced_rpcs(block_receiver).await });

        handles.push(handle);

        join_all(handles).await;
    }

    /// Hash of the head block in the most recently published set of synced connections.
    pub fn get_head_block_hash(&self) -> H256 {
        let synced = self.synced_connections.load();

        *synced.get_head_block_hash()
    }

    /// Send the same request to all the handles. Returning the fastest successful result.
    #[instrument(skip_all)]
    pub async fn try_send_parallel_requests(
        self: Arc<Self>,
        active_request_handles: Vec<ActiveRequestHandle>,
        method: String,
        params: Option<Box<RawValue>>,
        response_sender: flume::Sender<anyhow::Result<Box<RawValue>>>,
    ) -> anyhow::Result<()> {
        // TODO: if only 1 active_request_handles, do self.try_send_request
        let mut unordered_futures = FuturesUnordered::new();

        for active_request_handle in active_request_handles {
            // clone things so we can pass them to a future
            let method = method.clone();
            let params = params.clone();
            let response_sender = response_sender.clone();

            let handle = task::Builder::default()
                .name("send_request")
                .spawn(async move {
                    let response: Box<RawValue> =
                        active_request_handle.request(&method, &params).await?;

                    // send the first good response to a one shot channel. that way we respond quickly
                    // drop the result because errors are expected after the first send
                    response_sender
                        .send_async(Ok(response))
                        .await
                        .map_err(Into::into)
                });

            unordered_futures.push(handle);
        }

        // TODO: use iterators instead of pushing into a vec?
        let mut errs = vec![];
        if let Some(x) = unordered_futures.next().await {
            match x.unwrap() {
                Ok(_) => {}
                Err(e) => {
                    // TODO: better errors
                    warn!("Got an error sending request: {}", e);
                    errs.push(e);
                }
            }
        }

        // get the first error (if any)
        // TODO: why collect multiple errors if we only pop one?
        let e = if !errs.is_empty() {
            Err(errs.pop().unwrap())
        } else {
            Err(anyhow::anyhow!("no successful responses"))
        };

        // send the error to the channel
        if response_sender.send_async(e).await.is_ok() {
            // if we were able to send an error, then we never sent a success
            return Err(anyhow::anyhow!("no successful responses"));
        } else {
            // if sending the error failed. the other side must be closed (which means we sent a success earlier)
            Ok(())
        }
    }

    /// Consume the head blocks reported by the rpcs and publish which rpcs are on the newest one.
    ///
    /// Each message is `(block number, block hash, rpc id)`:
    /// - a higher block number than the current head replaces the head and resets the set to
    ///   just that rpc
    /// - the same number and hash adds the rpc to the set (at most once)
    /// - the same number with a different hash is logged as a fork and otherwise ignored
    /// - a lower number is ignored
    ///
    /// Whenever the set changes, a fresh copy is swapped into `self.synced_connections`.
    /// Returns `Ok(())` once `recv_async` fails, i.e. the channel is disconnected.
    ///
    /// TODO: possible dead lock here. investigate more. probably refactor
    /// TODO: move parts of this onto SyncedConnections?
    #[instrument(skip_all)]
    async fn update_synced_rpcs(
        &self,
        block_receiver: flume::Receiver<(u64, H256, usize)>,
    ) -> anyhow::Result<()> {
        let max_connections = self.inner.len();

        // latest block reported by each rpc. only written for now (see the fork TODO below)
        let mut connection_states: HashMap<usize, (u64, H256)> =
            HashMap::with_capacity(max_connections);

        let mut pending_synced_connections = SyncedConnections::new(max_connections);

        while let Ok((new_block_num, new_block_hash, rpc_id)) = block_receiver.recv_async().await {
            if new_block_num == 0 {
                // TODO: show the actual rpc url?
                warn!("rpc #{} is still syncing", rpc_id);
            }

            // TODO: span with rpc in it, too
            let span = info_span!("new_block", new_block_num);
            let _enter = span.enter();

            connection_states.insert(rpc_id, (new_block_num, new_block_hash));

            // TODO: do something to update the synced blocks
            match new_block_num.cmp(&pending_synced_connections.head_block_num) {
                cmp::Ordering::Greater => {
                    // the rpc's newest block is the new overall best block
                    info!("new head from #{}", rpc_id);

                    pending_synced_connections.inner.clear();
                    pending_synced_connections.inner.push(rpc_id);

                    pending_synced_connections.head_block_num = new_block_num;
                    pending_synced_connections.head_block_hash = new_block_hash;
                }
                cmp::Ordering::Equal => {
                    if new_block_hash != pending_synced_connections.head_block_hash {
                        // same height, but different chain
                        // TODO: anything else we should do? set some "nextSafeBlockHeight" to delay sending transactions?
                        // TODO: sometimes a node changes its block. if that happens, a new block is probably right behind this one
                        warn!(
                            "chain is forked at #{}! #{} has {}. {} rpcs have {}",
                            new_block_num,
                            rpc_id,
                            new_block_hash,
                            pending_synced_connections.inner.len(),
                            pending_synced_connections.head_block_hash
                        );
                        // TODO: don't continue. check connection_states to see which head block is more popular!
                        continue;
                    }

                    if pending_synced_connections.inner.contains(&rpc_id) {
                        // this rpc already reported the current head. adding it again would
                        // put a duplicate id in the set, and nothing has changed
                        continue;
                    }

                    // do not clear synced_connections.
                    // we just want to add this rpc to the end
                    pending_synced_connections.inner.push(rpc_id);
                }
                cmp::Ordering::Less => {
                    // this isn't the best block in the tier. don't do anything
                    continue;
                }
            }

            // the synced connections have changed
            let synced_connections = Arc::new(pending_synced_connections.clone());

            // TODO: only do this if there are 2 nodes synced to this block?
            // do the arcswap
            self.synced_connections.swap(synced_connections);
        }

        // TODO: if there was an error, we should return it
        warn!("block_receiver exited!");

        Ok(())
    }

    /// get the best available rpc server
    ///
    /// Only rpcs in the current synced set are considered. They are tried in order of
    /// utilization (`active_requests / soft_limit`, lowest first), with ties broken by
    /// `soft_limit` (lowest first). The first rpc that hands out a request handle wins.
    ///
    /// # Errors
    ///
    /// When no rpc hands out a handle, returns the earliest `NotUntil` reported by the rpcs
    /// that were tried, or `None` if the synced set is empty.
    #[instrument(skip_all)]
    pub async fn next_upstream_server(
        &self,
    ) -> Result<ActiveRequestHandle, Option<NotUntil<QuantaInstant>>> {
        let mut earliest_not_until = None;

        // Keep each rpc's id next to its stats. Looking the stats up by rpc id in a list
        // ordered by position mixes up rpcs and can index out of bounds.
        let mut candidates: Vec<(usize, f32, u32)> = self
            .synced_connections
            .load()
            .inner
            .iter()
            .map(|&rpc_id| {
                let rpc = self
                    .inner
                    .get(rpc_id)
                    .expect("synced rpc ids are indexes into self.inner");

                let active_requests = rpc.active_requests();
                let soft_limit = rpc.soft_limit();

                // TODO: how should we include the soft limit? floats are slower than integer math
                let utilization = active_requests as f32 / soft_limit as f32;

                (rpc_id, utilization, soft_limit)
            })
            .collect();

        // TODO: i think we might need to load active connections and then
        candidates.sort_unstable_by(|a, b| {
            let (_, a_utilization, a_soft_limit) = a;
            let (_, b_utilization, b_soft_limit) = b;

            // floats are only partially ordered. treat incomparable values (NaN) as equal
            a_utilization
                .partial_cmp(b_utilization)
                .unwrap_or(cmp::Ordering::Equal)
                .then_with(|| a_soft_limit.cmp(b_soft_limit))
        });

        for (rpc_id, _, _) in candidates {
            let rpc = self
                .inner
                .get(rpc_id)
                .expect("synced rpc ids are indexes into self.inner");

            // increment our connection counter
            match rpc.try_request_handle() {
                Err(not_until) => {
                    earliest_possible(&mut earliest_not_until, not_until);
                }
                Ok(handle) => {
                    trace!("next server on {:?}: {:?}", self, rpc_id);
                    return Ok(handle);
                }
            }
        }

        // TODO: this is too verbose
        // warn!("no servers on {:?}! {:?}", self, earliest_not_until);

        // this might be None
        Err(earliest_not_until)
    }

    /// get a request handle from every rpc server that will give one
    ///
    /// Servers are included even if they aren't in sync. This is useful for broadcasting
    /// signed transactions.
    ///
    /// # Errors
    ///
    /// When no server hands out a handle, returns the earliest `NotUntil` that was reported.
    /// This is `None` only when there are no connections at all.
    pub fn get_upstream_servers(
        &self,
    ) -> Result<Vec<ActiveRequestHandle>, Option<NotUntil<QuantaInstant>>> {
        let mut soonest_retry = None;
        // TODO: with capacity?
        let mut handles = Vec::new();

        for rpc in &self.inner {
            // check rate limits and increment our connection counter
            match rpc.try_request_handle() {
                Ok(handle) => handles.push(handle),
                // this rpc is not available. remember when it could be and skip it
                Err(not_until) => earliest_possible(&mut soonest_retry, not_until),
            }
        }

        if handles.is_empty() {
            Err(soonest_retry)
        } else {
            Ok(handles)
        }
    }
}

/// Keep whichever `NotUntil` has the sooner `earliest_possible()` instant.
///
/// `earliest_not_until_option` is overwritten with `new_not_until` when it is `None` or when
/// its instant is strictly later than the new one; otherwise it is left unchanged.
fn earliest_possible(
    earliest_not_until_option: &mut Option<NotUntil<QuantaInstant>>,
    new_not_until: NotUntil<QuantaInstant>,
) {
    let should_replace = match earliest_not_until_option.as_ref() {
        Some(current) => current.earliest_possible() > new_not_until.earliest_possible(),
        None => true,
    };

    if should_replace {
        *earliest_not_until_option = Some(new_not_until);
    }
}
handle batched requests 2022-05-12 02:50:52 +03:00			`///! Load balanced communication with a group of web3 providers`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`use arc_swap::ArcSwap;`
quick lru cache 2022-05-05 22:07:09 +03:00			`use derive_more::From;`
check block hash and store block number fewer places 2022-05-15 09:27:13 +03:00			`use ethers::prelude::H256;`
less spawns and more logs 2022-05-18 19:35:06 +03:00			`use futures::future::join_all;`
quick lru cache 2022-05-05 22:07:09 +03:00			`use futures::stream::FuturesUnordered;`
			`use futures::StreamExt;`
			`use governor::clock::{QuantaClock, QuantaInstant};`
			`use governor::NotUntil;`
lint 2022-05-18 23:28:00 +03:00			`use hashbrown::HashMap;`
quick lru cache 2022-05-05 22:07:09 +03:00			`use serde_json::value::RawValue;`
			`use std::cmp;`
			`use std::fmt;`
			`use std::sync::Arc;`
add tokio-console 2022-05-17 19:23:27 +03:00			`use tokio::task;`
less spawns and more logs 2022-05-18 19:35:06 +03:00			`use tracing::Instrument;`
			`use tracing::{info, info_span, instrument, trace, warn};`
quick lru cache 2022-05-05 22:07:09 +03:00
			`use crate::config::Web3ConnectionConfig;`
dont fear locks and better serializing 2022-05-06 08:44:30 +03:00			`use crate::connection::{ActiveRequestHandle, Web3Connection};`
quick lru cache 2022-05-05 22:07:09 +03:00
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`#[derive(Clone)]`
			`struct SyncedConnections {`
			`head_block_num: u64,`
check block hash and store block number fewer places 2022-05-15 09:27:13 +03:00			`head_block_hash: H256,`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`inner: Vec<usize>,`
quick lru cache 2022-05-05 22:07:09 +03:00			`}`

			`impl fmt::Debug for SyncedConnections {`
			`fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {`
			`// TODO: the default formatter takes forever to write. this is too quiet though`
			`f.debug_struct("SyncedConnections").finish_non_exhaustive()`
			`}`
			`}`

			`impl SyncedConnections {`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`fn new(max_connections: usize) -> Self {`
			`Self {`
			`head_block_num: 0,`
			`head_block_hash: Default::default(),`
			`inner: Vec::with_capacity(max_connections),`
turn caching back on 2022-05-16 01:02:14 +03:00			`}`
small refactor 2022-05-15 22:28:22 +03:00			`}`

back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`pub fn get_head_block_hash(&self) -> &H256 {`
			`&self.head_block_hash`
small refactor 2022-05-15 22:28:22 +03:00			`}`
quick lru cache 2022-05-05 22:07:09 +03:00			`}`

			`/// A collection of web3 connections. Sends requests either the current best server or all servers.`
			`#[derive(From)]`
			`pub struct Web3Connections {`
			`inner: Vec<Arc<Web3Connection>>,`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`synced_connections: ArcSwap<SyncedConnections>,`
quick lru cache 2022-05-05 22:07:09 +03:00			`}`

			`impl fmt::Debug for Web3Connections {`
			`fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {`
			`// TODO: the default formatter takes forever to write. this is too quiet though`
			`f.debug_struct("Web3Connections")`
			`.field("inner", &self.inner)`
			`.finish_non_exhaustive()`
			`}`
			`}`

			`impl Web3Connections {`
less instrumenting 2022-05-17 20:15:18 +03:00			`// #[instrument(name = "try_new_Web3Connections", skip_all)]`
quick lru cache 2022-05-05 22:07:09 +03:00			`pub async fn try_new(`
add chain_id to proc title 2022-05-12 21:49:57 +03:00			`chain_id: usize,`
quick lru cache 2022-05-05 22:07:09 +03:00			`servers: Vec<Web3ConnectionConfig>,`
			`http_client: Option<reqwest::Client>,`
			`clock: &QuantaClock,`
			`) -> anyhow::Result<Arc<Self>> {`
			`let num_connections = servers.len();`

turn caching back on 2022-05-16 01:02:14 +03:00			`// turn configs into connections`
			`let mut connections = Vec::with_capacity(num_connections);`
quick lru cache 2022-05-05 22:07:09 +03:00			`for server_config in servers.into_iter() {`
add chain_id to proc title 2022-05-12 21:49:57 +03:00			`match server_config`
			`.try_build(clock, chain_id, http_client.clone())`
			`.await`
			`{`
allow connections to fail 2022-05-06 00:38:15 +03:00			`Ok(connection) => connections.push(connection),`
better error log 2022-05-13 00:29:33 +03:00			`Err(e) => warn!("Unable to connect to a server! {:?}", e),`
allow connections to fail 2022-05-06 00:38:15 +03:00			`}`
quick lru cache 2022-05-05 22:07:09 +03:00			`}`

turn caching back on 2022-05-16 01:02:14 +03:00			`if connections.len() < 2 {`
			`// TODO: less than 3? what should we do here?`
			`return Err(anyhow::anyhow!(`
			`"need at least 2 connections when subscribing to heads!"`
			`));`
			`}`
small refactor 2022-05-15 22:28:22 +03:00
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`let synced_connections = SyncedConnections::new(num_connections);`
turn caching back on 2022-05-16 01:02:14 +03:00
			`let connections = Arc::new(Self {`
			`inner: connections,`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`synced_connections: ArcSwap::new(Arc::new(synced_connections)),`
turn caching back on 2022-05-16 01:02:14 +03:00			`});`

less spawns and more logs 2022-05-18 19:35:06 +03:00			`Ok(connections)`
			`}`

			`pub async fn subscribe_heads(self: &Arc<Self>) {`
			`let (block_sender, block_receiver) = flume::unbounded();`

			`let mut handles = vec![];`

back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`for (rpc_id, connection) in self.inner.iter().enumerate() {`
less spawns and more logs 2022-05-18 19:35:06 +03:00			`// subscribe to new heads in a spawned future`
			`// TODO: channel instead. then we can have one future with write access to a left-right?`
			`let connection = Arc::clone(connection);`
			`let block_sender = block_sender.clone();`

			`// let url = connection.url().to_string();`

			`let handle = task::Builder::default()`
			`.name("subscribe_new_heads")`
add tokio-console 2022-05-17 19:23:27 +03:00			`.spawn(async move {`
less spawns and more logs 2022-05-18 19:35:06 +03:00			`// loop to automatically reconnect`
			`// TODO: make this cancellable?`
			`// TODO: instead of passing Some(connections), pass Some(channel_sender). Then listen on the receiver below to keep local heads up-to-date`
			`// TODO: proper spann`
			`connection`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`.subscribe_new_heads(rpc_id, block_sender.clone(), true)`
less spawns and more logs 2022-05-18 19:35:06 +03:00			`.instrument(tracing::info_span!("url"))`
add tokio-console 2022-05-17 19:23:27 +03:00			`.await`
			`});`
less spawns and more logs 2022-05-18 19:35:06 +03:00
			`handles.push(handle);`
turn caching back on 2022-05-16 01:02:14 +03:00			`}`

less spawns and more logs 2022-05-18 19:35:06 +03:00			`let connections = Arc::clone(self);`
			`let handle = task::Builder::default()`
			`.name("update_synced_rpcs")`
			`.spawn(async move { connections.update_synced_rpcs(block_receiver).await });`

			`handles.push(handle);`

			`join_all(handles).await;`
quick lru cache 2022-05-05 22:07:09 +03:00			`}`

back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`pub fn get_head_block_hash(&self) -> H256 {`
			`*self.synced_connections.load().get_head_block_hash()`
turn caching back on 2022-05-16 01:02:14 +03:00			`}`
quick lru cache 2022-05-05 22:07:09 +03:00
handle batched requests 2022-05-12 02:50:52 +03:00			`/// Send the same request to all the handles. Returning the fastest successful result.`
instrument 2022-05-17 03:56:56 +03:00			`#[instrument(skip_all)]`
handle batched requests 2022-05-12 02:50:52 +03:00			`pub async fn try_send_parallel_requests(`
quick lru cache 2022-05-05 22:07:09 +03:00			`self: Arc<Self>,`
handle batched requests 2022-05-12 02:50:52 +03:00			`active_request_handles: Vec<ActiveRequestHandle>,`
quick lru cache 2022-05-05 22:07:09 +03:00			`method: String,`
params are optional apparently 2022-05-12 06:40:41 +03:00			`params: Option<Box<RawValue>>,`
dont fear locks and better serializing 2022-05-06 08:44:30 +03:00			`response_sender: flume::Sender<anyhow::Result<Box<RawValue>>>,`
quick lru cache 2022-05-05 22:07:09 +03:00			`) -> anyhow::Result<()> {`
this works but i dont like it 2022-05-12 06:54:42 +03:00			`// TODO: if only 1 active_request_handles, do self.try_send_request`
quick lru cache 2022-05-05 22:07:09 +03:00			`let mut unordered_futures = FuturesUnordered::new();`

one less clone 2022-05-12 22:44:31 +03:00			`for active_request_handle in active_request_handles {`
quick lru cache 2022-05-05 22:07:09 +03:00			`// clone things so we can pass them to a future`
			`let method = method.clone();`
			`let params = params.clone();`
			`let response_sender = response_sender.clone();`

add tokio-console 2022-05-17 19:23:27 +03:00			`let handle = task::Builder::default()`
			`.name("send_request")`
			`.spawn(async move {`
			`let response: Box<RawValue> =`
			`active_request_handle.request(&method, &params).await?;`

			`// send the first good response to a one shot channel. that way we respond quickly`
			`// drop the result because errors are expected after the first send`
			`response_sender`
			`.send_async(Ok(response))`
			`.await`
			`.map_err(Into::into)`
			`});`
quick lru cache 2022-05-05 22:07:09 +03:00
			`unordered_futures.push(handle);`
			`}`

handle batched requests 2022-05-12 02:50:52 +03:00			`// TODO: use iterators instead of pushing into a vec?`
quick lru cache 2022-05-05 22:07:09 +03:00			`let mut errs = vec![];`
			`if let Some(x) = unordered_futures.next().await {`
			`match x.unwrap() {`
			`Ok(_) => {}`
			`Err(e) => {`
			`// TODO: better errors`
			`warn!("Got an error sending request: {}", e);`
			`errs.push(e);`
			`}`
			`}`
			`}`

			`// get the first error (if any)`
			`// TODO: why collect multiple errors if we only pop one?`
			`let e = if !errs.is_empty() {`
			`Err(errs.pop().unwrap())`
			`} else {`
			`Err(anyhow::anyhow!("no successful responses"))`
			`};`

			`// send the error to the channel`
deadlock detection 2022-05-16 08:16:32 +03:00			`if response_sender.send_async(e).await.is_ok() {`
quick lru cache 2022-05-05 22:07:09 +03:00			`// if we were able to send an error, then we never sent a success`
			`return Err(anyhow::anyhow!("no successful responses"));`
			`} else {`
			`// if sending the error failed. the other side must be closed (which means we sent a success earlier)`
			`Ok(())`
			`}`
			`}`

more logging 2022-05-13 20:43:37 +03:00			`/// TODO: possible dead lock here. investigate more. probably refactor`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`/// TODO: move parts of this onto SyncedConnections?`
instrument 2022-05-17 03:56:56 +03:00			`#[instrument(skip_all)]`
turn caching back on 2022-05-16 01:02:14 +03:00			`async fn update_synced_rpcs(`
check block hash and store block number fewer places 2022-05-15 09:27:13 +03:00			`&self,`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`block_receiver: flume::Receiver<(u64, H256, usize)>,`
check block hash and store block number fewer places 2022-05-15 09:27:13 +03:00			`) -> anyhow::Result<()> {`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`let max_connections = self.inner.len();`

lint 2022-05-18 23:28:00 +03:00			`let mut connection_states: HashMap<usize, (u64, H256)> =`
			`HashMap::with_capacity(max_connections);`
less spawns and more logs 2022-05-18 19:35:06 +03:00
lint 2022-05-18 23:28:00 +03:00			`let mut pending_synced_connections = SyncedConnections::new(max_connections);`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00
			`while let Ok((new_block_num, new_block_hash, rpc_id)) = block_receiver.recv_async().await {`
check block hash and store block number fewer places 2022-05-15 09:27:13 +03:00			`if new_block_num == 0 {`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`// TODO: show the actual rpc url?`
			`warn!("rpc #{} is still syncing", rpc_id);`
check block hash and store block number fewer places 2022-05-15 09:27:13 +03:00			`}`
quick lru cache 2022-05-05 22:07:09 +03:00
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`// TODO: span with rpc in it, too`
			`let span = info_span!("new_block", new_block_num);`
less spawns and more logs 2022-05-18 19:35:06 +03:00			`let _enter = span.enter();`

back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`connection_states.insert(rpc_id, (new_block_num, new_block_hash));`

			`// TODO: do something to update the synced blocks`
lint 2022-05-18 23:28:00 +03:00			`match new_block_num.cmp(&pending_synced_connections.head_block_num) {`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`cmp::Ordering::Greater => {`
			`// the rpc's newest block is the new overall best block`
			`info!("new head from #{}", rpc_id);`

lint 2022-05-18 23:28:00 +03:00			`pending_synced_connections.inner.clear();`
			`pending_synced_connections.inner.push(rpc_id);`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00
lint 2022-05-18 23:28:00 +03:00			`pending_synced_connections.head_block_num = new_block_num;`
			`pending_synced_connections.head_block_hash = new_block_hash;`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`}`
			`cmp::Ordering::Equal => {`
lint 2022-05-18 23:28:00 +03:00			`if new_block_hash != pending_synced_connections.head_block_hash {`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`// same height, but different chain`
			`// TODO: anything else we should do? set some "nextSafeBlockHeight" to delay sending transactions?`
			`// TODO: sometimes a node changes its block. if that happens, a new block is probably right behind this one`
			`warn!(`
lint 2022-05-18 23:28:00 +03:00			`"chain is forked at #{}! #{} has {}. {} rpcs have {}",`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`new_block_num,`
			`rpc_id,`
			`new_block_hash,`
lint 2022-05-18 23:28:00 +03:00			`pending_synced_connections.inner.len(),`
			`pending_synced_connections.head_block_hash`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`);`
lint 2022-05-18 23:28:00 +03:00			`// TODO: don't continue. check connection_states to see which head block is more popular!`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`continue;`
			`}`
quick lru cache 2022-05-05 22:07:09 +03:00
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`// do not clear synced_connections.`
			`// we just want to add this rpc to the end`
lint 2022-05-18 23:28:00 +03:00			`// TODO: HashSet here? i think we get dupes if we don't`
			`pending_synced_connections.inner.push(rpc_id);`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`}`
			`cmp::Ordering::Less => {`
			`// this isn't the best block in the tier. don't do anything`
			`continue;`
			`}`
			`}`

			`// the synced connections have changed`
lint 2022-05-18 23:28:00 +03:00			`let synced_connections = Arc::new(pending_synced_connections.clone());`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00
			`// TODO: only do this if there are 2 nodes synced to this block?`
			`// do the arcswap`
lint 2022-05-18 23:28:00 +03:00			`self.synced_connections.swap(synced_connections);`
dont fear locks and better serializing 2022-05-06 08:44:30 +03:00			`}`
quick lru cache 2022-05-05 22:07:09 +03:00
less spawns and more logs 2022-05-18 19:35:06 +03:00			`// TODO: if there was an error, we should return it`
			`warn!("block_receiver exited!");`

quick lru cache 2022-05-05 22:07:09 +03:00			`Ok(())`
			`}`

			`/// get the best available rpc server`
instrument 2022-05-17 03:56:56 +03:00			`#[instrument(skip_all)]`
quick lru cache 2022-05-05 22:07:09 +03:00			`pub async fn next_upstream_server(`
			`&self,`
use a request handle for ratelimit handling 2022-05-06 07:29:25 +03:00			`) -> Result<ActiveRequestHandle, Option<NotUntil<QuantaInstant>>> {`
quick lru cache 2022-05-05 22:07:09 +03:00			`let mut earliest_not_until = None;`

back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`let mut synced_rpc_indexes = self.synced_connections.load().inner.clone();`
quick lru cache 2022-05-05 22:07:09 +03:00
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`let sort_cache: Vec<(f32, u32)> = synced_rpc_indexes`
quick lru cache 2022-05-05 22:07:09 +03:00			`.iter()`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`.map(\|rpc_id\| {`
			`let rpc = self.inner.get(*rpc_id).unwrap();`

			`let active_requests = rpc.active_requests();`
			`let soft_limit = rpc.soft_limit();`
set overall max inside the lock 2022-05-06 23:44:12 +03:00
more comments 2022-05-16 08:56:57 +03:00			`// TODO: how should we include the soft limit? floats are slower than integer math`
set overall max inside the lock 2022-05-06 23:44:12 +03:00			`let utilization = active_requests as f32 / soft_limit as f32;`

back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`(utilization, soft_limit)`
quick lru cache 2022-05-05 22:07:09 +03:00			`})`
			`.collect();`

			`// TODO: i think we might need to load active connections and then`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`synced_rpc_indexes.sort_unstable_by(\|a, b\| {`
			`let (a_utilization, a_soft_limit) = sort_cache.get(*a).unwrap();`
			`let (b_utilization, b_soft_limit) = sort_cache.get(*b).unwrap();`
set overall max inside the lock 2022-05-06 23:44:12 +03:00
			`// TODO: i'm comparing floats. crap`
			`match a_utilization`
			`.partial_cmp(b_utilization)`
			`.unwrap_or(cmp::Ordering::Equal)`
			`{`
			`cmp::Ordering::Equal => a_soft_limit.cmp(b_soft_limit),`
			`x => x,`
			`}`
quick lru cache 2022-05-05 22:07:09 +03:00			`});`

back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`for rpc_id in synced_rpc_indexes.into_iter() {`
			`let rpc = self.inner.get(rpc_id).unwrap();`

quick lru cache 2022-05-05 22:07:09 +03:00			`// increment our connection counter`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`match rpc.try_request_handle() {`
use a request handle for ratelimit handling 2022-05-06 07:29:25 +03:00			`Err(not_until) => {`
			`earliest_possible(&mut earliest_not_until, not_until);`
			`}`
set overall max inside the lock 2022-05-06 23:44:12 +03:00			`Ok(handle) => {`
back to arcswap and usizes 2022-05-18 23:18:01 +03:00			`trace!("next server on {:?}: {:?}", self, rpc_id);`
set overall max inside the lock 2022-05-06 23:44:12 +03:00			`return Ok(handle);`
			`}`
quick lru cache 2022-05-05 22:07:09 +03:00			`}`
			`}`

set overall max inside the lock 2022-05-06 23:44:12 +03:00			`// TODO: this is too verbose`
			`// warn!("no servers on {:?}! {:?}", self, earliest_not_until);`

quick lru cache 2022-05-05 22:07:09 +03:00			`// this might be None`
			`Err(earliest_not_until)`
			`}`

			`/// get all rpc servers that are not rate limited`
one tier 2022-05-13 23:50:11 +03:00			`/// returns servers even if they aren't in sync. This is useful for broadcasting signed transactions`
quick lru cache 2022-05-05 22:07:09 +03:00			`pub fn get_upstream_servers(`
			`&self,`
use a request handle for ratelimit handling 2022-05-06 07:29:25 +03:00			`) -> Result<Vec<ActiveRequestHandle>, Option<NotUntil<QuantaInstant>>> {`
quick lru cache 2022-05-05 22:07:09 +03:00			`let mut earliest_not_until = None;`
			`// TODO: with capacity?`
			`let mut selected_rpcs = vec![];`

			`for connection in self.inner.iter() {`
			`// check rate limits and increment our connection counter`
use a request handle for ratelimit handling 2022-05-06 07:29:25 +03:00			`match connection.try_request_handle() {`
			`Err(not_until) => {`
			`earliest_possible(&mut earliest_not_until, not_until);`
			`// this rpc is not available. skip it`
			`}`
			`Ok(handle) => selected_rpcs.push(handle),`
quick lru cache 2022-05-05 22:07:09 +03:00			`}`
			`}`

			`if !selected_rpcs.is_empty() {`
			`return Ok(selected_rpcs);`
			`}`

			`// return the earliest not_until (if no rpcs are synced, this will be None)`
			`Err(earliest_not_until)`
			`}`
			`}`

			`fn earliest_possible(`
			`earliest_not_until_option: &mut Option<NotUntil<QuantaInstant>>,`
			`new_not_until: NotUntil<QuantaInstant>,`
			`) {`
			`match earliest_not_until_option.as_ref() {`
			`None => *earliest_not_until_option = Some(new_not_until),`
			`Some(earliest_not_until) => {`
			`let earliest_possible = earliest_not_until.earliest_possible();`
			`let new_earliest_possible = new_not_until.earliest_possible();`

			`if earliest_possible > new_earliest_possible {`
			`*earliest_not_until_option = Some(new_not_until);`
			`}`
			`}`
			`}`
			`}`