web3-proxy/web3_proxy/src/app_stats.rs

use crate::frontend::authorization::{Authorization, RequestMetadata};
use crate::jsonrpc::JsonRpcForwardedResponse;
use chrono::{TimeZone, Utc};
use derive_more::From;
use entities::rpc_accounting;
use hashbrown::HashMap;
use hdrhistogram::{Histogram, RecordError};
use sea_orm::{ActiveModelTrait, DatabaseConnection, DbErr};
use std::sync::atomic::Ordering;
use std::sync::Arc;
use std::time::{Duration, SystemTime};
use tokio::sync::broadcast;
use tokio::task::JoinHandle;
use tokio::time::{interval_at, Instant};
use tracing::{error, info};

/// Measurements for a single proxied response.
///
/// Built by [`ProxyResponseStat::new`] and later folded into a
/// [`ProxyResponseAggregate`] by `ProxyResponseAggregate::add`.
///
/// TODO: where should this be defined?
/// TODO: can we use something inside sea_orm instead?
#[derive(Debug)]
pub struct ProxyResponseStat {
    /// authorization the request ran under. `checks.rpc_key_id` is used in the aggregation key
    authorization: Arc<Authorization>,
    /// method name of the request. part of the aggregation key
    method: String,
    /// copied from `RequestMetadata::archive_request`. part of the aggregation key
    archive_request: bool,
    /// copied from `RequestMetadata::error_response`. part of the aggregation key
    error_response: bool,
    /// copied from `RequestMetadata::request_bytes`
    request_bytes: u64,
    /// if backend_requests is 0, there was a cache_hit
    backend_requests: u64,
    /// length of the response when serialized as JSON
    response_bytes: u64,
    /// milliseconds elapsed since `RequestMetadata::start_instant` when this stat was created
    response_millis: u64,
}

impl ProxyResponseStat {
    /// Build the key that decides which aggregate this stat is merged into.
    ///
    /// Stats with the same rpc key id, method, archive flag and error flag
    /// produce equal keys.
    ///
    /// TODO: think more about this. probably rename it
    fn key(&self) -> ProxyResponseAggregateKey {
        let rpc_key_id = self.authorization.checks.rpc_key_id;
        // the key owns its method name, so the string has to be copied
        let method = self.method.clone();

        // TODO: include Origin here?
        ProxyResponseAggregateKey {
            rpc_key_id,
            method,
            archive_request: self.archive_request,
            error_response: self.error_response,
        }
    }
}

/// Value distributions for the responses merged into one aggregate.
///
/// `ProxyResponseAggregate::save` reads min, mean, p50, p90, p99 and max from each of these.
pub struct ProxyResponseHistograms {
    /// distribution of `ProxyResponseStat::request_bytes`
    request_bytes: Histogram<u64>,
    /// distribution of `ProxyResponseStat::response_bytes`
    response_bytes: Histogram<u64>,
    /// distribution of `ProxyResponseStat::response_millis`
    response_millis: Histogram<u64>,
}

impl Default for ProxyResponseHistograms {
    /// Create three empty histograms, one per tracked measurement.
    ///
    /// # Panics
    ///
    /// Panics if `Histogram::new` rejects the significant-figures setting.
    fn default() -> Self {
        // TODO: how many significant figures?
        // NOTE(review): 5 looks like the highest precision hdrhistogram accepts and
        // higher precision presumably costs more memory per histogram — confirm.
        const SIGNIFICANT_FIGURES: u8 = 5;

        Self {
            request_bytes: Histogram::new(SIGNIFICANT_FIGURES)
                .expect("creating request_bytes histogram"),
            response_bytes: Histogram::new(SIGNIFICANT_FIGURES)
                .expect("creating response_bytes histogram"),
            response_millis: Histogram::new(SIGNIFICANT_FIGURES)
                .expect("creating response_millis histogram"),
        }
    }
}

/// Identifies one aggregate within a period.
///
/// Every `ProxyResponseStat` whose `key()` equals this key is merged into the
/// same `ProxyResponseAggregate`. The fields are written to the matching
/// `rpc_accounting` columns when the aggregate is saved.
// TODO: think more about if we should include IP address in this
#[derive(Clone, From, Hash, PartialEq, Eq)]
struct ProxyResponseAggregateKey {
    /// taken from `Authorization::checks.rpc_key_id`
    rpc_key_id: u64,
    /// method name of the request
    method: String,
    /// error responses are aggregated separately from successful ones
    error_response: bool,
    /// archive requests are aggregated separately from non-archive ones
    archive_request: bool,
}

/// Running totals for every stat that shares one `ProxyResponseAggregateKey`.
///
/// Filled by `add` and written to the database by `save`.
#[derive(Default)]
pub struct ProxyResponseAggregate {
    /// number of stats added. each stat comes from exactly one frontend request
    frontend_requests: u64,
    /// sum of `ProxyResponseStat::backend_requests` over all added stats
    backend_requests: u64,
    // TODO: related to backend_requests
    // backend_retries: u64,
    // TODO: related to backend_requests
    // no_servers: u64,
    /// number of added stats that had at least one backend request
    cache_misses: u64,
    /// number of added stats that had zero backend requests
    cache_hits: u64,
    /// sum of `ProxyResponseStat::request_bytes`
    sum_request_bytes: u64,
    /// sum of `ProxyResponseStat::response_bytes`
    sum_response_bytes: u64,
    /// sum of `ProxyResponseStat::response_millis`
    sum_response_millis: u64,
    /// distributions used for the min/mean/percentile/max columns
    histograms: ProxyResponseHistograms,
}

/// A stat that we aggregate and then store in a database.
/// For now there is just one, but I think there might be others later
///
/// This is the message type carried by the channel that `StatEmitter::spawn` creates.
/// The derived `From` allows converting a `ProxyResponseStat` with `.into()`.
#[derive(Debug, From)]
pub enum Web3ProxyStat {
    /// measurements for one proxied response
    Response(ProxyResponseStat),
}

/// Everything `StatEmitter::spawn` hands back to its caller.
///
/// The derived `From` builds this from a `(stat_sender, background_handle)` tuple.
#[derive(From)]
pub struct StatEmitterSpawn {
    /// send stats here to have them aggregated by the background task
    pub stat_sender: flume::Sender<Web3ProxyStat>,
    /// these handles are important and must be allowed to finish
    pub background_handle: JoinHandle<anyhow::Result<()>>,
}

/// Background worker that aggregates `Web3ProxyStat`s and saves them once per period.
///
/// Created and started with `StatEmitter::spawn`.
pub struct StatEmitter {
    /// written to the `chain_id` column of every saved row
    chain_id: u64,
    /// connection used to save the aggregated rows
    db_conn: DatabaseConnection,
    /// length of one aggregation period, in seconds
    period_seconds: u64,
}

// TODO: impl `+=<ProxyResponseStat>` for ProxyResponseAggregate?
impl ProxyResponseAggregate {
    fn add(&mut self, stat: ProxyResponseStat) -> Result<(), RecordError> {
        // a stat always come from just 1 frontend request
        self.frontend_requests += 1;

        if stat.backend_requests == 0 {
            // no backend request. cache hit!
            self.cache_hits += 1;
        } else {
            // backend requests! cache miss!
            self.cache_misses += 1;

            // a stat might have multiple backend requests
            self.backend_requests += stat.backend_requests;
        }

        self.sum_request_bytes += stat.request_bytes;
        self.sum_response_bytes += stat.response_bytes;
        self.sum_response_millis += stat.response_millis;

        // TODO: use `record_correct`?
        self.histograms.request_bytes.record(stat.request_bytes)?;
        self.histograms
            .response_millis
            .record(stat.response_millis)?;
        self.histograms.response_bytes.record(stat.response_bytes)?;

        Ok(())
    }

    // TODO? help to turn this plus the key into a database model?
    // TODO: take a db transaction instead so that we can batch
    async fn save(
        self,
        chain_id: u64,
        db_conn: &DatabaseConnection,
        key: ProxyResponseAggregateKey,
        period_timestamp: u64,
    ) -> Result<(), DbErr> {
        // this is a lot of variables
        let period_datetime = Utc.timestamp(period_timestamp as i64, 0);

        let request_bytes = &self.histograms.request_bytes;

        let min_request_bytes = request_bytes.min();
        let mean_request_bytes = request_bytes.mean();
        let p50_request_bytes = request_bytes.value_at_quantile(0.50);
        let p90_request_bytes = request_bytes.value_at_quantile(0.90);
        let p99_request_bytes = request_bytes.value_at_quantile(0.99);
        let max_request_bytes = request_bytes.max();

        let response_millis = &self.histograms.response_millis;

        let min_response_millis = response_millis.min();
        let mean_response_millis = response_millis.mean();
        let p50_response_millis = response_millis.value_at_quantile(0.50);
        let p90_response_millis = response_millis.value_at_quantile(0.90);
        let p99_response_millis = response_millis.value_at_quantile(0.99);
        let max_response_millis = response_millis.max();

        let response_bytes = &self.histograms.response_bytes;

        let min_response_bytes = response_bytes.min();
        let mean_response_bytes = response_bytes.mean();
        let p50_response_bytes = response_bytes.value_at_quantile(0.50);
        let p90_response_bytes = response_bytes.value_at_quantile(0.90);
        let p99_response_bytes = response_bytes.value_at_quantile(0.99);
        let max_response_bytes = response_bytes.max();

        // TODO: Set origin and maybe other things on this model. probably not the ip though
        let aggregated_stat_model = rpc_accounting::ActiveModel {
            id: sea_orm::NotSet,
            // origin: sea_orm::Set(key.authorization.origin.to_string()),
            rpc_key_id: sea_orm::Set(key.rpc_key_id),
            chain_id: sea_orm::Set(chain_id),
            method: sea_orm::Set(key.method),
            archive_request: sea_orm::Set(key.archive_request),
            error_response: sea_orm::Set(key.error_response),
            period_datetime: sea_orm::Set(period_datetime),
            frontend_requests: sea_orm::Set(self.frontend_requests),
            backend_requests: sea_orm::Set(self.backend_requests),
            // backend_retries: sea_orm::Set(self.backend_retries),
            // no_servers: sea_orm::Set(self.no_servers),
            cache_misses: sea_orm::Set(self.cache_misses),
            cache_hits: sea_orm::Set(self.cache_hits),

            sum_request_bytes: sea_orm::Set(self.sum_request_bytes),
            min_request_bytes: sea_orm::Set(min_request_bytes),
            mean_request_bytes: sea_orm::Set(mean_request_bytes),
            p50_request_bytes: sea_orm::Set(p50_request_bytes),
            p90_request_bytes: sea_orm::Set(p90_request_bytes),
            p99_request_bytes: sea_orm::Set(p99_request_bytes),
            max_request_bytes: sea_orm::Set(max_request_bytes),

            sum_response_millis: sea_orm::Set(self.sum_response_millis),
            min_response_millis: sea_orm::Set(min_response_millis),
            mean_response_millis: sea_orm::Set(mean_response_millis),
            p50_response_millis: sea_orm::Set(p50_response_millis),
            p90_response_millis: sea_orm::Set(p90_response_millis),
            p99_response_millis: sea_orm::Set(p99_response_millis),
            max_response_millis: sea_orm::Set(max_response_millis),

            sum_response_bytes: sea_orm::Set(self.sum_response_bytes),
            min_response_bytes: sea_orm::Set(min_response_bytes),
            mean_response_bytes: sea_orm::Set(mean_response_bytes),
            p50_response_bytes: sea_orm::Set(p50_response_bytes),
            p90_response_bytes: sea_orm::Set(p90_response_bytes),
            p99_response_bytes: sea_orm::Set(p99_response_bytes),
            max_response_bytes: sea_orm::Set(max_response_bytes),
        };

        aggregated_stat_model.save(db_conn).await?;

        Ok(())
    }
}

impl ProxyResponseStat {
    /// Capture the measurements for one finished request.
    ///
    /// * `method` - method name of the request
    /// * `authorization` - authorization the request ran under
    /// * `metadata` - per-request metadata. its atomics are read with `Ordering::Acquire`
    /// * `response` - the response being returned. only its serialized size is recorded
    ///
    /// # Panics
    ///
    /// Panics if `response` can not be serialized to JSON.
    // TODO: should RequestMetadata be in an arc? or can we handle refs here?
    pub fn new(
        method: String,
        authorization: Arc<Authorization>,
        metadata: Arc<RequestMetadata>,
        response: &JsonRpcForwardedResponse,
    ) -> Self {
        /// `io::Write` sink that throws the bytes away and only counts them
        struct ByteCounter(u64);

        impl std::io::Write for ByteCounter {
            fn write(&mut self, buf: &[u8]) -> std::io::Result<usize> {
                self.0 += buf.len() as u64;
                Ok(buf.len())
            }

            fn flush(&mut self) -> std::io::Result<()> {
                Ok(())
            }
        }

        // measure the serialized size without building the whole response string in memory
        let mut byte_counter = ByteCounter(0);
        serde_json::to_writer(&mut byte_counter, response)
            .expect("serializing here should always work");
        let response_bytes = byte_counter.0;

        let archive_request = metadata.archive_request.load(Ordering::Acquire);
        let backend_requests = metadata.backend_requests.load(Ordering::Acquire);
        let request_bytes = metadata.request_bytes;
        let error_response = metadata.error_response.load(Ordering::Acquire);

        // TODO: timestamps could get confused by leap seconds. need tokio time instead
        // measured last, so the time spent sizing the response above is included
        let response_millis = metadata.start_instant.elapsed().as_millis() as u64;

        Self {
            authorization,
            archive_request,
            method,
            backend_requests,
            request_bytes,
            error_response,
            response_bytes,
            response_millis,
        }
    }
}

impl StatEmitter {
    pub fn spawn(
        chain_id: u64,
        db_conn: DatabaseConnection,
        period_seconds: u64,
        shutdown_receiver: broadcast::Receiver<()>,
    ) -> anyhow::Result<StatEmitterSpawn> {
        let (stat_sender, stat_receiver) = flume::unbounded();

        let mut new = Self {
            chain_id,
            db_conn,
            period_seconds,
        };

        let handle =
            tokio::spawn(async move { new.stat_loop(stat_receiver, shutdown_receiver).await });

        Ok((stat_sender, handle).into())
    }

    async fn stat_loop(
        &mut self,
        stat_receiver: flume::Receiver<Web3ProxyStat>,
        mut shutdown_receiver: broadcast::Receiver<()>,
    ) -> anyhow::Result<()> {
        let system_now = SystemTime::now();

        let duration_since_epoch = system_now
            .duration_since(SystemTime::UNIX_EPOCH)
            .expect("time machines don't exist");

        // TODO: change period_seconds from u64 to u32
        let current_period = duration_since_epoch
            .checked_div(self.period_seconds as u32)
            .unwrap()
            * self.period_seconds as u32;

        let duration_to_next_period =
            Duration::from_secs(self.period_seconds) - (duration_since_epoch - current_period);

        // start the interval when the next period starts
        let start_instant = Instant::now() + duration_to_next_period;
        let mut interval = interval_at(start_instant, Duration::from_secs(self.period_seconds));

        // loop between different futures to update these mutables
        let mut period_timestamp = current_period.as_secs();
        let mut response_aggregate_map =
            HashMap::<ProxyResponseAggregateKey, ProxyResponseAggregate>::new();

        loop {
            tokio::select! {
                stat = stat_receiver.recv_async() => {
                    match stat? {
                        Web3ProxyStat::Response(stat) => {
                            let key = stat.key();

                            // TODO: does hashmap have get_or_insert?
                            if ! response_aggregate_map.contains_key(&key) {
                                response_aggregate_map.insert(key.clone(), Default::default());
                            };

                            if let Some(value) = response_aggregate_map.get_mut(&key) {
                                if let Err(err) = value.add(stat) {
                                    error!(?err, "unable to aggregate stats!");
                                };
                            } else {
                                unimplemented!();
                            }
                        }
                    }
                }
                _ = interval.tick() => {
                    // save all the aggregated stats
                    // TODO: batch these saves
                    for (key, aggregate) in response_aggregate_map.drain() {
                        if let Err(err) = aggregate.save(self.chain_id, &self.db_conn, key, period_timestamp).await {
                            error!(?err, "Unable to save stat while shutting down!");
                        };
                    }
                    // advance to the next period
                    // TODO: is this safe? what if there is drift?
                    period_timestamp += self.period_seconds;
                }
                x = shutdown_receiver.recv() => {
                    match x {
                        Ok(_) => {
                            info!("aggregate stat_loop shutting down");
                            // TODO: call aggregate_stat for all the
                        },
                        Err(err) => error!(?err, "shutdown receiver"),
                    }
                    break;
                }
            }
        }

        info!("saving {} pending stats", response_aggregate_map.len());

        for (key, aggregate) in response_aggregate_map.drain() {
            if let Err(err) = aggregate
                .save(self.chain_id, &self.db_conn, key, period_timestamp)
                .await
            {
                error!(?err, "Unable to save stat while shutting down!");
            };
        }

        info!("aggregated stat_loop shut down");

        Ok(())
    }
}
simplify authorization types so we can pass them deeper easily 2022-11-08 22:58:11 +03:00			`use crate::frontend::authorization::{Authorization, RequestMetadata};`
proper sizes for caches and emit all stats 2022-10-11 22:58:25 +03:00			`use crate::jsonrpc::JsonRpcForwardedResponse;`
stats almost work just need to update the migration to match our new ideas for columns. should also make the shutdown smarter so that nothing gets lost 2022-10-10 08:35:25 +03:00			`use chrono::{TimeZone, Utc};`
emit our first stats-- cache hits and misses 2022-10-03 23:02:05 +03:00			`use derive_more::From;`
add per-user rpc accounting 2022-10-10 07:15:07 +03:00			`use entities::rpc_accounting;`
better stats aggregations 2022-11-03 02:14:16 +03:00			`use hashbrown::HashMap;`
			`use hdrhistogram::{Histogram, RecordError};`
			`use sea_orm::{ActiveModelTrait, DatabaseConnection, DbErr};`
			`use std::sync::atomic::Ordering;`
add per-user rpc accounting 2022-10-10 07:15:07 +03:00			`use std::sync::Arc;`
better stats aggregations 2022-11-03 02:14:16 +03:00			`use std::time::{Duration, SystemTime};`
			`use tokio::sync::broadcast;`
add stat emitter 2022-10-03 21:08:01 +03:00			`use tokio::task::JoinHandle;`
better stats aggregations 2022-11-03 02:14:16 +03:00			`use tokio::time::{interval_at, Instant};`
			`use tracing::{error, info};`
emit our first stats-- cache hits and misses 2022-10-03 23:02:05 +03:00
add per-user rpc accounting 2022-10-10 07:15:07 +03:00			`/// TODO: where should this be defined?`
			`/// TODO: can we use something inside sea_orm instead?`
emit our first stats-- cache hits and misses 2022-10-03 23:02:05 +03:00			`#[derive(Debug)]`
add per-user rpc accounting 2022-10-10 07:15:07 +03:00			`pub struct ProxyResponseStat {`
simplify authorization types so we can pass them deeper easily 2022-11-08 22:58:11 +03:00			`authorization: Arc<Authorization>,`
add per-user rpc accounting 2022-10-10 07:15:07 +03:00			`method: String,`
better stats aggregations 2022-11-03 02:14:16 +03:00			`archive_request: bool,`
simplify authorization types so we can pass them deeper easily 2022-11-08 22:58:11 +03:00			`error_response: bool,`
proper sizes for caches and emit all stats 2022-10-11 22:58:25 +03:00			`request_bytes: u64,`
better stats aggregations 2022-11-03 02:14:16 +03:00			`/// if backend_requests is 0, there was a cache_hit`
update sea-orm and entities 2022-10-25 06:41:59 +03:00			`backend_requests: u64,`
proper sizes for caches and emit all stats 2022-10-11 22:58:25 +03:00			`response_bytes: u64,`
			`response_millis: u64,`
emit our first stats-- cache hits and misses 2022-10-03 23:02:05 +03:00			`}`

simplify authorization types so we can pass them deeper easily 2022-11-08 22:58:11 +03:00			`impl ProxyResponseStat {`
			`/// TODO: think more about this. probably rename it`
			`fn key(&self) -> ProxyResponseAggregateKey {`
			`ProxyResponseAggregateKey {`
			`rpc_key_id: self.authorization.checks.rpc_key_id,`
			`// TODO: include Origin here?`
			`method: self.method.clone(),`
			`archive_request: self.archive_request,`
			`error_response: self.error_response,`
			`}`
			`}`
			`}`

less locks and fix some stats 2022-10-11 20:34:25 +03:00			`pub struct ProxyResponseHistograms {`
			`request_bytes: Histogram<u64>,`
			`response_bytes: Histogram<u64>,`
			`response_millis: Histogram<u64>,`
			`}`

			`impl Default for ProxyResponseHistograms {`
			`fn default() -> Self {`
			`// TODO: how many significant figures?`
			`let request_bytes = Histogram::new(5).expect("creating request_bytes histogram");`
			`let response_bytes = Histogram::new(5).expect("creating response_bytes histogram");`
			`let response_millis = Histogram::new(5).expect("creating response_millis histogram");`

			`Self {`
			`request_bytes,`
			`response_bytes,`
			`response_millis,`
			`}`
			`}`
			`}`

simplify authorization types so we can pass them deeper easily 2022-11-08 22:58:11 +03:00			`// TODO: think more about if we should include IP address in this`
better stats aggregations 2022-11-03 02:14:16 +03:00			`#[derive(Clone, From, Hash, PartialEq, Eq)]`
			`struct ProxyResponseAggregateKey {`
rename api_key to rpc_key 2022-10-27 03:12:42 +03:00			`rpc_key_id: u64,`
this might be too many columns 2022-10-11 08:13:00 +03:00			`method: String,`
			`error_response: bool,`
better stats aggregations 2022-11-03 02:14:16 +03:00			`archive_request: bool,`
			`}`

			`#[derive(Default)]`
			`pub struct ProxyResponseAggregate {`
			`frontend_requests: u64,`
			`backend_requests: u64,`
simplify authorization types so we can pass them deeper easily 2022-11-08 22:58:11 +03:00			`// TODO: related to backend_requests`
better stats aggregations 2022-11-03 02:14:16 +03:00			`// backend_retries: u64,`
simplify authorization types so we can pass them deeper easily 2022-11-08 22:58:11 +03:00			`// TODO: related to backend_requests`
better stats aggregations 2022-11-03 02:14:16 +03:00			`// no_servers: u64,`
			`cache_misses: u64,`
			`cache_hits: u64,`
			`sum_request_bytes: u64,`
			`sum_response_bytes: u64,`
			`sum_response_millis: u64,`
			`histograms: ProxyResponseHistograms,`
			`}`

			`/// A stat that we aggregate and then store in a database.`
			`/// For now there is just one, but I think there might be others later`
			`#[derive(Debug, From)]`
			`pub enum Web3ProxyStat {`
			`Response(ProxyResponseStat),`
emit our first stats-- cache hits and misses 2022-10-03 23:02:05 +03:00			`}`

better stats aggregations 2022-11-03 02:14:16 +03:00			`#[derive(From)]`
			`pub struct StatEmitterSpawn {`
			`pub stat_sender: flume::Sender<Web3ProxyStat>,`
			`/// these handles are important and must be allowed to finish`
			`pub background_handle: JoinHandle<anyhow::Result<()>>,`
			`}`
add per-user rpc accounting 2022-10-10 07:15:07 +03:00
			`pub struct StatEmitter {`
			`chain_id: u64,`
			`db_conn: DatabaseConnection,`
			`period_seconds: u64,`
emit our first stats-- cache hits and misses 2022-10-03 23:02:05 +03:00			`}`

better stats aggregations 2022-11-03 02:14:16 +03:00			// TODO: impl `+=<ProxyResponseStat>` for ProxyResponseAggregate?
			`impl ProxyResponseAggregate {`
			`fn add(&mut self, stat: ProxyResponseStat) -> Result<(), RecordError> {`
			`// a stat always come from just 1 frontend request`
			`self.frontend_requests += 1;`

			`if stat.backend_requests == 0 {`
			`// no backend request. cache hit!`
			`self.cache_hits += 1;`
			`} else {`
			`// backend requests! cache miss!`
			`self.cache_misses += 1;`

			`// a stat might have multiple backend requests`
			`self.backend_requests += stat.backend_requests;`
			`}`

			`self.sum_request_bytes += stat.request_bytes;`
			`self.sum_response_bytes += stat.response_bytes;`
			`self.sum_response_millis += stat.response_millis;`

			// TODO: use `record_correct`?
			`self.histograms.request_bytes.record(stat.request_bytes)?;`
			`self.histograms`
			`.response_millis`
			`.record(stat.response_millis)?;`
			`self.histograms.response_bytes.record(stat.response_bytes)?;`

			`Ok(())`
			`}`

			`// TODO? help to turn this plus the key into a database model?`
			`// TODO: take a db transaction instead so that we can batch`
			`async fn save(`
			`self,`
			`chain_id: u64,`
			`db_conn: &DatabaseConnection,`
			`key: ProxyResponseAggregateKey,`
			`period_timestamp: u64,`
			`) -> Result<(), DbErr> {`
			`// this is a lot of variables`
			`let period_datetime = Utc.timestamp(period_timestamp as i64, 0);`

			`let request_bytes = &self.histograms.request_bytes;`

			`let min_request_bytes = request_bytes.min();`
			`let mean_request_bytes = request_bytes.mean();`
			`let p50_request_bytes = request_bytes.value_at_quantile(0.50);`
			`let p90_request_bytes = request_bytes.value_at_quantile(0.90);`
			`let p99_request_bytes = request_bytes.value_at_quantile(0.99);`
			`let max_request_bytes = request_bytes.max();`

			`let response_millis = &self.histograms.response_millis;`

			`let min_response_millis = response_millis.min();`
			`let mean_response_millis = response_millis.mean();`
			`let p50_response_millis = response_millis.value_at_quantile(0.50);`
			`let p90_response_millis = response_millis.value_at_quantile(0.90);`
			`let p99_response_millis = response_millis.value_at_quantile(0.99);`
			`let max_response_millis = response_millis.max();`

			`let response_bytes = &self.histograms.response_bytes;`

			`let min_response_bytes = response_bytes.min();`
			`let mean_response_bytes = response_bytes.mean();`
			`let p50_response_bytes = response_bytes.value_at_quantile(0.50);`
			`let p90_response_bytes = response_bytes.value_at_quantile(0.90);`
			`let p99_response_bytes = response_bytes.value_at_quantile(0.99);`
			`let max_response_bytes = response_bytes.max();`

simplify authorization types so we can pass them deeper easily 2022-11-08 22:58:11 +03:00			`// TODO: Set origin and maybe other things on this model. probably not the ip though`
better stats aggregations 2022-11-03 02:14:16 +03:00			`let aggregated_stat_model = rpc_accounting::ActiveModel {`
			`id: sea_orm::NotSet,`
simplify authorization types so we can pass them deeper easily 2022-11-08 22:58:11 +03:00			`// origin: sea_orm::Set(key.authorization.origin.to_string()),`
better stats aggregations 2022-11-03 02:14:16 +03:00			`rpc_key_id: sea_orm::Set(key.rpc_key_id),`
			`chain_id: sea_orm::Set(chain_id),`
			`method: sea_orm::Set(key.method),`
			`archive_request: sea_orm::Set(key.archive_request),`
			`error_response: sea_orm::Set(key.error_response),`
			`period_datetime: sea_orm::Set(period_datetime),`
			`frontend_requests: sea_orm::Set(self.frontend_requests),`
			`backend_requests: sea_orm::Set(self.backend_requests),`
			`// backend_retries: sea_orm::Set(self.backend_retries),`
			`// no_servers: sea_orm::Set(self.no_servers),`
			`cache_misses: sea_orm::Set(self.cache_misses),`
			`cache_hits: sea_orm::Set(self.cache_hits),`

			`sum_request_bytes: sea_orm::Set(self.sum_request_bytes),`
			`min_request_bytes: sea_orm::Set(min_request_bytes),`
			`mean_request_bytes: sea_orm::Set(mean_request_bytes),`
			`p50_request_bytes: sea_orm::Set(p50_request_bytes),`
			`p90_request_bytes: sea_orm::Set(p90_request_bytes),`
			`p99_request_bytes: sea_orm::Set(p99_request_bytes),`
			`max_request_bytes: sea_orm::Set(max_request_bytes),`

			`sum_response_millis: sea_orm::Set(self.sum_response_millis),`
			`min_response_millis: sea_orm::Set(min_response_millis),`
			`mean_response_millis: sea_orm::Set(mean_response_millis),`
			`p50_response_millis: sea_orm::Set(p50_response_millis),`
			`p90_response_millis: sea_orm::Set(p90_response_millis),`
			`p99_response_millis: sea_orm::Set(p99_response_millis),`
			`max_response_millis: sea_orm::Set(max_response_millis),`

			`sum_response_bytes: sea_orm::Set(self.sum_response_bytes),`
			`min_response_bytes: sea_orm::Set(min_response_bytes),`
			`mean_response_bytes: sea_orm::Set(mean_response_bytes),`
			`p50_response_bytes: sea_orm::Set(p50_response_bytes),`
			`p90_response_bytes: sea_orm::Set(p90_response_bytes),`
			`p99_response_bytes: sea_orm::Set(p99_response_bytes),`
			`max_response_bytes: sea_orm::Set(max_response_bytes),`
			`};`

			`aggregated_stat_model.save(db_conn).await?;`

			`Ok(())`
			`}`
add stat emitter 2022-10-03 21:08:01 +03:00			`}`

add per-user rpc accounting 2022-10-10 07:15:07 +03:00			`impl ProxyResponseStat {`
			`// TODO: should RequestMetadata be in an arc? or can we handle refs here?`
proper sizes for caches and emit all stats 2022-10-11 22:58:25 +03:00			`pub fn new(`
			`method: String,`
simplify authorization types so we can pass them deeper easily 2022-11-08 22:58:11 +03:00			`authorization: Arc<Authorization>,`
proper sizes for caches and emit all stats 2022-10-11 22:58:25 +03:00			`metadata: Arc<RequestMetadata>,`
			`response: &JsonRpcForwardedResponse,`
			`) -> Self {`
			`// TODO: do this without serializing to a string. this is going to slow us down!`
			`let response_bytes = serde_json::to_string(response)`
			`.expect("serializing here should always work")`
			`.len() as u64;`

better stats aggregations 2022-11-03 02:14:16 +03:00			`let archive_request = metadata.archive_request.load(Ordering::Acquire);`
proper sizes for caches and emit all stats 2022-10-11 22:58:25 +03:00			`let backend_requests = metadata.backend_requests.load(Ordering::Acquire);`
better stats aggregations 2022-11-03 02:14:16 +03:00			`// let period_seconds = metadata.period_seconds;`
			`// let period_timestamp =`
			`// (metadata.start_datetime.timestamp() as u64) / period_seconds * period_seconds;`
proper sizes for caches and emit all stats 2022-10-11 22:58:25 +03:00			`let request_bytes = metadata.request_bytes;`
			`let error_response = metadata.error_response.load(Ordering::Acquire);`
less locks and fix some stats 2022-10-11 20:34:25 +03:00
missing loop 2022-10-21 02:50:06 +03:00			`// TODO: timestamps could get confused by leap seconds. need tokio time instead`
			`let response_millis = metadata.start_instant.elapsed().as_millis() as u64;`
i think it works 2022-10-12 00:31:34 +03:00
add per-user rpc accounting 2022-10-10 07:15:07 +03:00			`Self {`
simplify authorization types so we can pass them deeper easily 2022-11-08 22:58:11 +03:00			`authorization,`
better stats aggregations 2022-11-03 02:14:16 +03:00			`archive_request,`
add per-user rpc accounting 2022-10-10 07:15:07 +03:00			`method,`
proper sizes for caches and emit all stats 2022-10-11 22:58:25 +03:00			`backend_requests,`
			`request_bytes,`
			`error_response,`
			`response_bytes,`
			`response_millis,`
add stat emitter 2022-10-03 21:08:01 +03:00			`}`
			`}`
			`}`

			`impl StatEmitter {`
better stats aggregations 2022-11-03 02:14:16 +03:00			`pub fn spawn(`
			`chain_id: u64,`
			`db_conn: DatabaseConnection,`
			`period_seconds: u64,`
			`shutdown_receiver: broadcast::Receiver<()>,`
			`) -> anyhow::Result<StatEmitterSpawn> {`
			`let (stat_sender, stat_receiver) = flume::unbounded();`
add per-user rpc accounting 2022-10-10 07:15:07 +03:00
better stats aggregations 2022-11-03 02:14:16 +03:00			`let mut new = Self {`
add per-user rpc accounting 2022-10-10 07:15:07 +03:00			`chain_id,`
			`db_conn,`
			`period_seconds,`
			`};`

better stats aggregations 2022-11-03 02:14:16 +03:00			`let handle =`
			`tokio::spawn(async move { new.stat_loop(stat_receiver, shutdown_receiver).await });`
add per-user rpc accounting 2022-10-10 07:15:07 +03:00
better stats aggregations 2022-11-03 02:14:16 +03:00			`Ok((stat_sender, handle).into())`
this might be too many columns 2022-10-11 08:13:00 +03:00			`}`
stats in redis that actually work we should still investigate a real time series db, but stats in redis is much simpler for now 2022-10-07 05:15:53 +03:00
better stats aggregations 2022-11-03 02:14:16 +03:00			`async fn stat_loop(`
			`&mut self,`
			`stat_receiver: flume::Receiver<Web3ProxyStat>,`
wait on background threads 2022-10-21 01:51:56 +03:00			`mut shutdown_receiver: broadcast::Receiver<()>,`
this might be too many columns 2022-10-11 08:13:00 +03:00			`) -> anyhow::Result<()> {`
better stats aggregations 2022-11-03 02:14:16 +03:00			`let system_now = SystemTime::now();`
missing loop 2022-10-21 02:50:06 +03:00
better stats aggregations 2022-11-03 02:14:16 +03:00			`let duration_since_epoch = system_now`
			`.duration_since(SystemTime::UNIX_EPOCH)`
			`.expect("time machines don't exist");`
missing loop 2022-10-21 02:50:06 +03:00
better stats aggregations 2022-11-03 02:14:16 +03:00			`// TODO: change period_seconds from u64 to u32`
			`let current_period = duration_since_epoch`
			`.checked_div(self.period_seconds as u32)`
			`.unwrap()`
			`* self.period_seconds as u32;`

			`let duration_to_next_period =`
			`Duration::from_secs(self.period_seconds) - (duration_since_epoch - current_period);`

			`// start the interval when the next period starts`
			`let start_instant = Instant::now() + duration_to_next_period;`
			`let mut interval = interval_at(start_instant, Duration::from_secs(self.period_seconds));`

			`// loop between different futures to update these mutables`
			`let mut period_timestamp = current_period.as_secs();`
			`let mut response_aggregate_map =`
			`HashMap::<ProxyResponseAggregateKey, ProxyResponseAggregate>::new();`

			`loop {`
			`tokio::select! {`
			`stat = stat_receiver.recv_async() => {`
			`match stat? {`
			`Web3ProxyStat::Response(stat) => {`
			`let key = stat.key();`

			`// TODO: does hashmap have get_or_insert?`
			`if ! response_aggregate_map.contains_key(&key) {`
			`response_aggregate_map.insert(key.clone(), Default::default());`
			`};`

			`if let Some(value) = response_aggregate_map.get_mut(&key) {`
			`if let Err(err) = value.add(stat) {`
			`error!(?err, "unable to aggregate stats!");`
			`};`
			`} else {`
			`unimplemented!();`
			`}`
missing loop 2022-10-21 02:50:06 +03:00			`}`
wait on background threads 2022-10-21 01:51:56 +03:00			`}`
			`}`
better stats aggregations 2022-11-03 02:14:16 +03:00			`_ = interval.tick() => {`
			`// save all the aggregated stats`
			`// TODO: batch these saves`
			`for (key, aggregate) in response_aggregate_map.drain() {`
			`if let Err(err) = aggregate.save(self.chain_id, &self.db_conn, key, period_timestamp).await {`
			`error!(?err, "Unable to save stat while shutting down!");`
			`};`
			`}`
			`// advance to the next period`
			`// TODO: is this safe? what if there is drift?`
			`period_timestamp += self.period_seconds;`
			`}`
missing loop 2022-10-21 02:50:06 +03:00			`x = shutdown_receiver.recv() => {`
			`match x {`
better stats aggregations 2022-11-03 02:14:16 +03:00			`Ok(_) => {`
			`info!("aggregate stat_loop shutting down");`
			`// TODO: call aggregate_stat for all the`
			`},`
missing loop 2022-10-21 02:50:06 +03:00			`Err(err) => error!(?err, "shutdown receiver"),`
			`}`
			`break;`
wait on background threads 2022-10-21 01:51:56 +03:00			`}`
			`}`
this might be too many columns 2022-10-11 08:13:00 +03:00			`}`
stats almost work just need to update the migration to match our new ideas for columns. should also make the shutdown smarter so that nothing gets lost 2022-10-10 08:35:25 +03:00
dry stats 2022-11-04 07:32:09 +03:00			`info!("saving {} pending stats", response_aggregate_map.len());`
fix joins for user_stats_aggregate_get 2022-11-04 06:40:43 +03:00
better stats aggregations 2022-11-03 02:14:16 +03:00			`for (key, aggregate) in response_aggregate_map.drain() {`
			`if let Err(err) = aggregate`
			`.save(self.chain_id, &self.db_conn, key, period_timestamp)`
			`.await`
			`{`
			`error!(?err, "Unable to save stat while shutting down!");`
			`};`
this might be too many columns 2022-10-11 08:13:00 +03:00			`}`
add stat emitter 2022-10-03 21:08:01 +03:00
better stats aggregations 2022-11-03 02:14:16 +03:00			`info!("aggregated stat_loop shut down");`
add per-user rpc accounting 2022-10-10 07:15:07 +03:00
			`Ok(())`
			`}`
add stat emitter 2022-10-03 21:08:01 +03:00			`}`