foyer-bench 0.1.4

bench tool for foyer - the hybrid cache for Rust
//  Copyright 2024 Foyer Project Authors
//
//  Licensed under the Apache License, Version 2.0 (the "License");
//  you may not use this file except in compliance with the License.
//  You may obtain a copy of the License at
//
//  http://www.apache.org/licenses/LICENSE-2.0
//
//  Unless required by applicable law or agreed to in writing, software
//  distributed under the License is distributed on an "AS IS" BASIS,
//  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
//  See the License for the specific language governing permissions and
//  limitations under the License.

// Copyright 2023 RisingWave Labs
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::{
    sync::{
        atomic::{AtomicUsize, Ordering},
        Arc,
    },
    time::{Duration, Instant},
};

use bytesize::ByteSize;
use foyer::DeviceStats;
use hdrhistogram::Histogram;
use parking_lot::RwLock;
use tokio::sync::broadcast;

// latencies are measured by 'us'
#[derive(Clone, Copy, Debug)]
pub struct Analysis {
    disk_read_iops: f64,
    disk_read_throughput: f64,
    disk_write_iops: f64,
    disk_write_throughput: f64,

    insert_iops: f64,
    insert_throughput: f64,
    insert_lat_p50: u64,
    insert_lat_p90: u64,
    insert_lat_p99: u64,
    insert_lat_p999: u64,
    insert_lat_p9999: u64,
    insert_lat_p99999: u64,
    insert_lat_pmax: u64,

    get_iops: f64,
    get_miss: f64,
    get_throughput: f64,
    get_miss_lat_p50: u64,
    get_miss_lat_p90: u64,
    get_miss_lat_p99: u64,
    get_miss_lat_p999: u64,
    get_miss_lat_p9999: u64,
    get_miss_lat_p99999: u64,
    get_miss_lat_pmax: u64,
    get_hit_lat_p50: u64,
    get_hit_lat_p90: u64,
    get_hit_lat_p99: u64,
    get_hit_lat_p999: u64,
    get_hit_lat_p9999: u64,
    get_hit_lat_p99999: u64,
    get_hit_lat_pmax: u64,
}

#[derive(Default, Clone, Copy, Debug)]
pub struct MetricsDump {
    pub insert_ios: usize,
    pub insert_bytes: usize,
    pub insert_lat_p50: u64,
    pub insert_lat_p90: u64,
    pub insert_lat_p99: u64,
    pub insert_lat_p999: u64,
    pub insert_lat_p9999: u64,
    pub insert_lat_p99999: u64,
    pub insert_lat_pmax: u64,

    pub get_ios: usize,
    pub get_miss_ios: usize,
    pub get_bytes: usize,
    pub get_hit_lat_p50: u64,
    pub get_hit_lat_p90: u64,
    pub get_hit_lat_p99: u64,
    pub get_hit_lat_p999: u64,
    pub get_hit_lat_p9999: u64,
    pub get_hit_lat_p99999: u64,
    pub get_hit_lat_pmax: u64,
    pub get_miss_lat_p50: u64,
    pub get_miss_lat_p90: u64,
    pub get_miss_lat_p99: u64,
    pub get_miss_lat_p999: u64,
    pub get_miss_lat_p9999: u64,
    pub get_miss_lat_p99999: u64,
    pub get_miss_lat_pmax: u64,
}

#[derive(Clone, Debug)]
pub struct Metrics {
    pub insert_ios: Arc<AtomicUsize>,
    pub insert_bytes: Arc<AtomicUsize>,
    pub insert_lats: Arc<RwLock<Histogram<u64>>>,

    pub get_ios: Arc<AtomicUsize>,
    pub get_bytes: Arc<AtomicUsize>,
    pub get_miss_ios: Arc<AtomicUsize>,
    pub get_hit_lats: Arc<RwLock<Histogram<u64>>>,
    pub get_miss_lats: Arc<RwLock<Histogram<u64>>>,
}

impl Default for Metrics {
    fn default() -> Self {
        Self {
            insert_ios: Arc::new(AtomicUsize::new(0)),
            insert_bytes: Arc::new(AtomicUsize::new(0)),
            insert_lats: Arc::new(RwLock::new(Histogram::new_with_bounds(1, 10_000_000, 2).unwrap())),

            get_ios: Arc::new(AtomicUsize::new(0)),
            get_bytes: Arc::new(AtomicUsize::new(0)),
            get_miss_ios: Arc::new(AtomicUsize::new(0)),
            get_hit_lats: Arc::new(RwLock::new(Histogram::new_with_bounds(1, 10_000_000, 2).unwrap())),
            get_miss_lats: Arc::new(RwLock::new(Histogram::new_with_bounds(1, 10_000_000, 2).unwrap())),
        }
    }
}

impl Metrics {
    pub fn dump(&self) -> MetricsDump {
        let insert_lats = self.insert_lats.read();
        let get_hit_lats = self.get_hit_lats.read();
        let get_miss_lats = self.get_miss_lats.read();

        MetricsDump {
            insert_ios: self.insert_ios.load(Ordering::Relaxed),
            insert_bytes: self.insert_bytes.load(Ordering::Relaxed),
            insert_lat_p50: insert_lats.value_at_quantile(0.5),
            insert_lat_p90: insert_lats.value_at_quantile(0.9),
            insert_lat_p99: insert_lats.value_at_quantile(0.99),
            insert_lat_p999: insert_lats.value_at_quantile(0.999),
            insert_lat_p9999: insert_lats.value_at_quantile(0.9999),
            insert_lat_p99999: insert_lats.value_at_quantile(0.99999),
            insert_lat_pmax: insert_lats.max(),

            get_ios: self.get_ios.load(Ordering::Relaxed),
            get_miss_ios: self.get_miss_ios.load(Ordering::Relaxed),
            get_bytes: self.get_bytes.load(Ordering::Relaxed),
            get_hit_lat_p50: get_hit_lats.value_at_quantile(0.5),
            get_hit_lat_p90: get_hit_lats.value_at_quantile(0.9),
            get_hit_lat_p99: get_hit_lats.value_at_quantile(0.99),
            get_hit_lat_p999: get_hit_lats.value_at_quantile(0.999),
            get_hit_lat_p9999: get_hit_lats.value_at_quantile(0.9999),
            get_hit_lat_p99999: get_hit_lats.value_at_quantile(0.99999),
            get_hit_lat_pmax: get_hit_lats.max(),
            get_miss_lat_p50: get_miss_lats.value_at_quantile(0.5),
            get_miss_lat_p90: get_miss_lats.value_at_quantile(0.9),
            get_miss_lat_p99: get_miss_lats.value_at_quantile(0.99),
            get_miss_lat_p999: get_miss_lats.value_at_quantile(0.999),
            get_miss_lat_p9999: get_miss_lats.value_at_quantile(0.9999),
            get_miss_lat_p99999: get_miss_lats.value_at_quantile(0.99999),
            get_miss_lat_pmax: get_miss_lats.max(),
        }
    }
}

impl std::fmt::Display for Analysis {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let disk_read_throughput = ByteSize::b(self.disk_read_throughput as u64);
        let disk_write_throughput = ByteSize::b(self.disk_write_throughput as u64);
        let disk_total_throughput = disk_read_throughput + disk_write_throughput;

        // disk statics
        writeln!(f, "disk total iops: {:.1}", self.disk_write_iops + self.disk_read_iops)?;
        writeln!(
            f,
            "disk total throughput: {}/s",
            disk_total_throughput.to_string_as(true)
        )?;
        writeln!(f, "disk read iops: {:.1}", self.disk_read_iops)?;
        writeln!(f, "disk read throughput: {}/s", disk_read_throughput.to_string_as(true))?;
        writeln!(f, "disk write iops: {:.1}", self.disk_write_iops)?;
        writeln!(
            f,
            "disk write throughput: {}/s",
            disk_write_throughput.to_string_as(true)
        )?;

        // insert statics
        let insert_throughput = ByteSize::b(self.insert_throughput as u64);
        writeln!(f, "insert iops: {:.1}/s", self.insert_iops)?;
        writeln!(f, "insert throughput: {}/s", insert_throughput.to_string_as(true))?;
        writeln!(f, "insert lat p50: {}us", self.insert_lat_p50)?;
        writeln!(f, "insert lat p90: {}us", self.insert_lat_p90)?;
        writeln!(f, "insert lat p99: {}us", self.insert_lat_p99)?;
        writeln!(f, "insert lat p999: {}us", self.insert_lat_p999)?;
        writeln!(f, "insert lat p9999: {}us", self.insert_lat_p9999)?;
        writeln!(f, "insert lat p99999: {}us", self.insert_lat_p99999)?;
        writeln!(f, "insert lat pmax: {}us", self.insert_lat_pmax)?;

        // get statics
        let get_throughput = ByteSize::b(self.get_throughput as u64);
        writeln!(f, "get iops: {:.1}/s", self.get_iops)?;
        writeln!(f, "get miss: {:.2}% ", self.get_miss * 100f64)?;
        writeln!(f, "get throughput: {}/s", get_throughput.to_string_as(true))?;
        writeln!(f, "get hit lat p50: {}us", self.get_hit_lat_p50)?;
        writeln!(f, "get hit lat p90: {}us", self.get_hit_lat_p90)?;
        writeln!(f, "get hit lat p99: {}us", self.get_hit_lat_p99)?;
        writeln!(f, "get hit lat p999: {}us", self.get_hit_lat_p999)?;
        writeln!(f, "get hit lat p9999: {}us", self.get_hit_lat_p9999)?;
        writeln!(f, "get hit lat p99999: {}us", self.get_hit_lat_p99999)?;
        writeln!(f, "get hit lat pmax: {}us", self.get_hit_lat_pmax)?;
        writeln!(f, "get miss lat p50: {}us", self.get_miss_lat_p50)?;
        writeln!(f, "get miss lat p90: {}us", self.get_miss_lat_p90)?;
        writeln!(f, "get miss lat p99: {}us", self.get_miss_lat_p99)?;
        writeln!(f, "get miss lat p999: {}us", self.get_miss_lat_p999)?;
        writeln!(f, "get miss lat p9999: {}us", self.get_miss_lat_p9999)?;
        writeln!(f, "get miss lat p99999: {}us", self.get_miss_lat_p99999)?;
        writeln!(f, "get miss lat pmax: {}us", self.get_miss_lat_pmax)?;

        Ok(())
    }
}

pub struct IoStat {
    pub read_ios: usize,
    pub read_bytes: usize,

    pub write_ios: usize,
    pub write_bytes: usize,
}

impl IoStat {
    pub fn snapshot(stats: &DeviceStats) -> Self {
        Self {
            read_ios: stats.read_ios.load(Ordering::Relaxed),
            read_bytes: stats.read_bytes.load(Ordering::Relaxed),
            write_ios: stats.write_ios.load(Ordering::Relaxed),
            write_bytes: stats.write_bytes.load(Ordering::Relaxed),
        }
    }
}

pub fn analyze(
    duration: Duration,
    iostat_start: &IoStat,
    iostat_end: &IoStat,
    metrics_dump_start: &MetricsDump,
    metrics_dump_end: &MetricsDump,
) -> Analysis {
    let secs = duration.as_secs_f64();
    let disk_read_iops = (iostat_end.read_ios - iostat_start.read_ios) as f64 / secs;
    let disk_read_throughput = (iostat_end.read_bytes - iostat_start.read_bytes) as f64 / secs;
    let disk_write_iops = (iostat_end.write_ios - iostat_start.write_ios) as f64 / secs;
    let disk_write_throughput = (iostat_end.write_bytes - iostat_start.write_bytes) as f64 / secs;

    let insert_iops = (metrics_dump_end.insert_ios - metrics_dump_start.insert_ios) as f64 / secs;
    let insert_throughput = (metrics_dump_end.insert_bytes - metrics_dump_start.insert_bytes) as f64 / secs;

    let get_iops = (metrics_dump_end.get_ios - metrics_dump_start.get_ios) as f64 / secs;
    let get_miss = (metrics_dump_end.get_miss_ios - metrics_dump_start.get_miss_ios) as f64
        / (metrics_dump_end.get_ios - metrics_dump_start.get_ios) as f64;
    let get_throughput = (metrics_dump_end.get_bytes - metrics_dump_start.get_bytes) as f64 / secs;

    Analysis {
        disk_read_iops,
        disk_read_throughput,
        disk_write_iops,
        disk_write_throughput,

        insert_iops,
        insert_throughput,
        insert_lat_p50: metrics_dump_end.insert_lat_p50,
        insert_lat_p90: metrics_dump_end.insert_lat_p90,
        insert_lat_p99: metrics_dump_end.insert_lat_p99,
        insert_lat_p999: metrics_dump_end.insert_lat_p999,
        insert_lat_p9999: metrics_dump_end.insert_lat_p9999,
        insert_lat_p99999: metrics_dump_end.insert_lat_p99999,
        insert_lat_pmax: metrics_dump_end.insert_lat_pmax,

        get_iops,
        get_miss,
        get_throughput,
        get_hit_lat_p50: metrics_dump_end.get_hit_lat_p50,
        get_hit_lat_p90: metrics_dump_end.get_hit_lat_p90,
        get_hit_lat_p99: metrics_dump_end.get_hit_lat_p99,
        get_hit_lat_p999: metrics_dump_end.get_hit_lat_p999,
        get_hit_lat_p9999: metrics_dump_end.get_hit_lat_p9999,
        get_hit_lat_p99999: metrics_dump_end.get_hit_lat_p99999,
        get_hit_lat_pmax: metrics_dump_end.get_hit_lat_pmax,
        get_miss_lat_p50: metrics_dump_end.get_miss_lat_p50,
        get_miss_lat_p90: metrics_dump_end.get_miss_lat_p90,
        get_miss_lat_p99: metrics_dump_end.get_miss_lat_p99,
        get_miss_lat_p999: metrics_dump_end.get_miss_lat_p999,
        get_miss_lat_p9999: metrics_dump_end.get_miss_lat_p9999,
        get_miss_lat_p99999: metrics_dump_end.get_miss_lat_p99999,
        get_miss_lat_pmax: metrics_dump_end.get_miss_lat_pmax,
    }
}

pub async fn monitor(
    stats: Arc<DeviceStats>,
    interval: Duration,
    total_secs: Duration,
    warm_up: Duration,
    metrics: Metrics,
    mut stop: broadcast::Receiver<()>,
) {
    let start = Instant::now();

    loop {
        tokio::time::sleep(Duration::from_secs(1)).await;
        println!("warm up... [{}s/{}s]", start.elapsed().as_secs(), warm_up.as_secs());
        if start.elapsed() > warm_up {
            break;
        }
    }

    let mut stat = IoStat::snapshot(&stats);
    let mut metrics_dump = metrics.dump();

    let start = Instant::now();

    loop {
        let now = Instant::now();
        match stop.try_recv() {
            Err(broadcast::error::TryRecvError::Empty) => {}
            _ => return,
        }

        tokio::time::sleep(interval).await;
        let new_stat = IoStat::snapshot(&stats);
        let new_metrics_dump = metrics.dump();
        let analysis = analyze(
            // interval may have ~ +7% error
            now.elapsed(),
            &stat,
            &new_stat,
            &metrics_dump,
            &new_metrics_dump,
        );
        println!("[{}s/{}s]", start.elapsed().as_secs(), total_secs.as_secs());
        println!("{}", analysis);
        stat = new_stat;
        metrics_dump = new_metrics_dump;
    }
}