add benchmark utility to profile memory usage

ding-young · ding-young · commit aec319129873 · 2025-07-18T07:34:02.000Z
diff --git a/Cargo.lock b/Cargo.lock
diff --git a/benchmarks/Cargo.toml b/benchmarks/Cargo.toml
@@ -45,6 +45,7 @@ mimalloc = { version = "0.1", optional = true, default-features = false }
 object_store = { workspace = true }
 parquet = { workspace = true, default-features = true }
 rand = { workspace = true }
+regex.workspace = true
 serde = { version = "1.0.219", features = ["derive"] }
 serde_json = { workspace = true }
 snmalloc-rs = { version = "0.3", optional = true }
@@ -53,5 +54,8 @@ test-utils = { path = "../test-utils/", version = "0.1.0" }
 tokio = { workspace = true, features = ["rt-multi-thread", "parking_lot"] }
 tokio-util = { version = "0.7.15" }
 
+[target.'cfg(target_os = "linux")'.dependencies]
+procfs = "0.17.0"
+
 [dev-dependencies]
 datafusion-proto = { workspace = true }
diff --git a/benchmarks/src/bin/mem_profile.rs b/benchmarks/src/bin/mem_profile.rs
@@ -0,0 +1,205 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! mem_profile binary entrypoint
+use datafusion::error::Result;
+use std::{
+    io::{BufRead, BufReader},
+    process::{Command, Stdio},
+};
+use structopt::StructOpt;
+
+// Top-level command-line options for the `mem_profile` binary.
+//
+// These notes are plain `//` comments on purpose: `structopt` turns `///`
+// doc comments into help text, which would change what the CLI prints.
+#[derive(Debug, StructOpt)]
+#[structopt(about = "memory profile command")]
+struct MemProfileOpt {
+    // The benchmark suite to profile, parsed as a subcommand.
+    #[structopt(subcommand)]
+    command: BenchmarkCommand,
+}
+
+// Benchmark suites that `mem_profile` can run; this is the subcommand type of
+// `MemProfileOpt`. Plain `//` comments are used so that the help text
+// generated by `structopt` stays unchanged.
+#[derive(Debug, StructOpt)]
+enum BenchmarkCommand {
+    // Profile TPC-H queries; handled by `run_tpch_benchmark`.
+    Tpch(TpchOpt),
+    // TODO Add other benchmark commands here
+}
+
+// Options of the `tpch` subcommand. This header is a plain `//` comment so
+// that it does not leak into the help text generated by `structopt`.
+#[derive(Debug, StructOpt)]
+struct TpchOpt {
+    /// Path to the TPC-H data, forwarded to `dfbench tpch` as `--path`
+    #[structopt(long, required = true)]
+    path: String,
+
+    /// Query number. If not specified, runs all queries
+    #[structopt(short, long)]
+    query: Option<usize>,
+}
+
+/// Entry point of the `mem_profile` tool.
+///
+/// Parses the command line, pre-builds the `dfbench` binary with the
+/// `release-nonlto` profile and then runs the selected benchmark.
+///
+/// # Errors
+///
+/// Returns an error if `cargo` cannot be started, if the build does not
+/// succeed, or if the selected benchmark returns an error.
+#[tokio::main]
+pub async fn main() -> Result<()> {
+    use datafusion::error::DataFusionError;
+
+    // 1. Parse args and determine which benchmark should be run.
+    let opt = MemProfileOpt::from_args();
+
+    // 2. Build the benchmark binary up front so that the build process does
+    //    not blow up memory while the benchmark itself is being measured.
+    println!("Pre-building benchmark binary...");
+    let status = Command::new("cargo")
+        .args(["build", "--profile", "release-nonlto", "--bin", "dfbench"])
+        .status()
+        .map_err(|e| {
+            DataFusionError::Execution(format!("Failed to build dfbench: {e}"))
+        })?;
+
+    // A failed build is an expected runtime condition, so report it through
+    // the `Result` this function already returns instead of panicking.
+    if !status.success() {
+        return Err(DataFusionError::Execution(format!(
+            "Failed to build dfbench: {status}"
+        )));
+    }
+    println!("Benchmark binary built successfully.");
+
+    // 3. Run the selected benchmark with the parsed options.
+    match opt.command {
+        BenchmarkCommand::Tpch(tpch_opt) => {
+            run_tpch_benchmark(tpch_opt).await?;
+        }
+    }
+
+    // Results are only printed; no result file is written.
+    Ok(())
+}
+
+/// Runs the requested TPC-H queries, one `dfbench` process per query, and
+/// prints a summary table of the collected time and memory figures.
+///
+/// When `opt.query` is `None`, queries 1 through 22 are run. A query whose
+/// run fails, or whose output contains no statistics, is reported on stderr
+/// and skipped so that the remaining queries still run.
+async fn run_tpch_benchmark(opt: TpchOpt) -> Result<()> {
+    let TpchOpt { path, query } = opt;
+
+    // The query number is appended after the trailing `--query` flag for
+    // each run and removed again afterwards.
+    let mut args: Vec<String> = vec![
+        "./target/release-nonlto/dfbench".to_string(),
+        "tpch".to_string(),
+        "--iterations".to_string(),
+        "1".to_string(),
+        "--path".to_string(),
+        path,
+        "--format".to_string(),
+        "parquet".to_string(),
+        "--partitions".to_string(),
+        "4".to_string(),
+        "--memory-stat-enabled".to_string(),
+        "--query".to_string(),
+    ];
+
+    let query_ids: Vec<usize> = match query {
+        Some(query_id) => vec![query_id],
+        // run all queries.
+        None => (1..=22).collect(),
+    };
+
+    let mut results = Vec::with_capacity(query_ids.len());
+    for query_id in query_ids {
+        args.push(query_id.to_string());
+        // Keep going on failure, but never discard the error silently.
+        if let Err(e) = run_query(&args, &mut results) {
+            eprintln!("Skipping query {query_id}: {e}");
+        }
+        args.pop();
+    }
+
+    print_summary_table(&results);
+    Ok(())
+}
+
+/// Runs one benchmark process and appends its parsed result to `results`.
+///
+/// `args[0]` is the executable and the remaining elements are its arguments.
+/// The child's stdout is captured in full. The result is taken from the first
+/// line accepted by `parse_query_time` that is directly followed by a line
+/// accepted by `parse_vm_line`.
+///
+/// # Errors
+///
+/// Returns an error if `args` is empty, if the process cannot be started or
+/// waited for, if it exits unsuccessfully, if its output cannot be read, or
+/// if the output contains no such pair of lines.
+fn run_query(args: &[String], results: &mut Vec<QueryResult>) -> Result<()> {
+    use datafusion::error::DataFusionError;
+
+    let (exec_path, exec_args) = args.split_first().ok_or_else(|| {
+        DataFusionError::Execution("No benchmark executable given".to_string())
+    })?;
+
+    let mut child = Command::new(exec_path)
+        .args(exec_args)
+        .stdout(Stdio::piped())
+        .spawn()
+        .map_err(|e| {
+            DataFusionError::Execution(format!(
+                "Failed to start benchmark {exec_path}: {e}"
+            ))
+        })?;
+
+    let stdout = child
+        .stdout
+        .take()
+        .expect("stdout is present because it was configured as piped");
+
+    // buffer stdout
+    let lines: Result<Vec<String>, std::io::Error> =
+        BufReader::new(stdout).lines().collect();
+
+    // Wait for the child before looking at `lines`, so that the process is
+    // reaped even when reading its output failed.
+    let status = child.wait()?;
+    if !status.success() {
+        return Err(DataFusionError::Execution(format!(
+            "Benchmark process failed with {status}"
+        )));
+    }
+
+    // parse after child process terminates
+    let lines = lines?;
+    let parsed = lines.windows(2).find_map(|pair| {
+        let (query, duration_ms) = parse_query_time(&pair[0])?;
+        let (vmpeak, vmhwm, resident) = parse_vm_line(&pair[1])?;
+        Some(QueryResult {
+            query,
+            duration_ms,
+            vmpeak,
+            vmhwm,
+            resident,
+        })
+    });
+
+    match parsed {
+        Some(result) => {
+            results.push(result);
+            Ok(())
+        }
+        None => Err(DataFusionError::Execution(
+            "benchmark output did not contain a timing line followed by a memory statistics line"
+                .to_string(),
+        )),
+    }
+}
+
+/// Time and memory figures parsed from the output of one benchmark run.
+#[derive(Debug)]
+struct QueryResult {
+    /// Query number captured from the `Query N avg time: T ms` line.
+    query: usize,
+    /// Average time in milliseconds captured from that same line.
+    duration_ms: f64,
+    /// `VmPeak` value exactly as captured from the memory statistics line.
+    vmpeak: String,
+    /// `VmHWM` value exactly as captured from the memory statistics line.
+    vmhwm: String,
+    /// `RSS` value exactly as captured from the memory statistics line.
+    resident: String,
+}
+
+/// Extracts the query number and the average time in milliseconds from a
+/// line containing `Query N avg time: T ms`.
+///
+/// Returns `None` if the line does not contain that pattern or if either
+/// captured number fails to parse.
+fn parse_query_time(line: &str) -> Option<(usize, f64)> {
+    // Compiled once and reused: this function is called for every line of
+    // benchmark output, and compiling a regex is comparatively expensive.
+    static RE: std::sync::OnceLock<regex::Regex> = std::sync::OnceLock::new();
+    let re = RE.get_or_init(|| {
+        regex::Regex::new(r"Query (\d+) avg time: ([\d.]+) ms")
+            .expect("hard-coded regex is valid")
+    });
+
+    let caps = re.captures(line)?;
+    let query_id = caps[1].parse::<usize>().ok()?;
+    let avg_time = caps[2].parse::<f64>().ok()?;
+    Some((query_id, avg_time))
+}
+
+/// Extracts the `VmPeak`, `VmHWM` and `RSS` values, as text, from a line of
+/// the form `VmPeak: V, VmHWM: V, RSS: V`.
+///
+/// Each value is a number followed by an upper-case unit. `VmPeak` and
+/// `VmHWM` may also be the literal `N/A`, which is what `print_memory_stats`
+/// emits when a value is unavailable; without accepting it, such a line
+/// would be rejected and the whole query result lost.
+///
+/// Returns `None` if the line does not contain that pattern.
+fn parse_vm_line(line: &str) -> Option<(String, String, String)> {
+    // Compiled once and reused across calls.
+    static RE: std::sync::OnceLock<regex::Regex> = std::sync::OnceLock::new();
+    let re = RE.get_or_init(|| {
+        regex::Regex::new(
+            r"VmPeak:\s*(N/A|[\d.]+\s*[A-Z]+),\s*VmHWM:\s*(N/A|[\d.]+\s*[A-Z]+),\s*RSS:\s*([\d.]+\s*[A-Z]+)"
+        )
+        .expect("hard-coded regex is valid")
+    });
+
+    let caps = re.captures(line)?;
+    let vmpeak = caps.get(1)?.as_str().to_string();
+    let vmhwm = caps.get(2)?.as_str().to_string();
+    let resident = caps.get(3)?.as_str().to_string();
+    Some((vmpeak, vmhwm, resident))
+}
+
+/// Writes the collected results to stdout as a plain, column-aligned table:
+/// a header row, a dashed rule, then one row per entry of `results`.
+fn print_summary_table(results: &[QueryResult]) {
+    let header = format!(
+        "\n{:<8} {:>10} {:>12} {:>12} {:>12}",
+        "Query", "Time (ms)", "VmPeak", "VmHWM", "RSS"
+    );
+    let rule = "-".repeat(68);
+    println!("{header}");
+    println!("{rule}");
+
+    results.iter().for_each(|row| {
+        let QueryResult {
+            query,
+            duration_ms,
+            vmpeak,
+            vmhwm,
+            resident,
+        } = row;
+        println!(
+            "{:<8} {:>10.2} {:>12} {:>12} {:>12}",
+            query, duration_ms, vmpeak, vmhwm, resident
+        );
+    });
+}
diff --git a/benchmarks/src/clickbench.rs b/benchmarks/src/clickbench.rs
@@ -19,7 +19,7 @@ use std::fs;
 use std::io::ErrorKind;
 use std::path::{Path, PathBuf};
 
-use crate::util::{BenchmarkRun, CommonOpt, QueryResult};
+use crate::util::{print_memory_stats, BenchmarkRun, CommonOpt, QueryResult};
 use datafusion::logical_expr::{ExplainFormat, ExplainOption};
 use datafusion::{
     error::{DataFusionError, Result},
@@ -192,6 +192,10 @@ impl RunOpt {
         }
         let avg = millis.iter().sum::<f64>() / millis.len() as f64;
         println!("Query {query_id} avg time: {avg:.2} ms");
+
+        if self.common.memory_stat_enabled {
+            print_memory_stats();
+        }
         Ok(query_results)
     }
 
diff --git a/benchmarks/src/tpch/run.rs b/benchmarks/src/tpch/run.rs
@@ -21,7 +21,7 @@ use std::sync::Arc;
 use super::{
     get_query_sql, get_tbl_tpch_table_schema, get_tpch_table_schema, TPCH_TABLES,
 };
-use crate::util::{BenchmarkRun, CommonOpt, QueryResult};
+use crate::util::{print_memory_stats, BenchmarkRun, CommonOpt, QueryResult};
 
 use arrow::record_batch::RecordBatch;
 use arrow::util::pretty::{self, pretty_format_batches};
@@ -184,6 +184,10 @@ impl RunOpt {
         let avg = millis.iter().sum::<f64>() / millis.len() as f64;
         println!("Query {query_id} avg time: {avg:.2} ms");
 
+        if self.common.memory_stat_enabled {
+            print_memory_stats();
+        }
+
         Ok(query_results)
     }
 
diff --git a/benchmarks/src/util/memory.rs b/benchmarks/src/util/memory.rs
@@ -0,0 +1,54 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use datafusion::execution::memory_pool::human_readable_size;
+
+/// Memory figures of a process, each optional.
+///
+/// NOTE(review): nothing in this module constructs or reads this struct;
+/// `print_memory_stats` gathers and prints its values directly. The `_kb`
+/// suffixes suggest kilobyte units — confirm before relying on that.
+#[derive(Debug)]
+pub struct MemoryStats {
+    /// Presumably the current resident set size — TODO confirm.
+    pub vm_rss_kb: Option<u64>,
+    /// Presumably the peak resident set size — TODO confirm.
+    pub vm_hwm_kb: Option<u64>,
+    /// Presumably the current virtual memory size — TODO confirm.
+    pub vm_size_kb: Option<u64>,
+    /// Presumably the peak virtual memory size — TODO confirm.
+    pub vm_peak_kb: Option<u64>,
+}
+
+/// Prints memory statistics of the current process to stdout as one line of
+/// the form `VmPeak: V, VmHWM: V, RSS: V`.
+///
+/// On Linux the values are read through `procfs`. `VmPeak` and `VmHWM` come
+/// from the process status and are printed as `N/A` when absent; `RSS` is the
+/// resident page count from `statm` multiplied by the page size. If the
+/// statistics cannot be read, a message is written to stderr and nothing is
+/// printed to stdout, so a benchmark that has already run is not aborted.
+///
+/// On other platforms only a notice is written to stderr.
+pub fn print_memory_stats() {
+    #[cfg(target_os = "linux")]
+    {
+        use procfs::process::Process;
+
+        // Gather everything fallibly first so that a failed read is reported
+        // instead of causing a panic.
+        let read_stats = || -> procfs::ProcResult<_> {
+            let process = Process::new(std::process::id() as i32)?;
+            Ok((process.statm()?, process.status()?))
+        };
+        let (statm, status) = match read_stats() {
+            Ok(stats) => stats,
+            Err(e) => {
+                eprintln!("Failed to read memory statistics: {e}");
+                return;
+            }
+        };
+
+        // The status values are treated as kB and converted to bytes.
+        let format_kb = |kb: Option<u64>| {
+            kb.map(|kb| human_readable_size(kb.saturating_mul(1024) as usize))
+                .unwrap_or_else(|| "N/A".to_string())
+        };
+        let resident_bytes =
+            statm.resident.saturating_mul(procfs::page_size()) as usize;
+
+        println!(
+            "VmPeak: {}, VmHWM: {}, RSS: {}",
+            format_kb(status.vmpeak),
+            format_kb(status.vmhwm),
+            human_readable_size(resident_bytes)
+        );
+    }
+
+    // Written to stderr so that stdout, which callers may parse, is unchanged.
+    #[cfg(not(target_os = "linux"))]
+    eprintln!("Memory statistics are only available on Linux");
+}
diff --git a/benchmarks/src/util/mod.rs b/benchmarks/src/util/mod.rs
@@ -16,8 +16,10 @@
 // under the License.
 
 //! Shared benchmark utilities
+mod memory;
 mod options;
 mod run;
 
+pub use memory::{print_memory_stats, MemoryStats};
 pub use options::CommonOpt;
 pub use run::{BenchQuery, BenchmarkRun, QueryResult};
diff --git a/benchmarks/src/util/options.rs b/benchmarks/src/util/options.rs
@@ -61,6 +61,11 @@ pub struct CommonOpt {
     /// Activate debug mode to see more details
     #[structopt(short, long)]
     pub debug: bool,
+
+    /// Enable memory profiling to see VmPeak, VmHwm for running benchmark.
+    /// See more details in TODO
+    #[structopt(long)]
+    pub memory_stat_enabled: bool,
 }
 
 impl CommonOpt {