This is an automated email from the ASF dual-hosted git repository.

dheres pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/datafusion.git


The following commit(s) were added to refs/heads/main by this push:
     new 94fd86ab82 Add topk_tpch benchmark (#16410)
94fd86ab82 is described below

commit 94fd86ab82aa4fff135352b1025706e255db6f5e
Author: Daniël Heres <danielhe...@gmail.com>
AuthorDate: Sat Jun 14 16:06:56 2025 +0200

    Add topk_tpch benchmark (#16410)
    
    * Add topk benchmark
    
    * Add topk benchmark
    
    * Add topk benchmark
---
 benchmarks/README.md |  9 +++++++++
 benchmarks/bench.sh  | 17 +++++++++++++++++
 2 files changed, 26 insertions(+)

diff --git a/benchmarks/README.md b/benchmarks/README.md
index b19b3385af..01da886ffb 100644
--- a/benchmarks/README.md
+++ b/benchmarks/README.md
@@ -510,6 +510,15 @@ See [`sort_tpch.rs`](src/sort_tpch.rs) for more details.
 ./bench.sh run sort_tpch
 ```
 
+### TopK TPCH
+
+In addition, topk_tpch is available from the bench.sh script:
+
+```bash
+./bench.sh run topk_tpch
+```
+
+
 ## IMDB
 
 Run Join Order Benchmark (JOB) on IMDB dataset.
diff --git a/benchmarks/bench.sh b/benchmarks/bench.sh
index 837e8c6c9b..f1780f8844 100755
--- a/benchmarks/bench.sh
+++ b/benchmarks/bench.sh
@@ -236,6 +236,10 @@ main() {
                     # same data as for tpch
                     data_tpch "1"
                     ;;
+                topk_tpch)
+                    # same data as for tpch
+                    data_tpch "1"
+                    ;;
                 *)
                     echo "Error: unknown benchmark '$BENCHMARK' for data generation"
                     usage
@@ -361,6 +365,9 @@ main() {
                 sort_tpch)
                     run_sort_tpch
                     ;;
+                topk_tpch)
+                    run_topk_tpch
+                    ;;
                 *)
                     echo "Error: unknown benchmark '$BENCHMARK' for run"
                     usage
@@ -981,6 +988,16 @@ run_sort_tpch() {
     debug_run $CARGO_COMMAND --bin dfbench -- sort-tpch --iterations 5 --path "${TPCH_DIR}" -o "${RESULTS_FILE}"
 }
 
+# Runs the sort tpch integration benchmark with limit 100 (topk)
+run_topk_tpch() {
+    TPCH_DIR="${DATA_DIR}/tpch_sf1"
+    RESULTS_FILE="${RESULTS_DIR}/run_topk_tpch.json"
+    echo "RESULTS_FILE: ${RESULTS_FILE}"
+    echo "Running topk tpch benchmark..."
+
+    $CARGO_COMMAND --bin dfbench -- sort-tpch --iterations 5 --path "${TPCH_DIR}" -o "${RESULTS_FILE}" --limit 100
+}
+
 
 compare_benchmarks() {
     BASE_RESULTS_DIR="${SCRIPT_DIR}/results"


---------------------------------------------------------------------
To unsubscribe, e-mail: commits-unsubscr...@datafusion.apache.org
For additional commands, e-mail: commits-h...@datafusion.apache.org

Reply via email to