Skip to content

Commit d62d060

Browse files
authored
Merge branch 'main' into reduce_expr_size
2 parents f6f35c6 + 3291e4e commit d62d060

File tree

44 files changed

+2300
-892
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

44 files changed

+2300
-892
lines changed

.github/actions/setup-macos-aarch64-builder/action.yaml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -45,5 +45,7 @@ runs:
4545
rustup component add rustfmt
4646
- name: Setup rust cache
4747
uses: Swatinem/rust-cache@v2
48+
with:
49+
save-if: ${{ github.ref_name == 'main' }}
4850
- name: Configure rust runtime env
4951
uses: ./.github/actions/setup-rust-runtime

.github/workflows/rust.yml

Lines changed: 39 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -51,6 +51,11 @@ jobs:
5151
uses: ./.github/actions/setup-builder
5252
with:
5353
rust-version: stable
54+
- name: Rust Dependency Cache
55+
uses: Swatinem/rust-cache@v2
56+
with:
57+
shared-key: "amd-ci-check" # this job uses it's own cache becase check has a separate cache and we need it to be fast as it blocks other jobs
58+
save-if: ${{ github.ref_name == 'main' }}
5459
- name: Prepare cargo build
5560
run: |
5661
# Adding `--locked` here to assert that the `Cargo.lock` file is up to
@@ -99,6 +104,11 @@ jobs:
99104
uses: ./.github/actions/setup-builder
100105
with:
101106
rust-version: stable
107+
- name: Rust Dependency Cache
108+
uses: Swatinem/rust-cache@v2
109+
with:
110+
save-if: false # set in linux-test
111+
shared-key: "amd-ci"
102112
- name: Check datafusion-substrait (default features)
103113
run: cargo check --profile ci --all-targets -p datafusion-substrait
104114
#
@@ -162,6 +172,11 @@ jobs:
162172
uses: ./.github/actions/setup-builder
163173
with:
164174
rust-version: stable
175+
- name: Rust Dependency Cache
176+
uses: Swatinem/rust-cache@v2
177+
with:
178+
save-if: false # set in linux-test
179+
shared-key: "amd-ci"
165180
- name: Check datafusion (default features)
166181
run: cargo check --profile ci --all-targets -p datafusion
167182
#
@@ -247,15 +262,22 @@ jobs:
247262
name: cargo test (amd64)
248263
needs: linux-build-lib
249264
runs-on: ubuntu-latest
265+
container:
266+
image: amd64/rust
250267
steps:
251268
- uses: actions/checkout@v4
252269
with:
253270
submodules: true
254271
fetch-depth: 1
255272
- name: Setup Rust toolchain
256-
run: rustup toolchain install stable
257-
- name: Install Protobuf Compiler
258-
run: sudo apt-get install -y protobuf-compiler
273+
uses: ./.github/actions/setup-builder
274+
with:
275+
rust-version: stable
276+
- name: Rust Dependency Cache
277+
uses: Swatinem/rust-cache@v2
278+
with:
279+
save-if: ${{ github.ref_name == 'main' }}
280+
shared-key: "amd-ci"
259281
- name: Run tests (excluding doctests and datafusion-cli)
260282
env:
261283
RUST_BACKTRACE: 1
@@ -279,6 +301,10 @@ jobs:
279301
name: cargo test datafusion-cli (amd64)
280302
needs: linux-build-lib
281303
runs-on: ubuntu-latest
304+
# should be uncommented once https://github.com/apache/datafusion/pull/16644 is merged
305+
# and cache should be added
306+
# container:
307+
# image: amd64/rust
282308
steps:
283309
- uses: actions/checkout@v4
284310
with:
@@ -329,6 +355,11 @@ jobs:
329355
uses: ./.github/actions/setup-builder
330356
with:
331357
rust-version: stable
358+
- name: Rust Dependency Cache
359+
uses: Swatinem/rust-cache@v2
360+
with:
361+
save-if: ${{ github.ref_name == 'main' }}
362+
shared-key: "amd-ci-linux-test-example"
332363
- name: Run examples
333364
run: |
334365
# test datafusion-sql examples
@@ -655,6 +686,11 @@ jobs:
655686
rust-version: stable
656687
- name: Install Clippy
657688
run: rustup component add clippy
689+
- name: Rust Dependency Cache
690+
uses: Swatinem/rust-cache@v2
691+
with:
692+
save-if: ${{ github.ref_name == 'main' }}
693+
shared-key: "amd-ci-clippy"
658694
- name: Run clippy
659695
run: ci/scripts/rust_clippy.sh
660696

Cargo.lock

Lines changed: 14 additions & 36 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

benchmarks/bench.sh

Lines changed: 0 additions & 26 deletions
Original file line numberDiff line numberDiff line change
@@ -114,8 +114,6 @@ imdb: Join Order Benchmark (JOB) using the IMDB dataset conver
114114
115115
# Micro-Benchmarks (specific operators and features)
116116
cancellation: How long cancelling a query takes
117-
parquet: Benchmark of parquet reader's filtering speed
118-
sort: Benchmark of sorting speed
119117
120118
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
121119
Supported Configuration (Environment Variables)
@@ -303,8 +301,6 @@ main() {
303301
run_tpch "10" "csv"
304302
run_tpch_mem "10"
305303
run_cancellation
306-
run_parquet
307-
run_sort
308304
run_clickbench_1
309305
run_clickbench_partitioned
310306
run_clickbench_extended
@@ -338,12 +334,6 @@ main() {
338334
cancellation)
339335
run_cancellation
340336
;;
341-
parquet)
342-
run_parquet
343-
;;
344-
sort)
345-
run_sort
346-
;;
347337
clickbench_1)
348338
run_clickbench_1
349339
;;
@@ -528,22 +518,6 @@ run_cancellation() {
528518
debug_run $CARGO_COMMAND --bin dfbench -- cancellation --iterations 5 --path "${DATA_DIR}/cancellation" -o "${RESULTS_FILE}"
529519
}
530520

531-
# Runs the parquet filter benchmark
532-
run_parquet() {
533-
RESULTS_FILE="${RESULTS_DIR}/parquet.json"
534-
echo "RESULTS_FILE: ${RESULTS_FILE}"
535-
echo "Running parquet filter benchmark..."
536-
debug_run $CARGO_COMMAND --bin parquet -- filter --path "${DATA_DIR}" --scale-factor 1.0 --iterations 5 -o "${RESULTS_FILE}"
537-
}
538-
539-
# Runs the sort benchmark
540-
run_sort() {
541-
RESULTS_FILE="${RESULTS_DIR}/sort.json"
542-
echo "RESULTS_FILE: ${RESULTS_FILE}"
543-
echo "Running sort benchmark..."
544-
debug_run $CARGO_COMMAND --bin parquet -- sort --path "${DATA_DIR}" --scale-factor 1.0 --iterations 5 -o "${RESULTS_FILE}"
545-
}
546-
547521

548522
# Downloads the single file hits.parquet ClickBench datasets from
549523
# https://github.com/ClickHouse/ClickBench/tree/main#data-loading

benchmarks/src/bin/dfbench.rs

Lines changed: 1 addition & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -33,9 +33,7 @@ static ALLOC: snmalloc_rs::SnMalloc = snmalloc_rs::SnMalloc;
3333
#[global_allocator]
3434
static ALLOC: mimalloc::MiMalloc = mimalloc::MiMalloc;
3535

36-
use datafusion_benchmarks::{
37-
cancellation, clickbench, h2o, imdb, parquet_filter, sort, sort_tpch, tpch,
38-
};
36+
use datafusion_benchmarks::{cancellation, clickbench, h2o, imdb, sort_tpch, tpch};
3937

4038
#[derive(Debug, StructOpt)]
4139
#[structopt(about = "benchmark command")]
@@ -44,8 +42,6 @@ enum Options {
4442
Clickbench(clickbench::RunOpt),
4543
H2o(h2o::RunOpt),
4644
Imdb(imdb::RunOpt),
47-
ParquetFilter(parquet_filter::RunOpt),
48-
Sort(sort::RunOpt),
4945
SortTpch(sort_tpch::RunOpt),
5046
Tpch(tpch::RunOpt),
5147
TpchConvert(tpch::ConvertOpt),
@@ -61,8 +57,6 @@ pub async fn main() -> Result<()> {
6157
Options::Clickbench(opt) => opt.run().await,
6258
Options::H2o(opt) => opt.run().await,
6359
Options::Imdb(opt) => Box::pin(opt.run()).await,
64-
Options::ParquetFilter(opt) => opt.run().await,
65-
Options::Sort(opt) => opt.run().await,
6660
Options::SortTpch(opt) => opt.run().await,
6761
Options::Tpch(opt) => Box::pin(opt.run()).await,
6862
Options::TpchConvert(opt) => opt.run().await,

benchmarks/src/bin/parquet.rs

Lines changed: 0 additions & 49 deletions
This file was deleted.

benchmarks/src/lib.rs

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -20,8 +20,6 @@ pub mod cancellation;
2020
pub mod clickbench;
2121
pub mod h2o;
2222
pub mod imdb;
23-
pub mod parquet_filter;
24-
pub mod sort;
2523
pub mod sort_tpch;
2624
pub mod tpch;
2725
pub mod util;

0 commit comments

Comments
 (0)