Skip to content

Commit e7b267b

Browse files
authored
Merge branch 'main' into feature/add-string-split-support
2 parents 1180cd4 + 035aeff commit e7b267b

1,525 files changed

Lines changed: 214663 additions & 101172 deletions

File tree

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

.github/actions/rust-test/action.yaml

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -70,5 +70,7 @@ runs:
7070
shell: bash
7171
run: |
7272
cd native
73+
# Set LD_LIBRARY_PATH to include JVM library path for tests that use JNI
74+
export LD_LIBRARY_PATH=${JAVA_HOME}/lib/server:${LD_LIBRARY_PATH}
7375
RUST_BACKTRACE=1 cargo nextest run
7476

.github/actions/setup-iceberg-builder/action.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -25,7 +25,7 @@ runs:
2525
using: "composite"
2626
steps:
2727
- name: Clone Iceberg repo
28-
uses: actions/checkout@v4
28+
uses: actions/checkout@v6
2929
with:
3030
repository: apache/iceberg
3131
path: apache-iceberg

.github/actions/setup-iceberg-rust-builder/action.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -25,7 +25,7 @@ runs:
2525
using: "composite"
2626
steps:
2727
- name: Clone Iceberg repo
28-
uses: actions/checkout@v4
28+
uses: actions/checkout@v6
2929
with:
3030
repository: apache/iceberg
3131
path: apache-iceberg

.github/actions/setup-spark-builder/action.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -28,7 +28,7 @@ runs:
2828
using: "composite"
2929
steps:
3030
- name: Clone Spark repo
31-
uses: actions/checkout@v4
31+
uses: actions/checkout@v6
3232
with:
3333
repository: apache/spark
3434
path: apache-spark

.github/workflows/benchmark-tpcds.yml

Lines changed: 10 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -27,11 +27,17 @@ on:
2727
- "doc/**"
2828
- "docs/**"
2929
- "**.md"
30+
- "native/core/benches/**"
31+
- "native/spark-expr/benches/**"
32+
- "spark/src/test/scala/org/apache/spark/sql/benchmark/**"
3033
pull_request:
3134
paths-ignore:
3235
- "doc/**"
3336
- "docs/**"
3437
- "**.md"
38+
- "native/core/benches/**"
39+
- "native/spark-expr/benches/**"
40+
- "spark/src/test/scala/org/apache/spark/sql/benchmark/**"
3541
# manual trigger
3642
# https://docs.github.com/en/actions/managing-workflow-runs/manually-running-a-workflow
3743
workflow_dispatch:
@@ -55,7 +61,7 @@ jobs:
5561
rust-version: ${{env.RUST_VERSION}}
5662
jdk-version: 11
5763
- name: Cache Maven dependencies
58-
uses: actions/cache@v4
64+
uses: actions/cache@v5
5965
with:
6066
path: |
6167
~/.m2/repository
@@ -67,7 +73,7 @@ jobs:
6773
run: make release
6874
- name: Cache TPC-DS generated data
6975
id: cache-tpcds-sf-1
70-
uses: actions/cache@v4
76+
uses: actions/cache@v5
7177
with:
7278
path: ./tpcds-sf-1
7379
key: tpcds-${{ hashFiles('.github/workflows/benchmark.yml') }}
@@ -107,7 +113,7 @@ jobs:
107113
rust-version: ${{env.RUST_VERSION}}
108114
jdk-version: 11
109115
- name: Cache Maven dependencies
110-
uses: actions/cache@v4
116+
uses: actions/cache@v5
111117
with:
112118
path: |
113119
~/.m2/repository
@@ -117,7 +123,7 @@ jobs:
117123
${{ runner.os }}-java-maven-
118124
- name: Restore TPC-DS generated data
119125
id: cache-tpcds-sf-1
120-
uses: actions/cache/restore@v4
126+
uses: actions/cache/restore@v5
121127
with:
122128
path: ./tpcds-sf-1
123129
key: tpcds-${{ hashFiles('.github/workflows/benchmark.yml') }}

.github/workflows/benchmark-tpch.yml

Lines changed: 10 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -27,11 +27,17 @@ on:
2727
- "doc/**"
2828
- "docs/**"
2929
- "**.md"
30+
- "native/core/benches/**"
31+
- "native/spark-expr/benches/**"
32+
- "spark/src/test/scala/org/apache/spark/sql/benchmark/**"
3033
pull_request:
3134
paths-ignore:
3235
- "doc/**"
3336
- "docs/**"
3437
- "**.md"
38+
- "native/core/benches/**"
39+
- "native/spark-expr/benches/**"
40+
- "spark/src/test/scala/org/apache/spark/sql/benchmark/**"
3541
# manual trigger
3642
# https://docs.github.com/en/actions/managing-workflow-runs/manually-running-a-workflow
3743
workflow_dispatch:
@@ -55,7 +61,7 @@ jobs:
5561
rust-version: ${{env.RUST_VERSION}}
5662
jdk-version: 11
5763
- name: Cache Maven dependencies
58-
uses: actions/cache@v4
64+
uses: actions/cache@v5
5965
with:
6066
path: |
6167
~/.m2/repository
@@ -65,7 +71,7 @@ jobs:
6571
${{ runner.os }}-java-maven-
6672
- name: Cache TPC-H generated data
6773
id: cache-tpch-sf-1
68-
uses: actions/cache@v4
74+
uses: actions/cache@v5
6975
with:
7076
path: ./tpch
7177
key: tpch-${{ hashFiles('.github/workflows/benchmark-tpch.yml') }}
@@ -91,7 +97,7 @@ jobs:
9197
rust-version: ${{env.RUST_VERSION}}
9298
jdk-version: 11
9399
- name: Cache Maven dependencies
94-
uses: actions/cache@v4
100+
uses: actions/cache@v5
95101
with:
96102
path: |
97103
~/.m2/repository
@@ -101,7 +107,7 @@ jobs:
101107
${{ runner.os }}-java-maven-
102108
- name: Restore TPC-H generated data
103109
id: cache-tpch-sf-1
104-
uses: actions/cache/restore@v4
110+
uses: actions/cache/restore@v5
105111
with:
106112
path: ./tpch
107113
key: tpch-${{ hashFiles('.github/workflows/benchmark-tpch.yml') }}

.github/workflows/iceberg_spark_test.yml

Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -27,11 +27,17 @@ on:
2727
- "doc/**"
2828
- "docs/**"
2929
- "**.md"
30+
- "native/core/benches/**"
31+
- "native/spark-expr/benches/**"
32+
- "spark/src/test/scala/org/apache/spark/sql/benchmark/**"
3033
pull_request:
3134
paths-ignore:
3235
- "doc/**"
3336
- "docs/**"
3437
- "**.md"
38+
- "native/core/benches/**"
39+
- "native/spark-expr/benches/**"
40+
- "spark/src/test/scala/org/apache/spark/sql/benchmark/**"
3541
# manual trigger
3642
# https://docs.github.com/en/actions/managing-workflow-runs/manually-running-a-workflow
3743
workflow_dispatch:

.github/workflows/miri.yml

Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -23,11 +23,17 @@ on:
2323
- "doc/**"
2424
- "docs/**"
2525
- "**.md"
26+
- "native/core/benches/**"
27+
- "native/spark-expr/benches/**"
28+
- "spark/src/test/scala/org/apache/spark/sql/benchmark/**"
2629
pull_request:
2730
paths-ignore:
2831
- "doc/**"
2932
- "docs/**"
3033
- "**.md"
34+
- "native/core/benches/**"
35+
- "native/spark-expr/benches/**"
36+
- "spark/src/test/scala/org/apache/spark/sql/benchmark/**"
3137
# manual trigger
3238
# https://docs.github.com/en/actions/managing-workflow-runs/manually-running-a-workflow
3339
workflow_dispatch:
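
.github/workflows/ (new workflow file "PR Benchmark Check"; exact file name missing from this capture)

Lines changed: 85 additions & 0 deletions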
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,85 @@
1+
# Licensed to the Apache Software Foundation (ASF) under one
2+
# or more contributor license agreements. See the NOTICE file
3+
# distributed with this work for additional information
4+
# regarding copyright ownership. The ASF licenses this file
5+
# to you under the Apache License, Version 2.0 (the
6+
# "License"); you may not use this file except in compliance
7+
# with the License. You may obtain a copy of the License at
8+
#
9+
# http://www.apache.org/licenses/LICENSE-2.0
10+
#
11+
# Unless required by applicable law or agreed to in writing,
12+
# software distributed under the License is distributed on an
13+
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14+
# KIND, either express or implied. See the License for the
15+
# specific language governing permissions and limitations
16+
# under the License.
17+
18+
# Lightweight CI for benchmark-only changes - verifies compilation and linting
19+
# without running full test suites
20+
21+
name: PR Benchmark Check
22+
23+
concurrency:
24+
group: ${{ github.repository }}-${{ github.head_ref || github.sha }}-${{ github.workflow }}
25+
cancel-in-progress: true
26+
27+
on:
28+
push:
29+
paths:
30+
- "native/core/benches/**"
31+
- "native/spark-expr/benches/**"
32+
- "spark/src/test/scala/org/apache/spark/sql/benchmark/**"
33+
pull_request:
34+
paths:
35+
- "native/core/benches/**"
36+
- "native/spark-expr/benches/**"
37+
- "spark/src/test/scala/org/apache/spark/sql/benchmark/**"
38+
workflow_dispatch:
39+
40+
env:
41+
RUST_VERSION: stable
42+
43+
jobs:
44+
benchmark-check:
45+
name: Benchmark Compile & Lint Check
46+
runs-on: ubuntu-latest
47+
container:
48+
image: amd64/rust
49+
steps:
50+
- uses: actions/checkout@v6
51+
52+
- name: Setup Rust & Java toolchain
53+
uses: ./.github/actions/setup-builder
54+
with:
55+
rust-version: ${{ env.RUST_VERSION }}
56+
jdk-version: 17
57+
58+
- name: Check Cargo fmt
59+
run: |
60+
cd native
61+
cargo fmt --all -- --check --color=never
62+
63+
- name: Check Cargo clippy
64+
run: |
65+
cd native
66+
cargo clippy --color=never --all-targets --workspace -- -D warnings
67+
68+
- name: Check benchmark compilation
69+
run: |
70+
cd native
71+
cargo check --benches
72+
73+
- name: Cache Maven dependencies
74+
uses: actions/cache@v5
75+
with:
76+
path: |
77+
~/.m2/repository
78+
/root/.m2/repository
79+
key: ${{ runner.os }}-benchmark-maven-${{ hashFiles('**/pom.xml') }}
80+
restore-keys: |
81+
${{ runner.os }}-benchmark-maven-
82+
83+
- name: Check Scala compilation and linting
84+
run: |
85+
./mvnw -B compile test-compile scalafix:scalafix -Dscalafix.mode=CHECK -Psemanticdb -DskipTests

.github/workflows/pr_build_linux.yml

Lines changed: 12 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -27,11 +27,17 @@ on:
2727
- "doc/**"
2828
- "docs/**"
2929
- "**.md"
30+
- "native/core/benches/**"
31+
- "native/spark-expr/benches/**"
32+
- "spark/src/test/scala/org/apache/spark/sql/benchmark/**"
3033
pull_request:
3134
paths-ignore:
3235
- "doc/**"
3336
- "docs/**"
3437
- "**.md"
38+
- "native/core/benches/**"
39+
- "native/spark-expr/benches/**"
40+
- "spark/src/test/scala/org/apache/spark/sql/benchmark/**"
3541
# manual trigger
3642
# https://docs.github.com/en/actions/managing-workflow-runs/manually-running-a-workflow
3743
workflow_dispatch:
@@ -116,6 +122,7 @@ jobs:
116122
org.apache.comet.exec.CometAsyncShuffleSuite
117123
org.apache.comet.exec.DisableAQECometShuffleSuite
118124
org.apache.comet.exec.DisableAQECometAsyncShuffleSuite
125+
org.apache.spark.shuffle.sort.SpillSorterSuite
119126
- name: "parquet"
120127
value: |
121128
org.apache.comet.parquet.CometParquetWriterSuite
@@ -132,6 +139,7 @@ jobs:
132139
org.apache.comet.exec.CometAggregateSuite
133140
org.apache.comet.exec.CometExec3_4PlusSuite
134141
org.apache.comet.exec.CometExecSuite
142+
org.apache.comet.exec.CometGenerateExecSuite
135143
org.apache.comet.exec.CometWindowExecSuite
136144
org.apache.comet.exec.CometJoinSuite
137145
org.apache.comet.CometNativeSuite
@@ -140,6 +148,8 @@ jobs:
140148
org.apache.spark.CometPluginsDefaultSuite
141149
org.apache.spark.CometPluginsNonOverrideSuite
142150
org.apache.spark.CometPluginsUnifiedModeOverrideSuite
151+
org.apache.comet.rules.CometScanRuleSuite
152+
org.apache.comet.rules.CometExecRuleSuite
143153
org.apache.spark.sql.CometTPCDSQuerySuite
144154
org.apache.spark.sql.CometTPCDSQueryTestSuite
145155
org.apache.spark.sql.CometTPCHQuerySuite
@@ -151,13 +161,15 @@ jobs:
151161
value: |
152162
org.apache.comet.CometExpressionSuite
153163
org.apache.comet.CometExpressionCoverageSuite
164+
org.apache.comet.CometHashExpressionSuite
154165
org.apache.comet.CometTemporalExpressionSuite
155166
org.apache.comet.CometArrayExpressionSuite
156167
org.apache.comet.CometCastSuite
157168
org.apache.comet.CometMathExpressionSuite
158169
org.apache.comet.CometStringExpressionSuite
159170
org.apache.comet.CometBitwiseExpressionSuite
160171
org.apache.comet.CometMapExpressionSuite
172+
org.apache.comet.CometJsonExpressionSuite
161173
org.apache.comet.expressions.conditional.CometIfSuite
162174
org.apache.comet.expressions.conditional.CometCoalesceSuite
163175
org.apache.comet.expressions.conditional.CometCaseWhenSuite

0 commit comments

Comments
 (0)