Skip to content

Commit 5a6f470

Browse files
committed
Merge branch 'main' of https://github.com/apache/datafusion into lambda4
2 parents: ca260a7 + 5c653be; commit: 5a6f470

57 files changed

Lines changed: 4449 additions & 2906 deletions

File tree

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

.github/workflows/audit.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -42,7 +42,7 @@ jobs:
4242
steps:
4343
- uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2
4444
- name: Install cargo-audit
45-
uses: taiki-e/install-action@94cb46f8d6e437890146ffbd78a778b78e623fb2 # v2.74.0
45+
uses: taiki-e/install-action@85b24a67ef0c632dfefad70b9d5ce8fddb040754 # v2.75.10
4646
with:
4747
tool: cargo-audit
4848
- name: Run audit check

.github/workflows/rust.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -430,7 +430,7 @@ jobs:
430430
sudo apt-get update -qq
431431
sudo apt-get install -y -qq clang
432432
- name: Setup wasm-pack
433-
uses: taiki-e/install-action@94cb46f8d6e437890146ffbd78a778b78e623fb2 # v2.74.0
433+
uses: taiki-e/install-action@85b24a67ef0c632dfefad70b9d5ce8fddb040754 # v2.75.10
434434
with:
435435
tool: wasm-pack
436436
- name: Run tests with headless mode
@@ -770,7 +770,7 @@ jobs:
770770
- name: Setup Rust toolchain
771771
uses: ./.github/actions/setup-builder
772772
- name: Install cargo-msrv
773-
uses: taiki-e/install-action@94cb46f8d6e437890146ffbd78a778b78e623fb2 # v2.74.0
773+
uses: taiki-e/install-action@85b24a67ef0c632dfefad70b9d5ce8fddb040754 # v2.75.10
774774
with:
775775
tool: cargo-msrv
776776

Cargo.lock

Lines changed: 30 additions & 30 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

Cargo.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -162,7 +162,7 @@ glob = "0.3.0"
162162
half = { version = "2.7.0", default-features = false }
163163
hashbrown = { version = "0.17.0" }
164164
hex = { version = "0.4.3" }
165-
indexmap = "2.13.1"
165+
indexmap = "2.14.0"
166166
insta = { version = "1.47.2", features = ["glob", "filters"] }
167167
itertools = "0.14"
168168
itoa = "1.0"

benchmarks/bench.sh

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -677,7 +677,7 @@ run_tpch() {
677677
echo "Running tpch benchmark..."
678678

679679
FORMAT=$2
680-
debug_run $CARGO_COMMAND --bin dfbench -- tpch --iterations 5 --path "${TPCH_DIR}" --prefer_hash_join "${PREFER_HASH_JOIN}" --format ${FORMAT} -o "${RESULTS_FILE}" ${QUERY_ARG} ${LATENCY_ARG}
680+
debug_run $CARGO_COMMAND --bin dfbench -- tpch --iterations 5 --path "${TPCH_DIR}" --scale-factor "${SCALE_FACTOR}" --prefer_hash_join "${PREFER_HASH_JOIN}" --format ${FORMAT} -o "${RESULTS_FILE}" ${QUERY_ARG} ${LATENCY_ARG}
681681
}
682682

683683
# Runs the tpch in memory (needs tpch parquet data)
@@ -693,7 +693,7 @@ run_tpch_mem() {
693693
echo "RESULTS_FILE: ${RESULTS_FILE}"
694694
echo "Running tpch_mem benchmark..."
695695
# -m means in memory
696-
debug_run $CARGO_COMMAND --bin dfbench -- tpch --iterations 5 --path "${TPCH_DIR}" --prefer_hash_join "${PREFER_HASH_JOIN}" -m --format parquet -o "${RESULTS_FILE}" ${QUERY_ARG} ${LATENCY_ARG}
696+
debug_run $CARGO_COMMAND --bin dfbench -- tpch --iterations 5 --path "${TPCH_DIR}" --scale-factor "${SCALE_FACTOR}" --prefer_hash_join "${PREFER_HASH_JOIN}" -m --format parquet -o "${RESULTS_FILE}" ${QUERY_ARG} ${LATENCY_ARG}
697697
}
698698

699699
# Runs the tpcds benchmark
@@ -900,7 +900,7 @@ data_imdb() {
900900
if [ "${DOWNLOADED_SIZE}" != "${expected_size}" ]; then
901901
echo "Error: Download size mismatch"
902902
echo "Expected: ${expected_size}"
903-
echo "Got: ${DOWNLADED_SIZE}"
903+
echo "Got: ${DOWNLOADED_SIZE}"
904904
echo "Please re-initiate the download"
905905
return 1
906906
fi

benchmarks/lineprotocol.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -164,12 +164,12 @@ def lineformat(
164164
) -> None:
165165
baseline = BenchmarkRun.load_from_file(baseline)
166166
context = baseline.context
167-
benchamrk_str = f"benchmark,name={context.name},version={context.benchmark_version},datafusion_version={context.datafusion_version},num_cpus={context.num_cpus}"
167+
benchmark_str = f"benchmark,name={context.name},version={context.benchmark_version},datafusion_version={context.datafusion_version},num_cpus={context.num_cpus}"
168168
for query in baseline.queries:
169169
query_str = f"query=\"{query.query}\""
170170
timestamp = f"{query.start_time*10**9}"
171171
for iter_num, result in enumerate(query.iterations):
172-
print(f"{benchamrk_str} {query_str},iteration={iter_num},row_count={result.row_count},elapsed_ms={result.elapsed*1000:.0f} {timestamp}\n")
172+
print(f"{benchmark_str} {query_str},iteration={iter_num},row_count={result.row_count},elapsed_ms={result.elapsed*1000:.0f} {timestamp}\n")
173173

174174
def main() -> None:
175175
parser = ArgumentParser()

benchmarks/queries/q10.sql

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,7 @@ where
1616
c_custkey = o_custkey
1717
and l_orderkey = o_orderkey
1818
and o_orderdate >= date '1993-10-01'
19-
and o_orderdate < date '1994-01-01'
19+
and o_orderdate < date '1993-10-01' + interval '3' month
2020
and l_returnflag = 'R'
2121
and c_nationkey = n_nationkey
2222
group by

benchmarks/queries/q11.sql

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -13,7 +13,7 @@ group by
1313
ps_partkey having
1414
sum(ps_supplycost * ps_availqty) > (
1515
select
16-
sum(ps_supplycost * ps_availqty) * 0.0001
16+
sum(ps_supplycost * ps_availqty) * 0.0001 /* __TPCH_Q11_FRACTION__ */
1717
from
1818
partsupp,
1919
supplier,
@@ -24,4 +24,4 @@ group by
2424
and n_name = 'GERMANY'
2525
)
2626
order by
27-
value desc;
27+
value desc;

benchmarks/queries/q12.sql

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -23,8 +23,8 @@ where
2323
and l_commitdate < l_receiptdate
2424
and l_shipdate < l_commitdate
2525
and l_receiptdate >= date '1994-01-01'
26-
and l_receiptdate < date '1995-01-01'
26+
and l_receiptdate < date '1994-01-01' + interval '1' year
2727
group by
2828
l_shipmode
2929
order by
30-
l_shipmode;
30+
l_shipmode;

benchmarks/queries/q14.sql

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,4 +10,4 @@ from
1010
where
1111
l_partkey = p_partkey
1212
and l_shipdate >= date '1995-09-01'
13-
and l_shipdate < date '1995-10-01';
13+
and l_shipdate < date '1995-09-01' + interval '1' month;

0 commit comments

Comments
 (0)