From 48c35872049663ef61991eb5d748578d53a67475 Mon Sep 17 00:00:00 2001 From: Andy Grove Date: Tue, 7 May 2024 08:37:07 -0600 Subject: [PATCH] Prepare 38.0.0 release candidate 1 (#10407) * add new crates to script * update version and run cargo update * changelog * update cargo meta to reflect TLP status --- Cargo.toml | 38 +-- datafusion-cli/Cargo.lock | 304 ++++++++++++------------ datafusion-cli/Cargo.toml | 8 +- datafusion/CHANGELOG.md | 1 + dev/changelog/38.0.0.md | 370 ++++++++++++++++++++++++++++++ dev/requirements.txt | 2 + dev/update_datafusion_versions.py | 3 + docs/source/user-guide/configs.md | 2 +- 8 files changed, 547 insertions(+), 181 deletions(-) create mode 100644 dev/changelog/38.0.0.md create mode 100644 dev/requirements.txt diff --git a/Cargo.toml b/Cargo.toml index 3ca3af284675..e78fe4767d80 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -44,14 +44,14 @@ members = [ resolver = "2" [workspace.package] -authors = ["Apache Arrow "] +authors = ["Apache DataFusion "] edition = "2021" -homepage = "https://github.com/apache/datafusion" +homepage = "https://datafusion.apache.org" license = "Apache-2.0" readme = "README.md" repository = "https://github.com/apache/datafusion" rust-version = "1.73" -version = "37.1.0" +version = "38.0.0" [workspace.dependencies] # We turn off default-features for some dependencies here so the workspaces which inherit them can @@ -73,22 +73,22 @@ bytes = "1.4" chrono = { version = "0.4.34", default-features = false } ctor = "0.2.0" dashmap = "5.4.0" -datafusion = { path = "datafusion/core", version = "37.1.0", default-features = false } -datafusion-common = { path = "datafusion/common", version = "37.1.0", default-features = false } -datafusion-common-runtime = { path = "datafusion/common-runtime", version = "37.1.0" } -datafusion-execution = { path = "datafusion/execution", version = "37.1.0" } -datafusion-expr = { path = "datafusion/expr", version = "37.1.0" } -datafusion-functions = { path = "datafusion/functions", version = "37.1.0" } -datafusion-functions-aggregate = { path = "datafusion/functions-aggregate", version = "37.1.0" } -datafusion-functions-array = { path = "datafusion/functions-array", version = "37.1.0" } -datafusion-optimizer = { path = "datafusion/optimizer", version = "37.1.0", default-features = false } -datafusion-physical-expr = { path = "datafusion/physical-expr", version = "37.1.0", default-features = false } -datafusion-physical-expr-common = { path = "datafusion/physical-expr-common", version = "37.1.0", default-features = false } -datafusion-physical-plan = { path = "datafusion/physical-plan", version = "37.1.0" } -datafusion-proto = { path = "datafusion/proto", version = "37.1.0" } -datafusion-sql = { path = "datafusion/sql", version = "37.1.0" } -datafusion-sqllogictest = { path = "datafusion/sqllogictest", version = "37.1.0" } -datafusion-substrait = { path = "datafusion/substrait", version = "37.1.0" } +datafusion = { path = "datafusion/core", version = "38.0.0", default-features = false } +datafusion-common = { path = "datafusion/common", version = "38.0.0", default-features = false } +datafusion-common-runtime = { path = "datafusion/common-runtime", version = "38.0.0" } +datafusion-execution = { path = "datafusion/execution", version = "38.0.0" } +datafusion-expr = { path = "datafusion/expr", version = "38.0.0" } +datafusion-functions = { path = "datafusion/functions", version = "38.0.0" } +datafusion-functions-aggregate = { path = "datafusion/functions-aggregate", version = "38.0.0" } +datafusion-functions-array = { path = "datafusion/functions-array", version = "38.0.0" } +datafusion-optimizer = { path = "datafusion/optimizer", version = "38.0.0", default-features = false } +datafusion-physical-expr = { path = "datafusion/physical-expr", version = "38.0.0", default-features = false } +datafusion-physical-expr-common = { path = "datafusion/physical-expr-common", version = "38.0.0", default-features = false } +datafusion-physical-plan = { path = "datafusion/physical-plan", version = "38.0.0" } +datafusion-proto = { path = "datafusion/proto", version = "38.0.0" } +datafusion-sql = { path = "datafusion/sql", version = "38.0.0" } +datafusion-sqllogictest = { path = "datafusion/sqllogictest", version = "38.0.0" } +datafusion-substrait = { path = "datafusion/substrait", version = "38.0.0" } doc-comment = "0.3" env_logger = "0.11" futures = "0.3" diff --git a/datafusion-cli/Cargo.lock b/datafusion-cli/Cargo.lock index 5263b064ff9b..fd471e750194 100644 --- a/datafusion-cli/Cargo.lock +++ b/datafusion-cli/Cargo.lock @@ -84,9 +84,9 @@ dependencies = [ [[package]] name = "anstyle" -version = "1.0.6" +version = "1.0.7" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "8901269c6307e8d93993578286ac0edf7f195079ffff5ebdeea6a59ffb7e36bc" +checksum = "038dfcf04a5feb68e9c60b21c9625a54c2c0616e79b72b0fd87075a056ae1d1b" [[package]] name = "apache-avro" @@ -177,7 +177,7 @@ dependencies = [ "chrono", "chrono-tz", "half", - "hashbrown 0.14.3", + "hashbrown 0.14.5", "num", ] @@ -204,7 +204,7 @@ dependencies = [ "arrow-schema", "arrow-select", "atoi", - "base64 0.22.0", + "base64 0.22.1", "chrono", "comfy-table", "half", @@ -306,7 +306,7 @@ dependencies = [ "arrow-data", "arrow-schema", "half", - "hashbrown 0.14.3", + "hashbrown 0.14.5", ] [[package]] @@ -363,9 +363,9 @@ dependencies = [ [[package]] name = "async-compression" -version = "0.4.8" +version = "0.4.9" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "07dbbf24db18d609b1462965249abdf49129ccad073ec257da372adc83259c60" +checksum = "4e9eabd7a98fe442131a17c316bd9349c43695e49e730c3c8e12cfb5f4da2693" dependencies = [ "bzip2", "flate2", @@ -387,7 +387,7 @@ checksum = "c6fa2087f2753a7da8cc1c0dbfcf89579dd57458e36769de5ac750b4671737ca" dependencies = [ "proc-macro2", "quote", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] @@ -412,9 +412,9 @@ dependencies = [ [[package]] name = "autocfg" -version = "1.2.0" +version = "1.3.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f1fdabc7756949593fe60f30ec81974b613357de856987752631dea1e3394c80" +checksum = "0c4b4d0bd25bd0b74681c0ad21497610ce1b7c91b1022cd21c80c6fbdd9476b0" [[package]] name = "aws-config" @@ -729,9 +729,9 @@ checksum = "9d297deb1925b89f2ccc13d7635fa0714f12c87adce1c75356b39ca9b7178567" [[package]] name = "base64" -version = "0.22.0" +version = "0.22.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9475866fec1451be56a3c2400fd081ff546538961565ccb5b7142cbd22bc7a51" +checksum = "72b3254f16251a8381aa12e40e3c4d2f0199f8c6508fbecb9d91f575e0fbb8c6" [[package]] name = "base64-simd" @@ -869,12 +869,13 @@ dependencies = [ [[package]] name = "cc" -version = "1.0.94" +version = "1.0.97" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "17f6e324229dc011159fcc089755d1e2e216a90d43a7dea6853ca740b84f35e7" +checksum = "099a5357d84c4c61eb35fc8eafa9a79a902c2f76911e5747ced4e032edd8d9b4" dependencies = [ "jobserver", "libc", + "once_cell", ] [[package]] @@ -1092,7 +1093,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "edb49164822f3ee45b17acd4a208cfc1251410cf0cad9a833234c9890774dd9f" dependencies = [ "quote", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] @@ -1108,7 +1109,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "978747c1d849a7d2ee5e8adc0159961c48fb7e5db2f06af6723b80123bb53856" dependencies = [ "cfg-if", - "hashbrown 0.14.3", + "hashbrown 0.14.5", "lock_api", "once_cell", "parking_lot_core", @@ -1116,7 +1117,7 @@ dependencies = [ [[package]] name = "datafusion" -version = "37.1.0" +version = "38.0.0" dependencies = [ "ahash", "apache-avro", @@ -1145,7 +1146,7 @@ dependencies = [ "futures", "glob", "half", - "hashbrown 0.14.3", + "hashbrown 0.14.5", "indexmap 2.2.6", "itertools", "log", @@ -1168,7 +1169,7 @@ dependencies = [ [[package]] name = "datafusion-cli" -version = "37.1.0" +version = "38.0.0" dependencies = [ "arrow", "assert_cmd", @@ -1195,7 +1196,7 @@ dependencies = [ [[package]] name = "datafusion-common" -version = "37.1.0" +version = "38.0.0" dependencies = [ "ahash", "apache-avro", @@ -1215,14 +1216,14 @@ dependencies = [ [[package]] name = "datafusion-common-runtime" -version = "37.1.0" +version = "38.0.0" dependencies = [ "tokio", ] [[package]] name = "datafusion-execution" -version = "37.1.0" +version = "38.0.0" dependencies = [ "arrow", "chrono", @@ -1230,7 +1231,7 @@ dependencies = [ "datafusion-common", "datafusion-expr", "futures", - "hashbrown 0.14.3", + "hashbrown 0.14.5", "log", "object_store", "parking_lot", @@ -1241,7 +1242,7 @@ dependencies = [ [[package]] name = "datafusion-expr" -version = "37.1.0" +version = "38.0.0" dependencies = [ "ahash", "arrow", @@ -1257,10 +1258,10 @@ dependencies = [ [[package]] name = "datafusion-functions" -version = "37.1.0" +version = "38.0.0" dependencies = [ "arrow", - "base64 0.22.0", + "base64 0.22.1", "blake2", "blake3", "chrono", @@ -1268,7 +1269,7 @@ dependencies = [ "datafusion-execution", "datafusion-expr", "datafusion-physical-expr", - "hashbrown 0.14.3", + "hashbrown 0.14.5", "hex", "itertools", "log", @@ -1282,7 +1283,7 @@ dependencies = [ [[package]] name = "datafusion-functions-aggregate" -version = "37.1.0" +version = "38.0.0" dependencies = [ "arrow", "datafusion-common", @@ -1296,7 +1297,7 @@ dependencies = [ [[package]] name = "datafusion-functions-array" -version = "37.1.0" +version = "38.0.0" dependencies = [ "arrow", "arrow-array", @@ -1314,7 +1315,7 @@ dependencies = [ [[package]] name = "datafusion-optimizer" -version = "37.1.0" +version = "38.0.0" dependencies = [ "arrow", "async-trait", @@ -1322,7 +1323,7 @@ dependencies = [ "datafusion-common", "datafusion-expr", "datafusion-physical-expr", - "hashbrown 0.14.3", + "hashbrown 0.14.5", "indexmap 2.2.6", "itertools", "log", @@ -1331,7 +1332,7 @@ dependencies = [ [[package]] name = "datafusion-physical-expr" -version = "37.1.0" +version = "38.0.0" dependencies = [ "ahash", "arrow", @@ -1340,7 +1341,7 @@ dependencies = [ "arrow-ord", "arrow-schema", "arrow-string", - "base64 0.22.0", + "base64 0.22.1", "chrono", "datafusion-common", "datafusion-execution", @@ -1348,7 +1349,7 @@ dependencies = [ "datafusion-functions-aggregate", "datafusion-physical-expr-common", "half", - "hashbrown 0.14.3", + "hashbrown 0.14.5", "hex", "indexmap 2.2.6", "itertools", @@ -1360,7 +1361,7 @@ dependencies = [ [[package]] name = "datafusion-physical-expr-common" -version = "37.1.0" +version = "38.0.0" dependencies = [ "arrow", "datafusion-common", @@ -1369,7 +1370,7 @@ dependencies = [ [[package]] name = "datafusion-physical-plan" -version = "37.1.0" +version = "38.0.0" dependencies = [ "ahash", "arrow", @@ -1388,7 +1389,7 @@ dependencies = [ "datafusion-physical-expr-common", "futures", "half", - "hashbrown 0.14.3", + "hashbrown 0.14.5", "indexmap 2.2.6", "itertools", "log", @@ -1401,7 +1402,7 @@ dependencies = [ [[package]] name = "datafusion-sql" -version = "37.1.0" +version = "38.0.0" dependencies = [ "arrow", "arrow-array", @@ -1557,9 +1558,9 @@ dependencies = [ [[package]] name = "fastrand" -version = "2.0.2" +version = "2.1.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "658bd65b1cf4c852a3cc96f18a8ce7b5640f6b703f905c7d74532294c2a63984" +checksum = "9fc0510504f03c51ada170672ac806f1f105a88aa97a5281117e1ddc3368e51a" [[package]] name = "fd-lock" @@ -1590,9 +1591,9 @@ dependencies = [ [[package]] name = "flate2" -version = "1.0.28" +version = "1.0.30" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "46303f565772937ffe1d394a4fac6f411c6013172fadde9dcdb1e147a086940e" +checksum = "5f54427cfd1c7829e2a139fcefea601bf088ebca651d2bf53ebc600eac295dae" dependencies = [ "crc32fast", "miniz_oxide", @@ -1678,7 +1679,7 @@ checksum = "87750cf4b7a4c0625b1529e4c543c2182106e4dedc60a2a6455e00d212c489ac" dependencies = [ "proc-macro2", "quote", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] @@ -1729,9 +1730,9 @@ dependencies = [ [[package]] name = "getrandom" -version = "0.2.14" +version = "0.2.15" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "94b22e06ecb0110981051723910cbf0b5f5e09a2062dd7663334ee79a9d1286c" +checksum = "c4567c8db10ae91089c99af84c68c38da3ec2f087c3f82960bcdbf3656b6f4d7" dependencies = [ "cfg-if", "libc", @@ -1788,18 +1789,9 @@ checksum = "8a9ee70c43aaf417c914396645a0fa852624801b24ebb7ae78fe8272889ac888" [[package]] name = "hashbrown" -version = "0.13.2" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "43a3c133739dddd0d2990f9a4bdf8eb4b21ef50e4851ca85ab661199821d510e" -dependencies = [ - "ahash", -] - -[[package]] -name = "hashbrown" -version = "0.14.3" +version = "0.14.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "290f1a1d9242c78d09ce40a5e87e7554ee637af1351968159f4952f028f75604" +checksum = "e5274423e17b7c9fc20b6e7e208532f9b19825d82dfd615708b70edd83df41f1" dependencies = [ "ahash", "allocator-api2", @@ -1929,7 +1921,7 @@ dependencies = [ "futures-util", "http", "hyper", - "rustls 0.21.10", + "rustls 0.21.12", "tokio", "tokio-rustls 0.24.1", ] @@ -1984,7 +1976,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "168fb715dda47215e360912c096649d23d58bf392ac62f73919e831745e40f26" dependencies = [ "equivalent", - "hashbrown 0.14.3", + "hashbrown 0.14.5", ] [[package]] @@ -2028,9 +2020,9 @@ checksum = "49f1f14873335454500d59611f1cf4a4b0f786f9ac11f4312a78e4cf2566695b" [[package]] name = "jobserver" -version = "0.1.30" +version = "0.1.31" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "685a7d121ee3f65ae4fddd72b25a04bb36b6af81bc0828f7d5434c0fe60fa3a2" +checksum = "d2b099aaa34a9751c5bf0878add70444e1ed2dd73f347be99003d4577277de6e" dependencies = [ "libc", ] @@ -2116,15 +2108,15 @@ dependencies = [ [[package]] name = "libc" -version = "0.2.153" +version = "0.2.154" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9c198f91728a82281a64e1f4f9eeb25d82cb32a5de251c6bd1b5154d63a8e7bd" +checksum = "ae743338b92ff9146ce83992f766a31066a91a8c84a45e0e9f21e7cf6de6d346" [[package]] name = "libflate" -version = "2.0.0" +version = "2.1.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9f7d5654ae1795afc7ff76f4365c2c8791b0feb18e8996a96adad8ffd7c3b2bf" +checksum = "45d9dfdc14ea4ef0900c1cddbc8dcd553fbaacd8a4a282cf4018ae9dd04fb21e" dependencies = [ "adler32", "core2", @@ -2135,12 +2127,12 @@ dependencies = [ [[package]] name = "libflate_lz77" -version = "2.0.0" +version = "2.1.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "be5f52fb8c451576ec6b79d3f4deb327398bc05bbdbd99021a6e77a4c855d524" +checksum = "e6e0d73b369f386f1c44abd9c570d5318f55ccde816ff4b562fa452e5182863d" dependencies = [ "core2", - "hashbrown 0.13.2", + "hashbrown 0.14.5", "rle-decode-fast", ] @@ -2152,9 +2144,9 @@ checksum = "4ec2a862134d2a7d32d7983ddcdd1c4923530833c9f2ea1a44fc5fa473989058" [[package]] name = "libmimalloc-sys" -version = "0.1.35" +version = "0.1.37" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3979b5c37ece694f1f5e51e7ecc871fdb0f517ed04ee45f88d15d6d553cb9664" +checksum = "81eb4061c0582dedea1cbc7aff2240300dd6982e0239d1c99e65c1dbf4a30ba7" dependencies = [ "cc", "libc", @@ -2178,9 +2170,9 @@ checksum = "01cda141df6706de531b6c46c3a33ecca755538219bd484262fa09410c13539c" [[package]] name = "lock_api" -version = "0.4.11" +version = "0.4.12" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3c168f8615b12bc01f9c17e2eb0cc07dcae1940121185446edc3744920e8ef45" +checksum = "07af8b9cdd281b7915f413fa73f29ebd5d55d0d3f0155584dade1ff18cea1b17" dependencies = [ "autocfg", "scopeguard", @@ -2230,9 +2222,9 @@ checksum = "6c8640c5d730cb13ebd907d8d04b52f55ac9a2eec55b440c8892f40d56c76c1d" [[package]] name = "mimalloc" -version = "0.1.39" +version = "0.1.41" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "fa01922b5ea280a911e323e4d2fd24b7fe5cc4042e0d2cda3c40775cdc4bdc9c" +checksum = "9f41a2280ded0da56c8cf898babb86e8f10651a34adcfff190ae9a1159c6908d" dependencies = [ "libmimalloc-sys", ] @@ -2305,11 +2297,10 @@ dependencies = [ [[package]] name = "num-bigint" -version = "0.4.4" +version = "0.4.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "608e7659b5c3d7cba262d894801b9ec9d00de989e8a82bd4bef91d08da45cdc0" +checksum = "c165a9ab64cf766f73521c0dd2cfdff64f488b8f0b3e621face3462d3db536d7" dependencies = [ - "autocfg", "num-integer", "num-traits", ] @@ -2340,9 +2331,9 @@ dependencies = [ [[package]] name = "num-iter" -version = "0.1.44" +version = "0.1.45" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d869c01cc0c455284163fd0092f1f93835385ccab5a98a0dcc497b2f8bf055a9" +checksum = "1429034a0490724d0075ebb2bc9e875d6503c3cf69e235a8941aa757d83ef5bf" dependencies = [ "autocfg", "num-integer", @@ -2363,9 +2354,9 @@ dependencies = [ [[package]] name = "num-traits" -version = "0.2.18" +version = "0.2.19" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "da0df0e5185db44f69b44f26786fe401b6c293d1907744beaa7fa62b2e5a517a" +checksum = "071dfc062690e90b734c0b2273ce72ad0ffa95f0c74596bc250dcfd960262841" dependencies = [ "autocfg", "libm", @@ -2456,9 +2447,9 @@ checksum = "4030760ffd992bef45b0ae3f10ce1aba99e33464c90d14dd7c039884963ddc7a" [[package]] name = "parking_lot" -version = "0.12.1" +version = "0.12.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3742b2c103b9f06bc9fff0a37ff4912935851bee6d36f3c02bcc755bcfec228f" +checksum = "7e4af0ca4f6caed20e900d564c242b8e5d4903fdacf31d3daf527b66fe6f42fb" dependencies = [ "lock_api", "parking_lot_core", @@ -2466,15 +2457,15 @@ dependencies = [ [[package]] name = "parking_lot_core" -version = "0.9.9" +version = "0.9.10" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4c42a9226546d68acdd9c0a280d17ce19bfe27a46bf68784e4066115788d008e" +checksum = "1e401f977ab385c9e4e3ab30627d6f26d00e2c73eef317493c4ec6d468726cf8" dependencies = [ "cfg-if", "libc", "redox_syscall", "smallvec", - "windows-targets 0.48.5", + "windows-targets 0.52.5", ] [[package]] @@ -2491,14 +2482,14 @@ dependencies = [ "arrow-ipc", "arrow-schema", "arrow-select", - "base64 0.22.0", + "base64 0.22.1", "brotli", "bytes", "chrono", "flate2", "futures", "half", - "hashbrown 0.14.3", + "hashbrown 0.14.5", "lz4_flex", "num", "num-bigint", @@ -2514,18 +2505,18 @@ dependencies = [ [[package]] name = "parse-zoneinfo" -version = "0.3.0" +version = "0.3.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c705f256449c60da65e11ff6626e0c16a0a0b96aaa348de61376b249bc340f41" +checksum = "1f2a05b18d44e2957b88f96ba460715e295bc1d7510468a2f3d3b44535d26c24" dependencies = [ "regex", ] [[package]] name = "paste" -version = "1.0.14" +version = "1.0.15" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "de3145af08024dea9fa9914f381a17b8fc6034dfb00f3a84013f7ff43f29ed4c" +checksum = "57c0d7b74b563b49d38dae00a0c37d4d6de9b432382b2892f0574ddcae73fd0a" [[package]] name = "percent-encoding" @@ -2598,7 +2589,7 @@ checksum = "2f38a4412a78282e09a2cf38d195ea5420d15ba0602cb375210efbc877243965" dependencies = [ "proc-macro2", "quote", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] @@ -2687,9 +2678,9 @@ dependencies = [ [[package]] name = "proc-macro2" -version = "1.0.81" +version = "1.0.82" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3d1597b0c024618f09a9c3b8655b7e430397a36d23fdafec26d6965e9eec3eba" +checksum = "8ad3d49ab951a01fbaafe34f2ec74122942fe18a3f9814c3268f1bb72042131b" dependencies = [ "unicode-ident", ] @@ -2761,11 +2752,11 @@ dependencies = [ [[package]] name = "redox_syscall" -version = "0.4.1" +version = "0.5.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4722d768eff46b75989dd134e5c353f0d6296e5aaa3132e776cbdb56be7731aa" +checksum = "469052894dcb553421e483e4209ee581a45100d31b4018de03e5a7ad86374a7e" dependencies = [ - "bitflags 1.3.2", + "bitflags 2.5.0", ] [[package]] @@ -2837,7 +2828,7 @@ dependencies = [ "once_cell", "percent-encoding", "pin-project-lite", - "rustls 0.21.10", + "rustls 0.21.12", "rustls-native-certs", "rustls-pemfile 1.0.4", "serde", @@ -2921,9 +2912,9 @@ dependencies = [ [[package]] name = "rustc-demangle" -version = "0.1.23" +version = "0.1.24" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d626bb9dae77e28219937af045c257c28bfd3f69333c512553507f5f9798cb76" +checksum = "719b953e2095829ee67db738b3bfa9fa368c94900df327b3f07fe6e794d2fe1f" [[package]] name = "rustc_version" @@ -2936,9 +2927,9 @@ dependencies = [ [[package]] name = "rustix" -version = "0.38.32" +version = "0.38.34" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "65e04861e65f21776e67888bfbea442b3642beaa0138fdb1dd7a84a52dffdb89" +checksum = "70dc5ec042f7a43c4a73241207cecc9873a06d45debb38b329f8541d85c2730f" dependencies = [ "bitflags 2.5.0", "errno", @@ -2961,9 +2952,9 @@ dependencies = [ [[package]] name = "rustls" -version = "0.21.10" +version = "0.21.12" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f9d5a6813c0759e4609cd494e8e725babae6a2ca7b62a5536a13daaec6fcb7ba" +checksum = "3f56a14d1f48b391359b22f731fd4bd7e43c97f3c50eee276f3aa09c94784d3e" dependencies = [ "log", "ring 0.17.8", @@ -2998,15 +2989,15 @@ version = "2.1.2" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "29993a25686778eb88d4189742cd713c9bce943bc54251a33509dc63cbacf73d" dependencies = [ - "base64 0.22.0", + "base64 0.22.1", "rustls-pki-types", ] [[package]] name = "rustls-pki-types" -version = "1.4.1" +version = "1.6.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ecd36cc4259e3e4514335c4a138c6b43171a8d61d8f5c9348f9fc7529416f247" +checksum = "51f344d206c5e1b010eec27349b815a4805f70a778895959d70b74b9b529b30a" [[package]] name = "rustls-webpki" @@ -3020,9 +3011,9 @@ dependencies = [ [[package]] name = "rustversion" -version = "1.0.15" +version = "1.0.16" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "80af6f9131f277a45a3fba6ce8e2258037bb0477a67e610d3c1fe046ab31de47" +checksum = "092474d1a01ea8278f69e6a358998405fae5b8b963ddaeb2b0b04a128bf1dfb0" [[package]] name = "rustyline" @@ -3049,9 +3040,9 @@ dependencies = [ [[package]] name = "ryu" -version = "1.0.17" +version = "1.0.18" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e86697c916019a8588c99b5fac3cead74ec0b4b819707a682fd4d23fa0ce1ba1" +checksum = "f3cb5ba0dc43242ce17de99c180e96db90b235b8a9fdc9543c96d2209116bd9f" [[package]] name = "same-file" @@ -3089,11 +3080,11 @@ dependencies = [ [[package]] name = "security-framework" -version = "2.10.0" +version = "2.11.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "770452e37cad93e0a50d5abc3990d2bc351c36d0328f86cefec2f2fb206eaef6" +checksum = "c627723fd09706bacdb5cf41499e95098555af3c3c29d014dc3c458ef6be11c0" dependencies = [ - "bitflags 1.3.2", + "bitflags 2.5.0", "core-foundation", "core-foundation-sys", "libc", @@ -3102,9 +3093,9 @@ dependencies = [ [[package]] name = "security-framework-sys" -version = "2.10.0" +version = "2.11.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "41f3cc463c0ef97e11c3461a9d3787412d30e8e7eb907c79180c4a57bf7c04ef" +checksum = "317936bbbd05227752583946b9e66d7ce3b489f84e11a94a510b4437fef407d7" dependencies = [ "core-foundation-sys", "libc", @@ -3112,9 +3103,9 @@ dependencies = [ [[package]] name = "semver" -version = "1.0.22" +version = "1.0.23" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "92d43fe69e652f3df9bdc2b85b2854a0825b86e4fb76bc44d945137d053639ca" +checksum = "61697e0a1c7e512e84a621326239844a24d8207b4669b41bc18b32ea5cbf988b" [[package]] name = "seq-macro" @@ -3124,22 +3115,22 @@ checksum = "a3f0bf26fd526d2a95683cd0f87bf103b8539e2ca1ef48ce002d67aad59aa0b4" [[package]] name = "serde" -version = "1.0.198" +version = "1.0.200" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9846a40c979031340571da2545a4e5b7c4163bdae79b301d5f86d03979451fcc" +checksum = "ddc6f9cc94d67c0e21aaf7eda3a010fd3af78ebf6e096aa6e2e13c79749cce4f" dependencies = [ "serde_derive", ] [[package]] name = "serde_derive" -version = "1.0.198" +version = "1.0.200" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e88edab869b01783ba905e7d0153f9fc1a6505a96e4ad3018011eedb838566d9" +checksum = "856f046b9400cee3c8c94ed572ecdb752444c24528c035cd35882aad6f492bcb" dependencies = [ "proc-macro2", "quote", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] @@ -3178,9 +3169,9 @@ dependencies = [ [[package]] name = "signal-hook-registry" -version = "1.4.1" +version = "1.4.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d8229b473baa5980ac72ef434c4415e70c4b5e71b423043adb4ba059f89c99a1" +checksum = "a9e9e0b4211b72e7b8b6e85c807d36c212bdb33ea8587f7569562a84df5465b1" dependencies = [ "libc", ] @@ -3236,9 +3227,9 @@ checksum = "1b6b67fb9a61334225b5b790716f609cd58395f895b3fe8b328786812a40bc3b" [[package]] name = "socket2" -version = "0.5.6" +version = "0.5.7" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "05ffd9c0a93b7543e062e759284fcf5f5e3b098501104bfbdde4d404db792871" +checksum = "ce305eb0b4296696835b71df73eb912e0f1ffd2556a501fcede6e0c50349191c" dependencies = [ "libc", "windows-sys 0.52.0", @@ -3274,7 +3265,7 @@ checksum = "01b2e185515564f15375f593fb966b5718bc624ba77fe49fa4616ad619690554" dependencies = [ "proc-macro2", "quote", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] @@ -3320,7 +3311,7 @@ dependencies = [ "proc-macro2", "quote", "rustversion", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] @@ -3333,7 +3324,7 @@ dependencies = [ "proc-macro2", "quote", "rustversion", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] @@ -3355,9 +3346,9 @@ dependencies = [ [[package]] name = "syn" -version = "2.0.60" +version = "2.0.61" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "909518bc7b1c9b779f1bbf07f2929d35af9f0f37e47c6e9ef7f9dddc1e1821f3" +checksum = "c993ed8ccba56ae856363b1845da7266a7cb78e1d146c8a32d54b45a8b831fc9" dependencies = [ "proc-macro2", "quote", @@ -3398,7 +3389,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "85b77fafb263dd9d05cbeac119526425676db3784113aa9295c88498cbf8bff1" dependencies = [ "cfg-if", - "fastrand 2.0.2", + "fastrand 2.1.0", "rustix", "windows-sys 0.52.0", ] @@ -3426,22 +3417,22 @@ checksum = "23d434d3f8967a09480fb04132ebe0a3e088c173e6d0ee7897abbdf4eab0f8b9" [[package]] name = "thiserror" -version = "1.0.58" +version = "1.0.60" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "03468839009160513471e86a034bb2c5c0e4baae3b43f79ffc55c4a5427b3297" +checksum = "579e9083ca58dd9dcf91a9923bb9054071b9ebbd800b342194c9feb0ee89fc18" dependencies = [ "thiserror-impl", ] [[package]] name = "thiserror-impl" -version = "1.0.58" +version = "1.0.60" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c61f3ba182994efc43764a46c018c347bc492c79f024e705f46567b418f6d4f7" +checksum = "e2470041c06ec3ac1ab38d0356a6119054dedaea53e12fbefc0de730a1c08524" dependencies = [ "proc-macro2", "quote", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] @@ -3536,7 +3527,7 @@ checksum = "5b8a1e28f2deaa14e508979454cb3a223b10b938b45af148bc0986de36f1923b" dependencies = [ "proc-macro2", "quote", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] @@ -3556,7 +3547,7 @@ version = "0.24.1" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "c28327cf380ac148141087fbfb9de9d7bd4e84ab5d2c28fbc911d753de8a7081" dependencies = [ - "rustls 0.21.10", + "rustls 0.21.12", "tokio", ] @@ -3573,16 +3564,15 @@ dependencies = [ [[package]] name = "tokio-util" -version = "0.7.10" +version = "0.7.11" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5419f34732d9eb6ee4c3578b7989078579b7f039cbbb9ca2c4da015749371e15" +checksum = "9cf6b47b3771c49ac75ad09a6162f53ad4b8088b76ac60e8ec1455b31a189fe1" dependencies = [ "bytes", "futures-core", "futures-sink", "pin-project-lite", "tokio", - "tracing", ] [[package]] @@ -3633,7 +3623,7 @@ checksum = "34704c8d6ebcbc939824180af020566b01a7c01f80641264eba0999f6c2b6be7" dependencies = [ "proc-macro2", "quote", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] @@ -3678,7 +3668,7 @@ checksum = "f03ca4cb38206e2bef0700092660bb74d696f808514dae47fa1467cbfe26e96e" dependencies = [ "proc-macro2", "quote", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] @@ -3716,9 +3706,9 @@ checksum = "d4c87d22b6e3f4a18d4d40ef354e97c90fcb14dd91d7dc0aa9d8a1172ebf7202" [[package]] name = "unicode-width" -version = "0.1.11" +version = "0.1.12" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e51733f11c9c4f72aa0c160008246859e340b00807569a0da0e7a1079b27ba85" +checksum = "68f5e5f3158ecfd4b8ff6fe086db7c8467a2dfdac97fe420f2b7c4aa97af66d6" [[package]] name = "untrusted" @@ -3832,7 +3822,7 @@ dependencies = [ "once_cell", "proc-macro2", "quote", - "syn 2.0.60", + "syn 2.0.61", "wasm-bindgen-shared", ] @@ -3866,7 +3856,7 @@ checksum = "e94f17b526d0a461a191c78ea52bbce64071ed5c04c9ffe424dcb38f74171bb7" dependencies = [ "proc-macro2", "quote", - "syn 2.0.60", + "syn 2.0.61", "wasm-bindgen-backend", "wasm-bindgen-shared", ] @@ -3928,11 +3918,11 @@ checksum = "ac3b87c63620426dd9b991e5ce0329eff545bccbbb34f3be09ff6fb6ab51b7b6" [[package]] name = "winapi-util" -version = "0.1.6" +version = "0.1.8" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f29e6f9198ba0d26b4c9f07dbe6f9ed633e1f3d5b8b414090084349e46a52596" +checksum = "4d4cc384e1e73b93bafa6fb4f1df8c41695c8a91cf9c4c64358067d15a7b6c6b" dependencies = [ - "winapi", + "windows-sys 0.52.0", ] [[package]] @@ -4116,22 +4106,22 @@ dependencies = [ [[package]] name = "zerocopy" -version = "0.7.32" +version = "0.7.34" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "74d4d3961e53fa4c9a25a8637fc2bfaf2595b3d3ae34875568a5cf64787716be" +checksum = "ae87e3fcd617500e5d106f0380cf7b77f3c6092aae37191433159dda23cfb087" dependencies = [ "zerocopy-derive", ] [[package]] name = "zerocopy-derive" -version = "0.7.32" +version = "0.7.34" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9ce1b18ccd8e73a9321186f97e46f9f04b778851177567b1975109d26a08d2a6" +checksum = "15e934569e47891f7d9411f1a451d947a60e000ab3bd24fbb970f000387d1b3b" dependencies = [ "proc-macro2", "quote", - "syn 2.0.60", + "syn 2.0.61", ] [[package]] diff --git a/datafusion-cli/Cargo.toml b/datafusion-cli/Cargo.toml index c6019bc5970c..4e3d800cfe97 100644 --- a/datafusion-cli/Cargo.toml +++ b/datafusion-cli/Cargo.toml @@ -18,12 +18,12 @@ [package] name = "datafusion-cli" description = "Command Line Client for DataFusion query engine." -version = "37.1.0" -authors = ["Apache Arrow "] +version = "38.0.0" +authors = ["Apache DataFusion "] edition = "2021" keywords = ["arrow", "datafusion", "query", "sql"] license = "Apache-2.0" -homepage = "https://github.com/apache/datafusion" +homepage = "https://datafusion.apache.org" repository = "https://github.com/apache/datafusion" # Specify MSRV here as `cargo msrv` doesn't support workspace version rust-version = "1.73" @@ -35,7 +35,7 @@ async-trait = "0.1.41" aws-config = "0.55" aws-credential-types = "0.55" clap = { version = "3", features = ["derive", "cargo"] } -datafusion = { path = "../datafusion/core", version = "37.1.0", features = [ +datafusion = { path = "../datafusion/core", version = "38.0.0", features = [ "avro", "crypto_expressions", "datetime_expressions", diff --git a/datafusion/CHANGELOG.md b/datafusion/CHANGELOG.md index 6ab4801b8c60..04de1efe5a81 100644 --- a/datafusion/CHANGELOG.md +++ b/datafusion/CHANGELOG.md @@ -19,6 +19,7 @@ # Changelog +- [38.0.0](../dev/changelog/38.0.0.md) - [37.1.0](../dev/changelog/37.1.0.md) - [37.0.0](../dev/changelog/37.0.0.md) - [36.0.0](../dev/changelog/36.0.0.md) diff --git a/dev/changelog/38.0.0.md b/dev/changelog/38.0.0.md new file mode 100644 index 000000000000..ca06ad5de475 --- /dev/null +++ b/dev/changelog/38.0.0.md @@ -0,0 +1,370 @@ + + +## [38.0.0](https://github.com/apache/datafusion/tree/38.0.0) (2024-05-07) + +**Breaking changes:** + +- refactor: make dfschema wrap schemaref [#9595](https://github.com/apache/datafusion/pull/9595) (haohuaijin) +- Make FirstValue an UDAF, Change `AggregateUDFImpl::accumulator` signature, support ORDER BY for UDAFs [#9874](https://github.com/apache/datafusion/pull/9874) (jayzhan211) +- Remove `OwnedTableReference` and `OwnedSchemaReference` [#9933](https://github.com/apache/datafusion/pull/9933) (comphead) +- Consistent LogicalPlan subquery handling in TreeNode::apply and TreeNode::visit [#9913](https://github.com/apache/datafusion/pull/9913) (peter-toth) +- Refactor `Optimizer` to use owned plans and `TreeNode` API (10% faster planning) [#9948](https://github.com/apache/datafusion/pull/9948) (alamb) +- Stop copying plans in `LogicalPlan::with_param_values` [#10016](https://github.com/apache/datafusion/pull/10016) (alamb) +- Move coalesce to datafusion-functions and remove BuiltInScalarFunction [#10098](https://github.com/apache/datafusion/pull/10098) (Omega359) +- Refactor sessionconfig set fns to avoid an unnecessary enum to string conversion [#10141](https://github.com/apache/datafusion/pull/10141) (psvri) +- ScalarUDF: Remove `supports_zero_argument` and avoid creating null array for empty args [#10193](https://github.com/apache/datafusion/pull/10193) (jayzhan211) +- Clean-up: Remove AggregateExec::group_by() [#10297](https://github.com/apache/datafusion/pull/10297) (berkaysynnada) +- Remove `ScalarFunctionDefinition::Name` [#10277](https://github.com/apache/datafusion/pull/10277) (lewiszlw) +- feat: Determine ordering of file groups [#9593](https://github.com/apache/datafusion/pull/9593) (suremarc) +- Split parquet bloom filter config and enable bloom filter on read by default [#10306](https://github.com/apache/datafusion/pull/10306) (lewiszlw) +- Improve coerce API so it does not need DFSchema [#10331](https://github.com/apache/datafusion/pull/10331) (alamb) +- Minor: Do not force analyzer to copy logical plans [#10367](https://github.com/apache/datafusion/pull/10367) (alamb) +- Move `Covariance` (Sample) `covar` / `covar_samp` to be a User Defined Aggregate Function [#10372](https://github.com/apache/datafusion/pull/10372) (jayzhan211) + +**Performance related:** + +- perf: Use `Arc` instead of `Cow<&'a>` in the analyzer [#9824](https://github.com/apache/datafusion/pull/9824) (comphead) + +**Implemented enhancements:** + +- feat: Add display_pg_json for LogicalPlan [#9789](https://github.com/apache/datafusion/pull/9789) (liurenjie1024) +- feat: eliminate redundant sorts on monotonic expressions [#9813](https://github.com/apache/datafusion/pull/9813) (suremarc) +- feat: optimize `lower` and `upper` functions [#9971](https://github.com/apache/datafusion/pull/9971) (JasonLi-cn) +- feat: support `unnest` multiple arrays [#10044](https://github.com/apache/datafusion/pull/10044) (jonahgao) +- feat: `DataFrame` supports unnesting multiple columns [#10118](https://github.com/apache/datafusion/pull/10118) (jonahgao) +- feat: support input reordering for `NestedLoopJoinExec` [#9676](https://github.com/apache/datafusion/pull/9676) (korowa) +- feat: add static_name() to ExecutionPlan [#10266](https://github.com/apache/datafusion/pull/10266) (waynexia) +- feat: add optimizer config param to avoid grouping partitions `prefer_existing_union` [#10259](https://github.com/apache/datafusion/pull/10259) (NGA-TRAN) +- feat: unwrap casts of string and dictionary columns [#10323](https://github.com/apache/datafusion/pull/10323) (erratic-pattern) +- feat: Add CrossJoin match case to unparser [#10371](https://github.com/apache/datafusion/pull/10371) (sardination) +- feat: run expression simplifier in a loop until a fixedpoint or 3 cycles [#10358](https://github.com/apache/datafusion/pull/10358) (erratic-pattern) + +**Fixed bugs:** + +- fix: detect non-recursive CTEs in the recursive `WITH` clause [#9836](https://github.com/apache/datafusion/pull/9836) (jonahgao) +- fix: improve `unnest_generic_list` handling of null list [#9975](https://github.com/apache/datafusion/pull/9975) (jonahgao) +- fix: reduce lock contention in `RepartitionExec::execute` [#10009](https://github.com/apache/datafusion/pull/10009) (crepererum) +- fix: `RepartitionExec` metrics [#10025](https://github.com/apache/datafusion/pull/10025) (crepererum) +- fix: Support Dict types in `in_list` physical plans [#10031](https://github.com/apache/datafusion/pull/10031) (advancedxy) +- fix: Specify row count in sort_batch for batch with no columns [#10094](https://github.com/apache/datafusion/pull/10094) (viirya) +- fix: another non-deterministic test in `joins.slt` [#10122](https://github.com/apache/datafusion/pull/10122) (korowa) +- fix: duplicate output for HashJoinExec in CollectLeft mode [#9757](https://github.com/apache/datafusion/pull/9757) (korowa) +- fix: cargo warnings of import item [#10196](https://github.com/apache/datafusion/pull/10196) (waynexia) +- fix: reduce lock contention in distributor channels [#10026](https://github.com/apache/datafusion/pull/10026) (crepererum) +- fix: no longer support the `substring` function [#10242](https://github.com/apache/datafusion/pull/10242) (jonahgao) +- fix: Correct null_count in describe() [#10260](https://github.com/apache/datafusion/pull/10260) (Weijun-H) +- fix: schema error when parsing order-by expressions [#10234](https://github.com/apache/datafusion/pull/10234) (jonahgao) +- fix: LogFunc simplify swaps arguments [#10360](https://github.com/apache/datafusion/pull/10360) (erratic-pattern) + +**Documentation updates:** + +- Update `COPY` documentation to reflect changes [#9754](https://github.com/apache/datafusion/pull/9754) (alamb) +- doc: Add `datafusion-federation` to Integrations [#9853](https://github.com/apache/datafusion/pull/9853) (phillipleblanc) +- Improve `AggregateUDFImpl::state_fields` documentation [#9919](https://github.com/apache/datafusion/pull/9919) (alamb) +- Update datafusion-cli docs, split up [#10078](https://github.com/apache/datafusion/pull/10078) (alamb) +- Fix large futures causing stack overflows [#10033](https://github.com/apache/datafusion/pull/10033) (sergiimk) +- Update documentation to replace Apache Arrow DataFusion with Apache DataFusion [#10130](https://github.com/apache/datafusion/pull/10130) (andygrove) +- Update github repo links [#10167](https://github.com/apache/datafusion/pull/10167) (lewiszlw) +- minor: fix installation section link [#10179](https://github.com/apache/datafusion/pull/10179) (comphead) +- Improve documentation on `TreeNode` [#10035](https://github.com/apache/datafusion/pull/10035) (alamb) +- Update .asf.yaml to publish docs to datafusion.apache.org [#10190](https://github.com/apache/datafusion/pull/10190) (phillipleblanc) +- Update links to point to datafusion.apache.org [#10195](https://github.com/apache/datafusion/pull/10195) (phillipleblanc) +- doc: fix subscribe mail link to datafusion mailing lists [#10225](https://github.com/apache/datafusion/pull/10225) (jackwener) +- Fix docs.rs build for datafusion-proto (hopefully) [#10254](https://github.com/apache/datafusion/pull/10254) (alamb) +- docs: add download page [#10271](https://github.com/apache/datafusion/pull/10271) (tisonkun) +- Clarify docs explaining the relationship between `SessionState` and `SessionContext` [#10350](https://github.com/apache/datafusion/pull/10350) (alamb) +- docs: Add DataFusion subprojects to navigation menu, other minor updates [#10362](https://github.com/apache/datafusion/pull/10362) (andygrove) + +**Merged pull requests:** + +- Prepare 37.0.0 Release [#9697](https://github.com/apache/datafusion/pull/9697) (andygrove) +- move Left, Lpad, Reverse, Right, Rpad functions to datafusion_functions [#9841](https://github.com/apache/datafusion/pull/9841) (Omega359) +- Add non-column expression equality tracking to filter exec [#9819](https://github.com/apache/datafusion/pull/9819) (mustafasrepo) +- datafusion-cli support for multiple commands in a single line [#9831](https://github.com/apache/datafusion/pull/9831) (berkaysynnada) +- Add tests for filtering, grouping, aggregation of ARRAYs [#9695](https://github.com/apache/datafusion/pull/9695) (alamb) +- Remove vestigal conbench integration [#9855](https://github.com/apache/datafusion/pull/9855) (alamb) +- feat: Add display_pg_json for LogicalPlan [#9789](https://github.com/apache/datafusion/pull/9789) (liurenjie1024) +- Update `COPY` documentation to reflect changes [#9754](https://github.com/apache/datafusion/pull/9754) (alamb) +- Minor: Remove the bench most likely to cause OOM in CI [#9858](https://github.com/apache/datafusion/pull/9858) (gruuya) +- Minor: make uuid an optional dependency on datafusion-functions [#9771](https://github.com/apache/datafusion/pull/9771) (alamb) +- doc: Add `Spice.ai` to Known Users [#9852](https://github.com/apache/datafusion/pull/9852) (phillipleblanc) +- minor: add a hint how to adjust max rows displayed [#9845](https://github.com/apache/datafusion/pull/9845) (comphead) +- Exclude .github directory from release tarball [#9850](https://github.com/apache/datafusion/pull/9850) (andygrove) +- move strpos, substr functions to datafusion_functions [#9849](https://github.com/apache/datafusion/pull/9849) (Omega359) +- doc: Add `datafusion-federation` to Integrations [#9853](https://github.com/apache/datafusion/pull/9853) (phillipleblanc) +- chore(deps): update cargo requirement from 0.77.0 to 0.78.1 [#9844](https://github.com/apache/datafusion/pull/9844) (dependabot[bot]) +- chore(deps-dev): bump webpack-dev-middleware from 5.3.3 to 5.3.4 in /datafusion/wasmtest/datafusion-wasm-app [#9741](https://github.com/apache/datafusion/pull/9741) (dependabot[bot]) +- Implement semi/anti join output statistics estimation [#9800](https://github.com/apache/datafusion/pull/9800) (korowa) +- move Log2, Log10, Ln to datafusion-functions [#9869](https://github.com/apache/datafusion/pull/9869) (tinfoil-knight) +- Add CI compile checks for feature flags in datafusion-functions [#9772](https://github.com/apache/datafusion/pull/9772) (alamb) +- move the Translate, SubstrIndex, FindInSet functions to datafusion-functions [#9864](https://github.com/apache/datafusion/pull/9864) (Omega359) +- Support custom struct field names with new scalar function named_struct [#9743](https://github.com/apache/datafusion/pull/9743) (gstvg) +- Allow declaring partition columns in `PARTITION BY` clause, backwards compatible [#9599](https://github.com/apache/datafusion/pull/9599) (MohamedAbdeen21) +- Minor: Move depcheck out of datafusion crate (200 less crates to compile) [#9865](https://github.com/apache/datafusion/pull/9865) (alamb) +- Minor: delete duplicate bench test [#9866](https://github.com/apache/datafusion/pull/9866) (Lordworms) +- parquet: Add tests for pruning on Int8/Int16/Int64 columns [#9778](https://github.com/apache/datafusion/pull/9778) (progval) +- move `Atan2`, `Atan`, `Acosh`, `Asinh`, `Atanh` to `datafusion-function` [#9872](https://github.com/apache/datafusion/pull/9872) (Weijun-H) +- minor(doc): fix dead link for catalogs example [#9883](https://github.com/apache/datafusion/pull/9883) (yjshen) +- parquet: Add tests for page pruning on unsigned integers [#9888](https://github.com/apache/datafusion/pull/9888) (progval) +- fix(9870): common expression elimination optimization, should always re-find the correct expression during re-write. [#9871](https://github.com/apache/datafusion/pull/9871) (wiedld) +- [CI] Use alias for table.struct [#9894](https://github.com/apache/datafusion/pull/9894) (jayzhan211) +- fix: detect non-recursive CTEs in the recursive `WITH` clause [#9836](https://github.com/apache/datafusion/pull/9836) (jonahgao) +- Minor: Add SIGMOD paper reference to architecture guide [#9886](https://github.com/apache/datafusion/pull/9886) (alamb) +- refactor: add macro for the binary math function in `datafusion-function` [#9889](https://github.com/apache/datafusion/pull/9889) (Weijun-H) +- Add benchmark for substr_index [#9878](https://github.com/apache/datafusion/pull/9878) (Omega359) +- Add test for reading back file created with `COPY ... OPTIONS (FORMAT..)` options [#9753](https://github.com/apache/datafusion/pull/9753) (alamb) +- Add Expr->String for SimilarTo, IsNotTrue, IsNotUnknown,Negative [#9902](https://github.com/apache/datafusion/pull/9902) (yyy1000) +- refactor: make dfschema wrap schemaref [#9595](https://github.com/apache/datafusion/pull/9595) (haohuaijin) +- Add `spilled_rows` metric to `ExternalSorter` by `IPCWriter` [#9885](https://github.com/apache/datafusion/pull/9885) (erenavsarogullari) +- Minor: Add ParquetExec::table_parquet_options accessor [#9909](https://github.com/apache/datafusion/pull/9909) (alamb) +- Add support for Bloom filters on unsigned integer columns in Parquet tables [#9770](https://github.com/apache/datafusion/pull/9770) (progval) +- Move `radians`, `signum`, `sin`, `sinh` and `sqrt` functions to `datafusion-functions` crate [#9882](https://github.com/apache/datafusion/pull/9882) (erenavsarogullari) +- refactor: make all udf function impls public [#9903](https://github.com/apache/datafusion/pull/9903) (universalmind303) +- Minor: Improve math expr description [#9911](https://github.com/apache/datafusion/pull/9911) (caicancai) +- perf: Use `Arc` instead of `Cow<&'a>` in the analyzer [#9824](https://github.com/apache/datafusion/pull/9824) (comphead) +- Use `struct` instead of `named_struct` when there are no aliases [#9897](https://github.com/apache/datafusion/pull/9897) (alamb) +- Improve planning speed using `impl Into>` to create Arc rather than `&str` [#9916](https://github.com/apache/datafusion/pull/9916) (alamb) +- Make FirstValue an UDAF, Change `AggregateUDFImpl::accumulator` signature, support ORDER BY for UDAFs [#9874](https://github.com/apache/datafusion/pull/9874) (jayzhan211) +- Add TPCH-DS planning benchmark [#9907](https://github.com/apache/datafusion/pull/9907) (alamb) +- Simplify Expr::map_children [#9876](https://github.com/apache/datafusion/pull/9876) (peter-toth) +- CrossJoin Refactor [#9830](https://github.com/apache/datafusion/pull/9830) (berkaysynnada) +- Optimization: concat function [#9732](https://github.com/apache/datafusion/pull/9732) (JasonLi-cn) +- Improve `AggregateUDFImpl::state_fields` documentation [#9919](https://github.com/apache/datafusion/pull/9919) (alamb) +- chore(deps): update substrait requirement from 0.28.0 to 0.29.0 [#9942](https://github.com/apache/datafusion/pull/9942) (dependabot[bot]) +- test: fix intermittent failure in cte.slt [#9934](https://github.com/apache/datafusion/pull/9934) (jonahgao) +- Move `cbrt`, `cos`, `cosh`, `degrees` to `datafusion-functions` [#9938](https://github.com/apache/datafusion/pull/9938) (erenavsarogullari) +- Add Expr->String for Exists, Sort [#9936](https://github.com/apache/datafusion/pull/9936) (kevinmingtarja) +- Remove `OwnedTableReference` and `OwnedSchemaReference` [#9933](https://github.com/apache/datafusion/pull/9933) (comphead) +- Prune out constant expressions from output ordering. [#9947](https://github.com/apache/datafusion/pull/9947) (mustafasrepo) +- Move `AggregateExpr`, `PhysicalExpr` and `PhysicalSortExpr` to physical-expr-core [#9926](https://github.com/apache/datafusion/pull/9926) (jayzhan211) +- Minor: Update release README [#9956](https://github.com/apache/datafusion/pull/9956) (alamb) +- Optimize `COUNT(1)`: Change the sentinel value's type for COUNT(\*) to Int64 [#9944](https://github.com/apache/datafusion/pull/9944) (gruuya) +- Improve docs for `TableProvider::supports_filters_pushdown` and remove deprecated function [#9923](https://github.com/apache/datafusion/pull/9923) (alamb) +- Minor: Improve documentation for AggregateUDFImpl::accumulator and `AccumulatorArgs` [#9920](https://github.com/apache/datafusion/pull/9920) (alamb) +- Minor: improve TableReference docs [#9952](https://github.com/apache/datafusion/pull/9952) (alamb) +- Fix datafusion-cli publishing [#9955](https://github.com/apache/datafusion/pull/9955) (alamb) +- Simplify TreeNode recursions [#9965](https://github.com/apache/datafusion/pull/9965) (peter-toth) +- Validate partitions columns in `CREATE EXTERNAL TABLE` if table already exists. [#9912](https://github.com/apache/datafusion/pull/9912) (MohamedAbdeen21) +- Minor: Add additional documentation to `CommonSubexprEliminate` [#9959](https://github.com/apache/datafusion/pull/9959) (alamb) +- Fix tpcds planning stack overflows - Join planning refactoring [#9962](https://github.com/apache/datafusion/pull/9962) (Jefffrey) +- coercion vec[Dictionary, Utf8] to Dictionary for coalesce function [#9958](https://github.com/apache/datafusion/pull/9958) (Lordworms) +- Minor: Update library documentation with new crates [#9966](https://github.com/apache/datafusion/pull/9966) (alamb) +- Minor: Return InternalError rather than panic for `NamedStructField should be rewritten in OperatorToFunction` [#9968](https://github.com/apache/datafusion/pull/9968) (alamb) +- minor: update MSRV 1.73 [#9977](https://github.com/apache/datafusion/pull/9977) (comphead) +- Move First Value UDAF and builtin first / last function to `aggregate-functions` [#9960](https://github.com/apache/datafusion/pull/9960) (jayzhan211) +- Minor: Avoid copying all expressions in `Analzyer` / `check_plan` [#9974](https://github.com/apache/datafusion/pull/9974) (alamb) +- Minor: Improve documentation about optimizer [#9967](https://github.com/apache/datafusion/pull/9967) (alamb) +- Minor: Use `Expr::apply()` instead of `inspect_expr_pre()` [#9984](https://github.com/apache/datafusion/pull/9984) (peter-toth) +- Update documentation for COPY command [#9931](https://github.com/apache/datafusion/pull/9931) (alamb) +- Minor: fix bug in pruning predicate doc [#9986](https://github.com/apache/datafusion/pull/9986) (alamb) +- fix: improve `unnest_generic_list` handling of null list [#9975](https://github.com/apache/datafusion/pull/9975) (jonahgao) +- Consistent LogicalPlan subquery handling in TreeNode::apply and TreeNode::visit [#9913](https://github.com/apache/datafusion/pull/9913) (peter-toth) +- Remove unnecessary result in `DFSchema::index_of_column_by_name` [#9990](https://github.com/apache/datafusion/pull/9990) (lewiszlw) +- Removes Bloom filter for Int8/Int16/Uint8/Uint16 [#9969](https://github.com/apache/datafusion/pull/9969) (edmondop) +- Move LogicalPlan `tree_node` module [#9995](https://github.com/apache/datafusion/pull/9995) (alamb) +- Optimize performance of substr_index and add tests [#9973](https://github.com/apache/datafusion/pull/9973) (kevinmingtarja) +- move Floor, Gcd, Lcm, Pi to datafusion-functions [#9976](https://github.com/apache/datafusion/pull/9976) (Omega359) +- Minor: Improve documentation on `LogicalPlan::apply*` and `LogicalPlan::map*` [#9996](https://github.com/apache/datafusion/pull/9996) (alamb) +- move the Log, Power functions to datafusion-functions [#9983](https://github.com/apache/datafusion/pull/9983) (tinfoil-knight) +- Remove FORMAT <..> backwards compatibility options from COPY [#9985](https://github.com/apache/datafusion/pull/9985) (tinfoil-knight) +- move Trunc, Cot, Round, iszero functions to datafusion-functions [#10000](https://github.com/apache/datafusion/pull/10000) (Omega359) +- Minor: Clarify documentation on `PruningStatistics::row_counts` and `PruningStatistics::null_counts` and make test match [#10004](https://github.com/apache/datafusion/pull/10004) (alamb) +- Avoid `LogicalPlan::clone()` in `LogicalPlan::map_children` when possible [#9999](https://github.com/apache/datafusion/pull/9999) (alamb) +- Introduce `TreeNode::exists()` API, avoid copying expressions [#10008](https://github.com/apache/datafusion/pull/10008) (peter-toth) +- Minor: Make `LogicalPlan::apply_subqueries` and `LogicalPlan::map_subqueries` pub [#9998](https://github.com/apache/datafusion/pull/9998) (alamb) +- Move Nanvl and random functions to datafusion-functions [#10017](https://github.com/apache/datafusion/pull/10017) (Omega359) +- fix: reduce lock contention in `RepartitionExec::execute` [#10009](https://github.com/apache/datafusion/pull/10009) (crepererum) +- chore(deps): update rstest requirement from 0.18.0 to 0.19.0 [#10021](https://github.com/apache/datafusion/pull/10021) (dependabot[bot]) +- Minor: Document LogicalPlan tree node transformations [#10010](https://github.com/apache/datafusion/pull/10010) (alamb) +- Refactor `Optimizer` to use owned plans and `TreeNode` API (10% faster planning) [#9948](https://github.com/apache/datafusion/pull/9948) (alamb) +- Further clarification of the supports_filters_pushdown documentation [#9988](https://github.com/apache/datafusion/pull/9988) (cisaacson) +- Prune columns are all null in ParquetExec by row_counts , handle IS NOT NULL [#9989](https://github.com/apache/datafusion/pull/9989) (Ted-Jiang) +- Improve the performance of ltrim/rtrim/btrim [#10006](https://github.com/apache/datafusion/pull/10006) (JasonLi-cn) +- fix: `RepartitionExec` metrics [#10025](https://github.com/apache/datafusion/pull/10025) (crepererum) +- modify emit() of TopK to emit on `batch_size` rather than `batch_size-1` [#10030](https://github.com/apache/datafusion/pull/10030) (JasonLi-cn) +- Consolidate LogicalPlan tree node walking/rewriting code into one module [#10034](https://github.com/apache/datafusion/pull/10034) (alamb) +- Introduce `OptimizerRule::rewrite` to rewrite in place, rewrite `ExprSimplifier` (20% faster planning) [#9954](https://github.com/apache/datafusion/pull/9954) (alamb) +- Fix DistinctCount for timestamps with time zone [#10043](https://github.com/apache/datafusion/pull/10043) (joroKr21) +- Improve documentation on `LogicalPlan` TreeNode methods [#10037](https://github.com/apache/datafusion/pull/10037) (alamb) +- chore(deps): update prost-build requirement from =0.12.3 to =0.12.4 [#10045](https://github.com/apache/datafusion/pull/10045) (crepererum) +- Fix datafusion-cli cursor isn't on the right position in windows 7 cmd [#10028](https://github.com/apache/datafusion/pull/10028) (colommar) +- Always pass DataType to PrimitiveDistinctCountAccumulator [#10047](https://github.com/apache/datafusion/pull/10047) (joroKr21) +- Stop copying plans in `LogicalPlan::with_param_values` [#10016](https://github.com/apache/datafusion/pull/10016) (alamb) +- fix `NamedStructField should be rewritten in OperatorToFunction` in subquery regression (change `ApplyFunctionRewrites` to use TreeNode API [#10032](https://github.com/apache/datafusion/pull/10032) (alamb) +- Avoid copies in `InlineTableScan` via TreeNode API [#10038](https://github.com/apache/datafusion/pull/10038) (alamb) +- Bump sccache-action to v0.0.4 [#10060](https://github.com/apache/datafusion/pull/10060) (phillipleblanc) +- chore: add GitHub workflow to close stale PRs [#10046](https://github.com/apache/datafusion/pull/10046) (andygrove) +- feat: eliminate redundant sorts on monotonic expressions [#9813](https://github.com/apache/datafusion/pull/9813) (suremarc) +- Disable `crypto_expressions` feature properly for --no-default-features [#10059](https://github.com/apache/datafusion/pull/10059) (phillipleblanc) +- Return self in EmptyExec and PlaceholderRowExec with_new_children [#10052](https://github.com/apache/datafusion/pull/10052) (joroKr21) +- chore(deps): update sqllogictest requirement from 0.19.0 to 0.20.0 [#10057](https://github.com/apache/datafusion/pull/10057) (dependabot[bot]) +- Rename `FileSinkExec` to `DataSinkExec` [#10065](https://github.com/apache/datafusion/pull/10065) (phillipleblanc) +- fix: Support Dict types in `in_list` physical plans [#10031](https://github.com/apache/datafusion/pull/10031) (advancedxy) +- Prune pages are all null in ParquetExec by row_counts and fix NOT NULL prune [#10051](https://github.com/apache/datafusion/pull/10051) (Ted-Jiang) +- Refactor `EliminateOuterJoin` to implement `OptimizerRule::rewrite()` [#10081](https://github.com/apache/datafusion/pull/10081) (peter-toth) +- chore(deps): update substrait requirement from 0.29.0 to 0.30.0 [#10084](https://github.com/apache/datafusion/pull/10084) (dependabot[bot]) +- feat: optimize `lower` and `upper` functions [#9971](https://github.com/apache/datafusion/pull/9971) (JasonLi-cn) +- Prepend sqllogictest explain result with line number [#10019](https://github.com/apache/datafusion/pull/10019) (duongcongtoai) +- Use PhysicalExtensionCodec consistently [#10075](https://github.com/apache/datafusion/pull/10075) (joroKr21) +- Minor: Do not truncate `SHOW ALL` in datafusion-cli [#10079](https://github.com/apache/datafusion/pull/10079) (alamb) +- Minor: get mutable ref to `SessionConfig` in `SessionState` [#10050](https://github.com/apache/datafusion/pull/10050) (MichaelScofield) +- Move `ceil`, `exp`, `factorial` to `datafusion-functions` crate [#10083](https://github.com/apache/datafusion/pull/10083) (erenavsarogullari) +- feat: support `unnest` multiple arrays [#10044](https://github.com/apache/datafusion/pull/10044) (jonahgao) +- cleanup(tests): Move tests from `push_down_projections.rs` to `optimize_projections.rs` [#10071](https://github.com/apache/datafusion/pull/10071) (kavirajk) +- Move conversion of FIRST/LAST Aggregate function to independent physical optimizer rule [#10061](https://github.com/apache/datafusion/pull/10061) (jayzhan211) +- Avoid copies in `CountWildcardRule` via TreeNode API [#10066](https://github.com/apache/datafusion/pull/10066) (alamb) +- Coerce Dictionary types for scalar functions [#10077](https://github.com/apache/datafusion/pull/10077) (viirya) +- Refactor `UnwrapCastInComparison` to implement `OptimizerRule::rewrite()` [#10087](https://github.com/apache/datafusion/pull/10087) (peter-toth) +- Improve ApproxPercentileAccumulator merge api and fix bug [#10056](https://github.com/apache/datafusion/pull/10056) (Ted-Jiang) +- Support http s3 endpoints in datafusion-cli via `CREATE EXTERNAL TABLE` [#10080](https://github.com/apache/datafusion/pull/10080) (alamb) +- [Bug Fix]: Deem hash repartition unnecessary when input and output has 1 partition [#10095](https://github.com/apache/datafusion/pull/10095) (mustafasrepo) +- fix: Specify row count in sort_batch for batch with no columns [#10094](https://github.com/apache/datafusion/pull/10094) (viirya) +- Move concat, concat_ws, ends_with, initcap to datafusion-functions [#10089](https://github.com/apache/datafusion/pull/10089) (Omega359) +- Update datafusion-cli docs, split up [#10078](https://github.com/apache/datafusion/pull/10078) (alamb) +- Refactor physical create_initial_plan to iteratively & concurrently construct plan from the bottom up [#10023](https://github.com/apache/datafusion/pull/10023) (Jefffrey) +- Adding TPCH benchmarks for Sort Merge Join [#10092](https://github.com/apache/datafusion/pull/10092) (comphead) +- [minor] make parquet prune tests more readable [#10112](https://github.com/apache/datafusion/pull/10112) (Ted-Jiang) +- Fix intermittent CI test failure in `joins.slt` [#10120](https://github.com/apache/datafusion/pull/10120) (alamb) +- Update dependabot to consider datafusion-cli [#10108](https://github.com/apache/datafusion/pull/10108) (Jefffrey) +- fix: another non-deterministic test in `joins.slt` [#10122](https://github.com/apache/datafusion/pull/10122) (korowa) +- Minor: only trigger dependency check on changes to Cargo.toml [#10099](https://github.com/apache/datafusion/pull/10099) (alamb) +- Refactor `UnwrapCastInComparison` to remove `Expr` clones [#10115](https://github.com/apache/datafusion/pull/10115) (peter-toth) +- Fix large futures causing stack overflows [#10033](https://github.com/apache/datafusion/pull/10033) (sergiimk) +- Avoid cloning in `log::simplify` and `power::simplify` [#10086](https://github.com/apache/datafusion/pull/10086) (alamb) +- feat: `DataFrame` supports unnesting multiple columns [#10118](https://github.com/apache/datafusion/pull/10118) (jonahgao) +- Minor: Refine dev/release/README.md [#10129](https://github.com/apache/datafusion/pull/10129) (alamb) +- Minor: Add default for `Expr` [#10127](https://github.com/apache/datafusion/pull/10127) (peter-toth) +- Update documentation to replace Apache Arrow DataFusion with Apache DataFusion [#10130](https://github.com/apache/datafusion/pull/10130) (andygrove) +- Fix AVG groups accummulator ignoring return type [#10114](https://github.com/apache/datafusion/pull/10114) (gruuya) +- Port `37.1.0` changes to main [#10136](https://github.com/apache/datafusion/pull/10136) (alamb) +- chore(deps): update substrait requirement from 0.30.0 to 0.31.0 [#10140](https://github.com/apache/datafusion/pull/10140) (dependabot[bot]) +- Minor: Support more args for udaf [#10146](https://github.com/apache/datafusion/pull/10146) (jayzhan211) +- Minor: Signature check for UDAF [#10147](https://github.com/apache/datafusion/pull/10147) (jayzhan211) +- minor: avoid cloning the `SetExpr` during planning of `SelectInto` [#10152](https://github.com/apache/datafusion/pull/10152) (jonahgao) +- Add distinct aggregate tests to sqllogictest [#10158](https://github.com/apache/datafusion/pull/10158) (Jefffrey) +- Add test for LIKE newline handling [#10160](https://github.com/apache/datafusion/pull/10160) (Jefffrey) +- minor: unparser cleanup and new roundtrip test [#10150](https://github.com/apache/datafusion/pull/10150) (devinjdangelo) +- Support Duration and Union types in ScalarValue::iter_to_array [#10139](https://github.com/apache/datafusion/pull/10139) (joroKr21) +- chore(deps): update sqlparser requirement from 0.44.0 to 0.45.0 [#10137](https://github.com/apache/datafusion/pull/10137) (Jefffrey) +- fix: duplicate output for HashJoinExec in CollectLeft mode [#9757](https://github.com/apache/datafusion/pull/9757) (korowa) +- Move coalesce to datafusion-functions and remove BuiltInScalarFunction [#10098](https://github.com/apache/datafusion/pull/10098) (Omega359) +- [DOC] Add test example for backtraces [#10143](https://github.com/apache/datafusion/pull/10143) (comphead) +- Update github repo links [#10167](https://github.com/apache/datafusion/pull/10167) (lewiszlw) +- feat: support input reordering for `NestedLoopJoinExec` [#9676](https://github.com/apache/datafusion/pull/9676) (korowa) +- minor: fix installation section link [#10179](https://github.com/apache/datafusion/pull/10179) (comphead) +- Improve `TreeNode` and `LogicalPlan` APIs to accept owned closures, deprecate `transform_down_mut()` and `transform_up_mut()` [#10126](https://github.com/apache/datafusion/pull/10126) (peter-toth) +- Projection Expression - Input Field Inconsistencies during Projection [#10088](https://github.com/apache/datafusion/pull/10088) (berkaysynnada) +- implement short_circuits function for ScalarUDFImpl trait [#10168](https://github.com/apache/datafusion/pull/10168) (Lordworms) +- Improve documentation on `TreeNode` [#10035](https://github.com/apache/datafusion/pull/10035) (alamb) +- implement rewrite for ExtractEquijoinPredicate and avoid clone in filter [#10165](https://github.com/apache/datafusion/pull/10165) (Lordworms) +- Update .asf.yaml to point to new mailing list [#10189](https://github.com/apache/datafusion/pull/10189) (phillipleblanc) +- Update NOTICE.txt to be relevant to DataFusion [#10185](https://github.com/apache/datafusion/pull/10185) (alamb) +- Update .asf.yaml to publish docs to datafusion.apache.org [#10190](https://github.com/apache/datafusion/pull/10190) (phillipleblanc) +- Minor: Add `Column::from(Tableref, &FieldRef)`, `Expr::from(Column)` and `Expr::from(Tableref, &FieldRef)` [#10178](https://github.com/apache/datafusion/pull/10178) (alamb) +- implement rewrite for FilterNullJoinKeys [#10166](https://github.com/apache/datafusion/pull/10166) (Lordworms) +- Implement rewrite for EliminateOneUnion and EliminateJoin [#10184](https://github.com/apache/datafusion/pull/10184) (Lordworms) +- Update links to point to datafusion.apache.org [#10195](https://github.com/apache/datafusion/pull/10195) (phillipleblanc) +- Minor: Introduce `Expr::is_volatile()`, adjust `TreeNode::exists()` [#10191](https://github.com/apache/datafusion/pull/10191) (peter-toth) +- Doc: Modify docs to fix old naming [#10199](https://github.com/apache/datafusion/pull/10199) (comphead) +- [MINOR] Remove ScalarFunction from datafusion.proto #10173 [#10202](https://github.com/apache/datafusion/pull/10202) (dmitrybugakov) +- Allow expr_to_sql unparsing with no quotes [#10198](https://github.com/apache/datafusion/pull/10198) (phillipleblanc) +- Minor: Avoid a clone in ArrayFunctionRewriter [#10204](https://github.com/apache/datafusion/pull/10204) (alamb) +- Move coalesce function from math to core [#10201](https://github.com/apache/datafusion/pull/10201) (xxxuuu) +- fix: cargo warnings of import item [#10196](https://github.com/apache/datafusion/pull/10196) (waynexia) +- Minor: Remove some clone in `TypeCoercion` [#10203](https://github.com/apache/datafusion/pull/10203) (alamb) +- doc: fix subscribe mail link to datafusion mailing lists [#10225](https://github.com/apache/datafusion/pull/10225) (jackwener) +- Minor: Prevent empty datafusion-cli commands [#10219](https://github.com/apache/datafusion/pull/10219) (comphead) +- Optimize date_bin (2x faster) [#10215](https://github.com/apache/datafusion/pull/10215) (simonvandel) +- Refactor sessionconfig set fns to avoid an unnecessary enum to string conversion [#10141](https://github.com/apache/datafusion/pull/10141) (psvri) +- fix: reduce lock contention in distributor channels [#10026](https://github.com/apache/datafusion/pull/10026) (crepererum) +- Avoid `Expr` copies `OptimizeProjection`, 12% faster planning, encapsulate indicies [#10216](https://github.com/apache/datafusion/pull/10216) (alamb) +- chore: Create a doap file [#10233](https://github.com/apache/datafusion/pull/10233) (tisonkun) +- Allow adding user defined metadata to `ParquetSink` [#10224](https://github.com/apache/datafusion/pull/10224) (wiedld) +- refactor `EliminateDuplicatedExpr` optimizer pass to avoid clone [#10218](https://github.com/apache/datafusion/pull/10218) (Lordworms) +- Support for median(distinct) aggregation function [#10226](https://github.com/apache/datafusion/pull/10226) (Jefffrey) +- Add tests that `random()` and `uuid()` produce unique values for each row [#10248](https://github.com/apache/datafusion/pull/10248) (alamb) +- ScalarUDF: Remove `supports_zero_argument` and avoid creating null array for empty args [#10193](https://github.com/apache/datafusion/pull/10193) (jayzhan211) +- Add Expr->String for WindowFunction [#10243](https://github.com/apache/datafusion/pull/10243) (yyy1000) +- Make function modules public, add Default impl's. [#10239](https://github.com/apache/datafusion/pull/10239) (Omega359) +- chore: Update release scripts to reflect move to TLP [#10235](https://github.com/apache/datafusion/pull/10235) (andygrove) +- Stop copying plans in `EliminateLimit` [#10253](https://github.com/apache/datafusion/pull/10253) (kevinmingtarja) +- Minor Clean-up in JoinSelection Tests [#10249](https://github.com/apache/datafusion/pull/10249) (berkaysynnada) +- fix: no longer support the `substring` function [#10242](https://github.com/apache/datafusion/pull/10242) (jonahgao) +- Fix docs.rs build for datafusion-proto (hopefully) [#10254](https://github.com/apache/datafusion/pull/10254) (alamb) +- Minor: Possibility to strip datafusion error name [#10186](https://github.com/apache/datafusion/pull/10186) (comphead) +- Docs: Add governance page to contributor guide [#10238](https://github.com/apache/datafusion/pull/10238) (alamb) +- Improve documentation on `ColumnarValue` [#10265](https://github.com/apache/datafusion/pull/10265) (alamb) +- Minor: Add comments for removed protobuf nodes [#10252](https://github.com/apache/datafusion/pull/10252) (alamb) +- feat: add static_name() to ExecutionPlan [#10266](https://github.com/apache/datafusion/pull/10266) (waynexia) +- Zero-copy conversion from SchemaRef to DfSchema [#10298](https://github.com/apache/datafusion/pull/10298) (tustvold) +- chore: Update Error for Unnest Rewritter [#10263](https://github.com/apache/datafusion/pull/10263) (Weijun-H) +- feat(CLI): print column headers for empty query results [#10300](https://github.com/apache/datafusion/pull/10300) (jonahgao) +- Clean-up: Remove AggregateExec::group_by() [#10297](https://github.com/apache/datafusion/pull/10297) (berkaysynnada) +- Add mailing list descriptions to documentation [#10284](https://github.com/apache/datafusion/pull/10284) (alamb) +- chore(deps): update substrait requirement from 0.31.0 to 0.32.0 [#10279](https://github.com/apache/datafusion/pull/10279) (dependabot[bot]) +- refactor: Convert `IPCWriter` metrics from `u64` to `usize` [#10278](https://github.com/apache/datafusion/pull/10278) (erenavsarogullari) +- Validate ScalarUDF output rows and fix nulls for `array_has` and `get_field` for `Map` [#10148](https://github.com/apache/datafusion/pull/10148) (duongcongtoai) +- Minor: return NULL for range and generate_series [#10275](https://github.com/apache/datafusion/pull/10275) (Lordworms) +- docs: add download page [#10271](https://github.com/apache/datafusion/pull/10271) (tisonkun) +- Minor: Add some more tests to map.slt [#10301](https://github.com/apache/datafusion/pull/10301) (alamb) +- fix: Correct null_count in describe() [#10260](https://github.com/apache/datafusion/pull/10260) (Weijun-H) +- chore: Add datatype info to error message [#10307](https://github.com/apache/datafusion/pull/10307) (viirya) +- feat: add optimizer config param to avoid grouping partitions `prefer_existing_union` [#10259](https://github.com/apache/datafusion/pull/10259) (NGA-TRAN) +- Remove `ScalarFunctionDefinition::Name` [#10277](https://github.com/apache/datafusion/pull/10277) (lewiszlw) +- Display: Support `preserve_partitioning` on SortExec physical plan. [#10153](https://github.com/apache/datafusion/pull/10153) (kavirajk) +- Fix build with missing `use` ( `" return internal_err!("UDF returned a different ..."`) [#10317](https://github.com/apache/datafusion/pull/10317) (alamb) +- [Minor] Update link to list of committers in contributor guide [#10312](https://github.com/apache/datafusion/pull/10312) (alamb) +- Optimize EliminateFilter to avoid unnecessary copies #10288 [#10302](https://github.com/apache/datafusion/pull/10302) (dmitrybugakov) +- chore: add function to set prefer_existing_union [#10322](https://github.com/apache/datafusion/pull/10322) (NGA-TRAN) +- `ExecutionPlan` visitor example documentation [#10286](https://github.com/apache/datafusion/pull/10286) (matthewmturner) +- fix: schema error when parsing order-by expressions [#10234](https://github.com/apache/datafusion/pull/10234) (jonahgao) +- Stop copying LogicalPlan and Exprs in `RewriteDisjunctivePredicate` [#10305](https://github.com/apache/datafusion/pull/10305) (rohitrastogi) +- feat: unwrap casts of string and dictionary columns [#10323](https://github.com/apache/datafusion/pull/10323) (erratic-pattern) +- feat: Determine ordering of file groups [#9593](https://github.com/apache/datafusion/pull/9593) (suremarc) +- Stop copying LogicalPlan and Exprs in `DecorrelatePredicateSubquery` [#10318](https://github.com/apache/datafusion/pull/10318) (alamb) +- Minor: Add additional coalesce tests [#10334](https://github.com/apache/datafusion/pull/10334) (alamb) +- Minor: add a few more dictionary unwrap tests [#10335](https://github.com/apache/datafusion/pull/10335) (alamb) +- Check list size before concat in ScalarValue [#10329](https://github.com/apache/datafusion/pull/10329) (timsaucer) +- Split parquet bloom filter config and enable bloom filter on read by default [#10306](https://github.com/apache/datafusion/pull/10306) (lewiszlw) +- Improve coerce API so it does not need DFSchema [#10331](https://github.com/apache/datafusion/pull/10331) (alamb) +- Stop copying LogicalPlan and Exprs in `PropagateEmptyRelation` [#10332](https://github.com/apache/datafusion/pull/10332) (dmitrybugakov) +- Stop copying LogicalPlan and Exprs in EliminateNestedUnion [#10319](https://github.com/apache/datafusion/pull/10319) (emgeee) +- Fix clippy lints found by Clippy in Rust `1.78` [#10353](https://github.com/apache/datafusion/pull/10353) (alamb) +- Minor: Add sql level test for lead/lag on arrays [#10345](https://github.com/apache/datafusion/pull/10345) (alamb) +- fix: LogFunc simplify swaps arguments [#10360](https://github.com/apache/datafusion/pull/10360) (erratic-pattern) +- Refine documentation for `Transformed::{update,map,transform})_data` [#10355](https://github.com/apache/datafusion/pull/10355) (alamb) +- Clarify docs explaining the relationship between `SessionState` and `SessionContext` [#10350](https://github.com/apache/datafusion/pull/10350) (alamb) +- Optimized push down filter #10291 [#10366](https://github.com/apache/datafusion/pull/10366) (dmitrybugakov) +- Unparser: Support `ORDER BY` in window function definition [#10370](https://github.com/apache/datafusion/pull/10370) (yyy1000) +- docs: Add DataFusion subprojects to navigation menu, other minor updates [#10362](https://github.com/apache/datafusion/pull/10362) (andygrove) +- feat: Add CrossJoin match case to unparser [#10371](https://github.com/apache/datafusion/pull/10371) (sardination) +- Minor: Do not force analyzer to copy logical plans [#10367](https://github.com/apache/datafusion/pull/10367) (alamb) +- Minor: Move Sum aggregate function test to slt [#10382](https://github.com/apache/datafusion/pull/10382) (jayzhan211) +- chore: remove DataPtr trait since Arc::ptr_eq ignores pointer metadata [#10378](https://github.com/apache/datafusion/pull/10378) (intoraw) +- Move `Covariance` (Sample) `covar` / `covar_samp` to be a User Defined Aggregate Function [#10372](https://github.com/apache/datafusion/pull/10372) (jayzhan211) +- Support limit in StreamingTableExec [#10309](https://github.com/apache/datafusion/pull/10309) (lewiszlw) +- Minor: Move count test to slt [#10383](https://github.com/apache/datafusion/pull/10383) (jayzhan211) +- [MINOR]: Reduce test run time [#10390](https://github.com/apache/datafusion/pull/10390) (mustafasrepo) +- Fix `coalesce`, `struct` and `named_strct` expr_fn function to take multiple arguments [#10321](https://github.com/apache/datafusion/pull/10321) (alamb) +- Minor: remove old `create_physical_expr` to `scalar_function` [#10387](https://github.com/apache/datafusion/pull/10387) (jayzhan211) +- Move average unit tests to slt [#10401](https://github.com/apache/datafusion/pull/10401) (lewiszlw) +- Move array_agg unit tests to slt [#10402](https://github.com/apache/datafusion/pull/10402) (lewiszlw) +- feat: run expression simplifier in a loop until a fixedpoint or 3 cycles [#10358](https://github.com/apache/datafusion/pull/10358) (erratic-pattern) +- Add `SessionContext`/`SessionState::create_physical_expr()` to create `PhysicalExpressions` from `Expr`s [#10330](https://github.com/apache/datafusion/pull/10330) (alamb) diff --git a/dev/requirements.txt b/dev/requirements.txt new file mode 100644 index 000000000000..7fcba0493129 --- /dev/null +++ b/dev/requirements.txt @@ -0,0 +1,2 @@ +tomlkit +PyGitHub \ No newline at end of file diff --git a/dev/update_datafusion_versions.py b/dev/update_datafusion_versions.py index 12b0a90d4ab6..74a8a2ebd5b6 100755 --- a/dev/update_datafusion_versions.py +++ b/dev/update_datafusion_versions.py @@ -29,13 +29,16 @@ crates = { 'datafusion-common': 'datafusion/common/Cargo.toml', + 'datafusion-common-runtime': 'datafusion/common-runtime/Cargo.toml', 'datafusion': 'datafusion/core/Cargo.toml', 'datafusion-execution': 'datafusion/execution/Cargo.toml', 'datafusion-expr': 'datafusion/expr/Cargo.toml', 'datafusion-functions': 'datafusion/functions/Cargo.toml', + 'datafusion-functions-aggregate': 'datafusion/functions-aggregate/Cargo.toml', 'datafusion-functions-array': 'datafusion/functions-array/Cargo.toml', 'datafusion-optimizer': 'datafusion/optimizer/Cargo.toml', 'datafusion-physical-expr': 'datafusion/physical-expr/Cargo.toml', + 'datafusion-physical-expr-common': 'datafusion/physical-expr-common/Cargo.toml', 'datafusion-physical-plan': 'datafusion/physical-plan/Cargo.toml', 'datafusion-proto': 'datafusion/proto/Cargo.toml', 'datafusion-sql': 'datafusion/sql/Cargo.toml', diff --git a/docs/source/user-guide/configs.md b/docs/source/user-guide/configs.md index db192d7807ef..ef2a2a4119e3 100644 --- a/docs/source/user-guide/configs.md +++ b/docs/source/user-guide/configs.md @@ -64,7 +64,7 @@ Environment variables are read during `SessionConfig` initialisation so they mus | datafusion.execution.parquet.statistics_enabled | NULL | Sets if statistics are enabled for any column Valid values are: "none", "chunk", and "page" These values are not case sensitive. If NULL, uses default parquet writer setting | | datafusion.execution.parquet.max_statistics_size | NULL | Sets max statistics size for any column. If NULL, uses default parquet writer setting | | datafusion.execution.parquet.max_row_group_size | 1048576 | Target maximum number of rows in each row group (defaults to 1M rows). Writing larger row groups requires more memory to write, but can get better compression and be faster to read. | -| datafusion.execution.parquet.created_by | datafusion version 37.1.0 | Sets "created by" property | +| datafusion.execution.parquet.created_by | datafusion version 38.0.0 | Sets "created by" property | | datafusion.execution.parquet.column_index_truncate_length | NULL | Sets column index truncate length | | datafusion.execution.parquet.data_page_row_count_limit | 18446744073709551615 | Sets best effort maximum number of rows in data page | | datafusion.execution.parquet.encoding | NULL | Sets default encoding for any column Valid values are: plain, plain_dictionary, rle, bit_packed, delta_binary_packed, delta_length_byte_array, delta_byte_array, rle_dictionary, and byte_stream_split. These values are not case sensitive. If NULL, uses default parquet writer setting |