From 5a9ef0d8ef52b999c67f751f06ec2d96f0e14d71 Mon Sep 17 00:00:00 2001 From: lancedb automation Date: Fri, 5 Jun 2026 12:01:29 +0000 Subject: [PATCH] chore: update lance dependency to v8.0.0-beta.4 --- Cargo.lock | 90 ++++++++++--------- Cargo.toml | 28 +++--- java/pom.xml | 2 +- .../src/dataloader/permutation/shuffle.rs | 4 +- 4 files changed, 67 insertions(+), 57 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index af372ab84..1f5e1b00b 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -3473,8 +3473,8 @@ checksum = "42703706b716c37f96a77aea830392ad231f44c9e9a67872fa5548707e11b11c" [[package]] name = "fsst" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow-array", "rand 0.9.4", @@ -4776,8 +4776,8 @@ checksum = "e037a2e1d8d5fdbd49b16a4ea09d5d6401c1f29eca5ff29d03d3824dba16256a" [[package]] name = "lance" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arc-swap", "arrow", @@ -4852,8 +4852,8 @@ dependencies = [ [[package]] name = "lance-arrow" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow-array", "arrow-buffer", @@ -4874,7 +4874,7 @@ dependencies = [ [[package]] name = "lance-arrow-scalar" version = "58.0.0" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow-array", "arrow-buffer", @@ -4888,7 +4888,7 @@ dependencies = [ [[package]] name = "lance-arrow-stats" version = "58.0.0" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow-array", "arrow-schema", @@ -4897,8 +4897,8 @@ dependencies = [ [[package]] name = "lance-bitpacking" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrayref", "paste", @@ -4907,8 +4907,8 @@ dependencies = [ [[package]] name = "lance-core" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow-array", "arrow-buffer", @@ -4943,8 +4943,8 @@ dependencies = [ [[package]] name = "lance-datafusion" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow", "arrow-array", @@ -4974,8 +4974,8 @@ dependencies = [ [[package]] name = "lance-datagen" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow", "arrow-array", @@ -4993,8 +4993,8 @@ dependencies = [ [[package]] name = "lance-encoding" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow-arith", "arrow-array", @@ -5029,8 +5029,8 @@ dependencies = [ [[package]] name = "lance-file" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow-arith", "arrow-array", @@ -5061,8 +5061,8 @@ dependencies = [ [[package]] name = "lance-index" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arc-swap", "arrow", @@ -5104,6 +5104,7 @@ dependencies = [ "lance-table", "lance-tokenizer", "libm", + "libsais-rs", "log", "ndarray", "num-traits", @@ -5128,8 +5129,8 @@ dependencies = [ [[package]] name = "lance-io" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow", "arrow-arith", @@ -5171,8 +5172,8 @@ dependencies = [ [[package]] name = "lance-linalg" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow-array", "arrow-buffer", @@ -5188,8 +5189,8 @@ dependencies = [ [[package]] name = "lance-namespace" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow", "async-trait", @@ -5201,8 +5202,8 @@ dependencies = [ [[package]] name = "lance-namespace-impls" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow", "arrow-ipc", @@ -5237,9 +5238,9 @@ dependencies = [ [[package]] name = "lance-namespace-reqwest-client" -version = "0.8.0" +version = "0.8.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3eefb02ded2c3d4b6b60669bb74822d9fa628e144fc748c79ee31f13f566e87b" +checksum = "7a09733325812e046cb217d548afc4864dedb59545389d45cd498b3d8ecb0d20" dependencies = [ "reqwest 0.12.28", "serde", @@ -5251,8 +5252,8 @@ dependencies = [ [[package]] name = "lance-select" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow-array", "arrow-buffer", @@ -5268,8 +5269,8 @@ dependencies = [ [[package]] name = "lance-table" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow", "arrow-array", @@ -5309,8 +5310,8 @@ dependencies = [ [[package]] name = "lance-testing" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "arrow-array", "arrow-schema", @@ -5323,8 +5324,8 @@ dependencies = [ [[package]] name = "lance-tokenizer" -version = "8.0.0-beta.2" -source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.2#f154b4e84942e5b8028f7f4a7a77b1d963107202" +version = "8.0.0-beta.4" +source = "git+https://github.com/lance-format/lance.git?tag=v8.0.0-beta.4#6b6c4866e5dda7c63742b33faabff18a99be3b99" dependencies = [ "icu_segmenter", "jieba-rs", @@ -5570,6 +5571,15 @@ dependencies = [ "libc", ] +[[package]] +name = "libsais-rs" +version = "0.2.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "40fe164dbd47ea0c20e78a121c980ef673326905f1d4fba55e3645a20ef6717f" +dependencies = [ + "rayon", +] + [[package]] name = "lindera" version = "3.0.7" diff --git a/Cargo.toml b/Cargo.toml index 26b5c8f5b..d07a3f4cb 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -13,20 +13,20 @@ categories = ["database-implementations"] rust-version = "1.91.0" [workspace.dependencies] -lance = { "version" = "=8.0.0-beta.2", default-features = false, "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-core = { "version" = "=8.0.0-beta.2", "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-datagen = { "version" = "=8.0.0-beta.2", "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-file = { "version" = "=8.0.0-beta.2", "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-io = { "version" = "=8.0.0-beta.2", default-features = false, "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-index = { "version" = "=8.0.0-beta.2", "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-linalg = { "version" = "=8.0.0-beta.2", "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-namespace = { "version" = "=8.0.0-beta.2", "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-namespace-impls = { "version" = "=8.0.0-beta.2", default-features = false, "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-table = { "version" = "=8.0.0-beta.2", "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-testing = { "version" = "=8.0.0-beta.2", "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-datafusion = { "version" = "=8.0.0-beta.2", "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-encoding = { "version" = "=8.0.0-beta.2", "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } -lance-arrow = { "version" = "=8.0.0-beta.2", "tag" = "v8.0.0-beta.2", "git" = "https://github.com/lance-format/lance.git" } +lance = { "version" = "=8.0.0-beta.4", default-features = false, "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-core = { "version" = "=8.0.0-beta.4", "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-datagen = { "version" = "=8.0.0-beta.4", "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-file = { "version" = "=8.0.0-beta.4", "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-io = { "version" = "=8.0.0-beta.4", default-features = false, "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-index = { "version" = "=8.0.0-beta.4", "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-linalg = { "version" = "=8.0.0-beta.4", "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-namespace = { "version" = "=8.0.0-beta.4", "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-namespace-impls = { "version" = "=8.0.0-beta.4", default-features = false, "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-table = { "version" = "=8.0.0-beta.4", "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-testing = { "version" = "=8.0.0-beta.4", "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-datafusion = { "version" = "=8.0.0-beta.4", "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-encoding = { "version" = "=8.0.0-beta.4", "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } +lance-arrow = { "version" = "=8.0.0-beta.4", "tag" = "v8.0.0-beta.4", "git" = "https://github.com/lance-format/lance.git" } ahash = "0.8" # Note that this one does not include pyarrow arrow = { version = "58.0.0", optional = false } diff --git a/java/pom.xml b/java/pom.xml index b4b271d70..f946be72e 100644 --- a/java/pom.xml +++ b/java/pom.xml @@ -28,7 +28,7 @@ UTF-8 15.0.0 - 8.0.0-beta.2 + 8.0.0-beta.4 false 2.30.0 1.7 diff --git a/rust/lancedb/src/dataloader/permutation/shuffle.rs b/rust/lancedb/src/dataloader/permutation/shuffle.rs index b26db7bea..6c0e35d7d 100644 --- a/rust/lancedb/src/dataloader/permutation/shuffle.rs +++ b/rust/lancedb/src/dataloader/permutation/shuffle.rs @@ -203,11 +203,11 @@ impl Shuffler { // Finish writing files for (file_idx, mut writer) in file_writers.into_iter().enumerate() { - let num_written = writer.finish().await?; + let write_summary = writer.finish().await?; log::debug!( "Shuffle job {}: wrote {} rows to file {}", self.id, - num_written, + write_summary.num_rows, file_idx ); }