mirror of
https://github.com/ModernRelay/omnigraph.git
synced 2026-07-03 02:51:04 +02:00
iss-merge-rowid-overlap-corrupts-filtered-reads / lance#7444: an
update-style merge_insert over a merge-written fragment legally reuses the
updated rows' stable row ids (row-id-lineage spec: updates preserve
_rowid) while the superseded fragment keeps its full sequence plus a
deletion vector. A later delete leaves the overlapping id range sparsely
tiled, and lance-table 7.0.0's RowIdIndex::new asserted dense tiling —
failing every filtered read that builds the id→address map ("Wrong range"
debug assert; "all columns in a record batch must have the same length"
or a silently-wrong batch in release).
The upstream fix (lance#7480, merged 2026-07-01) landed hours AFTER
v8.0.0 was cut, so no release ≤ 8.0.0 carries it. Consume it now as a
vendored pin: vendor/lance-table is the pristine published 7.0.0 source
plus ONLY the #7480 rowids/index.rs hunk (drop the false tiling assert;
hard-error on the true invariant — one live id claimed by two fragments)
and upstream's regression unit test, wired via [patch.crates-io]. The fix
is read-side only, so already-written graphs become readable as-is — no
data repair.
Removal condition (see vendor/lance-table/README.omnigraph.md): drop the
vendor dir + patch entry at the first Lance bump whose lance-table ships
lance#7480 (9.0.0, or a backported 8.0.1). The surface guard
filtered_scan_tolerates_merge_update_row_id_overlap keeps that honest in
both directions.
Turns the previous commit's red tests green. Full workspace gate passes
(cargo test --workspace --locked --no-fail-fast, 68 suites).
263 lines
4.5 KiB
TOML
263 lines
4.5 KiB
TOML
# THIS FILE IS AUTOMATICALLY GENERATED BY CARGO
|
|
#
|
|
# When uploading crates to the registry Cargo will automatically
|
|
# "normalize" Cargo.toml files for maximal compatibility
|
|
# with all versions of Cargo and also rewrite `path` dependencies
|
|
# to registry (e.g., crates.io) dependencies.
|
|
#
|
|
# If you are reading this file be aware that the original Cargo.toml
|
|
# will likely look very different (and much more reasonable).
|
|
# See Cargo.toml.orig for the original contents.
|
|
|
|
[package]
|
|
edition = "2024"
|
|
rust-version = "1.91.0"
|
|
name = "lance-table"
|
|
version = "7.0.0"
|
|
authors = ["Lance Devs <dev@lance.org>"]
|
|
build = "build.rs"
|
|
autolib = false
|
|
autobins = false
|
|
autoexamples = false
|
|
autotests = false
|
|
autobenches = false
|
|
description = "Utilities for the Lance table format"
|
|
readme = "README.md"
|
|
keywords = [
|
|
"data-format",
|
|
"data-science",
|
|
"machine-learning",
|
|
"apache-arrow",
|
|
"data-analytics",
|
|
]
|
|
categories = [
|
|
"database-implementations",
|
|
"data-structures",
|
|
"development-tools",
|
|
"science",
|
|
]
|
|
license = "Apache-2.0"
|
|
repository = "https://github.com/lance-format/lance"
|
|
|
|
[package.metadata.docs.rs]
|
|
features = ["protoc"]
|
|
|
|
[features]
|
|
dynamodb = [
|
|
"dep:aws-sdk-dynamodb",
|
|
"dep:aws-credential-types",
|
|
"lance-io/aws",
|
|
]
|
|
protoc = ["dep:protobuf-src"]
|
|
|
|
[lib]
|
|
name = "lance_table"
|
|
path = "src/lib.rs"
|
|
|
|
[[bench]]
|
|
name = "manifest_intern"
|
|
path = "benches/manifest_intern.rs"
|
|
harness = false
|
|
|
|
[[bench]]
|
|
name = "row_id_index"
|
|
path = "benches/row_id_index.rs"
|
|
harness = false
|
|
|
|
[dependencies.arrow]
|
|
version = "58.0.0"
|
|
features = ["prettyprint"]
|
|
|
|
[dependencies.arrow-array]
|
|
version = "58.0.0"
|
|
|
|
[dependencies.arrow-buffer]
|
|
version = "58.0.0"
|
|
|
|
[dependencies.arrow-ipc]
|
|
version = "58.0.0"
|
|
features = ["zstd"]
|
|
|
|
[dependencies.arrow-schema]
|
|
version = "58.0.0"
|
|
|
|
[dependencies.async-trait]
|
|
version = "0.1"
|
|
|
|
[dependencies.aws-credential-types]
|
|
version = "1.2.0"
|
|
optional = true
|
|
|
|
[dependencies.aws-sdk-dynamodb]
|
|
version = "1.38.0"
|
|
features = [
|
|
"default-https-client",
|
|
"rt-tokio",
|
|
]
|
|
optional = true
|
|
default-features = false
|
|
|
|
[dependencies.byteorder]
|
|
version = "1.5"
|
|
|
|
[dependencies.bytes]
|
|
version = "1.11.1"
|
|
|
|
[dependencies.chrono]
|
|
version = "0.4.41"
|
|
features = [
|
|
"std",
|
|
"now",
|
|
"serde",
|
|
]
|
|
default-features = false
|
|
|
|
[dependencies.deepsize]
|
|
version = "0.2.0"
|
|
|
|
[dependencies.futures]
|
|
version = "0.3"
|
|
|
|
[dependencies.lance-arrow]
|
|
version = "=7.0.0"
|
|
|
|
[dependencies.lance-core]
|
|
version = "=7.0.0"
|
|
|
|
[dependencies.lance-file]
|
|
version = "=7.0.0"
|
|
|
|
[dependencies.lance-io]
|
|
version = "=7.0.0"
|
|
default-features = false
|
|
|
|
[dependencies.log]
|
|
version = "0.4"
|
|
|
|
[dependencies.object_store]
|
|
version = "0.13.2"
|
|
|
|
[dependencies.prost]
|
|
version = "0.14.1"
|
|
|
|
[dependencies.prost-types]
|
|
version = "0.14.1"
|
|
|
|
[dependencies.rand]
|
|
version = "0.9.1"
|
|
features = ["small_rng"]
|
|
|
|
[dependencies.rangemap]
|
|
version = "1.0"
|
|
|
|
[dependencies.roaring]
|
|
version = "0.11"
|
|
|
|
[dependencies.semver]
|
|
version = "1.0"
|
|
|
|
[dependencies.serde]
|
|
version = "^1"
|
|
|
|
[dependencies.serde_json]
|
|
version = "1"
|
|
|
|
[dependencies.snafu]
|
|
version = "0.9"
|
|
|
|
[dependencies.tokio]
|
|
version = "1.23"
|
|
features = [
|
|
"rt-multi-thread",
|
|
"macros",
|
|
"fs",
|
|
"sync",
|
|
]
|
|
|
|
[dependencies.tracing]
|
|
version = "0.1"
|
|
|
|
[dependencies.url]
|
|
version = "2.5.7"
|
|
|
|
[dependencies.uuid]
|
|
version = "1.2"
|
|
features = [
|
|
"v4",
|
|
"serde",
|
|
]
|
|
|
|
[dev-dependencies.arrow-schema]
|
|
version = "58.0.0"
|
|
|
|
[dev-dependencies.criterion]
|
|
version = "0.5"
|
|
features = [
|
|
"async",
|
|
"async_tokio",
|
|
"html_reports",
|
|
]
|
|
|
|
[dev-dependencies.lance-datagen]
|
|
version = "=7.0.0"
|
|
|
|
[dev-dependencies.pretty_assertions]
|
|
version = "1.4.0"
|
|
|
|
[dev-dependencies.proptest]
|
|
version = "1.3.1"
|
|
|
|
[dev-dependencies.rstest]
|
|
version = "0.23.0"
|
|
|
|
[build-dependencies.prost-build]
|
|
version = "0.14.1"
|
|
|
|
[build-dependencies.protobuf-src]
|
|
version = "2.1"
|
|
optional = true
|
|
|
|
[target.'cfg(target_os = "linux")'.dev-dependencies.pprof]
|
|
version = "0.14.0"
|
|
features = [
|
|
"flamegraph",
|
|
"criterion",
|
|
]
|
|
|
|
[lints.clippy]
|
|
dbg_macro = "deny"
|
|
disallowed_macros = "deny"
|
|
fallible_impl_from = "deny"
|
|
large_futures = "deny"
|
|
manual_let_else = "deny"
|
|
multiple-crate-versions = "allow"
|
|
print_stderr = "deny"
|
|
print_stdout = "deny"
|
|
redundant_clone = "deny"
|
|
redundant_pub_crate = "deny"
|
|
single_range_in_vec_init = "allow"
|
|
string_add = "deny"
|
|
string_add_assign = "deny"
|
|
string_lit_as_bytes = "deny"
|
|
trait_duplication_in_bounds = "deny"
|
|
use_self = "deny"
|
|
|
|
[lints.clippy.all]
|
|
level = "deny"
|
|
priority = -1
|
|
|
|
[lints.clippy.cargo]
|
|
level = "deny"
|
|
priority = -1
|
|
|
|
[lints.clippy.style]
|
|
level = "deny"
|
|
priority = -1
|
|
|
|
[lints.rust]
|
|
unsafe_op_in_unsafe_fn = "allow"
|
|
|
|
[lints.rust.unexpected_cfgs]
|
|
level = "warn"
|
|
priority = 0
|
|
check-cfg = ["cfg(coverage,coverage_nightly)"]
|