Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
32 commits
Select commit Hold shift + click to select a range
f5b5338
feat(datafusion): add IcebergPartitionedTableProvider and IcebergPart…
toutane Mar 31, 2026
5076f9e
docs(datafusion): update comment in IcebergPartitionedScan
toutane Mar 31, 2026
4c4b962
Update crates/integrations/datafusion/src/table/mod.rs
toutane Apr 20, 2026
6a8e1e3
fix(datafusion): reject non-empty children in IcebergPartitionedScan:…
toutane Apr 20, 2026
bf9d689
fix(datafusion): use ArrowReaderBuilder existing configuration path
toutane Apr 21, 2026
e7c1a48
feat(datafusion): bucket FileScanTasks across target_partitions with …
timsaucer Apr 24, 2026
8770e0c
feat(datafusion): mark identity-partition filters as Exact pushdown
timsaucer Apr 24, 2026
e0d6add
feat(datafusion): allow Exact pushdown across spec evolution via per-…
timsaucer Apr 24, 2026
f25c911
Revert "feat(datafusion): allow Exact pushdown across spec evolution …
toutane Apr 28, 2026
5093b82
Revert "feat(datafusion): mark identity-partition filters as Exact pu…
toutane Apr 28, 2026
34d6f4c
refactor(datafusion): merge IcebergPartitionedTableProvider into Iceb…
toutane Apr 28, 2026
00527f8
refactor(datafusion): polish scan API and add bucketing tests
toutane Apr 29, 2026
c0ffb36
test(sqllogictest): update EXPLAIN snapshots for eager bucketing output
toutane Apr 29, 2026
89bc410
fix(datafusion): resolve conflicts
toutane Apr 29, 2026
d83b29b
refactor(datafusion): read preplanned tasks with ArrowReaderBuilder
toutane Jun 15, 2026
c29c059
refactor(datafusion): distinguish lazy and eager scan buckets
toutane Jun 15, 2026
c748e23
refactor(datafusion): introduce IcebergTableScanBuilder
toutane Jun 15, 2026
cd2b68b
perf(datafusion): avoid cloning task buckets during execute
toutane Jun 15, 2026
8fe57aa
refactor(datafusion): centralize scan stream error mapping
toutane Jun 15, 2026
ace9b7e
test(datafusion): verify identity bucket hashes match repartitioning
toutane Jun 15, 2026
f3ac17d
fix(datafusion): reuse eager scan predicates during execution
toutane Jun 15, 2026
b6369e2
perf(datafusion): batch identity partition hashing
toutane Jun 15, 2026
6f17acf
refactor(datafusion): share Iceberg scan config
toutane Jun 15, 2026
971aa0f
fix(datafusion): use unknown partitioning for empty eager scans
toutane Jun 16, 2026
2802af4
test(datafusion): cover hash partitioning fallback cases
toutane Jun 16, 2026
f4c407f
fix(datafusion): give table runtime to ArrowReaderBuilder::new()
toutane Jun 16, 2026
277ee9c
fix(datafusion): give table runtime to table_with_additional_partitio…
toutane Jun 16, 2026
41ae275
fix(datafusion): make check green
toutane Jun 16, 2026
3d0297b
refactor(datafusion): reuse iceberg::util::available_parallelism
toutane Jun 16, 2026
39da3c0
docs(datafusion): note count-based bucketing limitation
toutane Jun 16, 2026
eff04fb
docs(datafusion): explain conservative multi-spec bucketing gate
toutane Jun 16, 2026
d54684d
fix: generate-public-api
toutane Jun 16, 2026
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 9 additions & 0 deletions crates/iceberg/public-api.txt
Original file line number Diff line number Diff line change
Expand Up @@ -86,6 +86,11 @@ pub fn iceberg::arrow::PartitionValueCalculator::partition_type(&self) -> &icebe
pub fn iceberg::arrow::PartitionValueCalculator::try_new(partition_spec: &iceberg::spec::PartitionSpec, table_schema: &iceberg::spec::Schema) -> iceberg::Result<Self>
impl core::fmt::Debug for iceberg::arrow::PartitionValueCalculator
pub fn iceberg::arrow::PartitionValueCalculator::fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result
pub struct iceberg::arrow::PrimitiveLiteralArrayBuilder
impl iceberg::arrow::PrimitiveLiteralArrayBuilder
pub fn iceberg::arrow::PrimitiveLiteralArrayBuilder::append_or_null(&mut self, prim_lit: core::option::Option<&iceberg::spec::PrimitiveLiteral>) -> iceberg::Result<bool>
pub fn iceberg::arrow::PrimitiveLiteralArrayBuilder::finish(self) -> iceberg::Result<arrow_array::array::ArrayRef>
pub fn iceberg::arrow::PrimitiveLiteralArrayBuilder::try_new(data_type: &arrow_schema::datatype::DataType, capacity: usize) -> iceberg::Result<Self>
pub struct iceberg::arrow::RecordBatchPartitionSplitter
impl iceberg::arrow::RecordBatchPartitionSplitter
pub fn iceberg::arrow::RecordBatchPartitionSplitter::split(&self, batch: &arrow_array::record_batch::RecordBatch) -> iceberg::Result<alloc::vec::Vec<(iceberg::spec::PartitionKey, arrow_array::record_batch::RecordBatch)>>
Expand Down Expand Up @@ -127,6 +132,7 @@ pub fn iceberg::arrow::arrow_schema_to_schema(schema: &arrow_schema::schema::Sch
pub fn iceberg::arrow::arrow_schema_to_schema_auto_assign_ids(schema: &arrow_schema::schema::Schema) -> iceberg::Result<iceberg::spec::Schema>
pub fn iceberg::arrow::arrow_struct_to_literal(struct_array: &arrow_array::array::ArrayRef, ty: &iceberg::spec::StructType) -> iceberg::Result<alloc::vec::Vec<core::option::Option<iceberg::spec::Literal>>>
pub fn iceberg::arrow::arrow_type_to_type(ty: &arrow_schema::datatype::DataType) -> iceberg::Result<iceberg::spec::Type>
pub fn iceberg::arrow::create_primitive_array_single_element(data_type: &arrow_schema::datatype::DataType, prim_lit: &core::option::Option<iceberg::spec::PrimitiveLiteral>) -> iceberg::Result<arrow_array::array::ArrayRef>
pub fn iceberg::arrow::datum_to_arrow_type_with_ree(datum: &iceberg::spec::Datum) -> arrow_schema::datatype::DataType
pub fn iceberg::arrow::schema_to_arrow_schema(schema: &iceberg::spec::Schema) -> iceberg::Result<arrow_schema::schema::Schema>
pub fn iceberg::arrow::strip_metadata_from_schema(schema: &arrow_schema::schema::Schema) -> iceberg::Result<arrow_schema::schema::Schema>
Expand Down Expand Up @@ -1289,6 +1295,7 @@ pub fn iceberg::scan::TableScan::column_names(&self) -> core::option::Option<&[a
pub async fn iceberg::scan::TableScan::plan_files(&self) -> iceberg::Result<iceberg::scan::FileScanTaskStream>
pub fn iceberg::scan::TableScan::snapshot(&self) -> core::option::Option<&iceberg::spec::SnapshotRef>
pub async fn iceberg::scan::TableScan::to_arrow(&self) -> iceberg::Result<iceberg::scan::ArrowRecordBatchStream>
pub fn iceberg::scan::TableScan::to_arrow_from_tasks(&self, tasks: iceberg::scan::FileScanTaskStream) -> iceberg::Result<iceberg::scan::ArrowRecordBatchStream>
impl core::fmt::Debug for iceberg::scan::TableScan
pub fn iceberg::scan::TableScan::fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result
pub struct iceberg::scan::TableScanBuilder<'a>
Expand Down Expand Up @@ -3034,6 +3041,7 @@ pub fn iceberg::table::Table::metadata_location_result(&self) -> iceberg::Result
pub fn iceberg::table::Table::metadata_ref(&self) -> iceberg::spec::TableMetadataRef
pub fn iceberg::table::Table::reader_builder(&self) -> iceberg::arrow::ArrowReaderBuilder
pub fn iceberg::table::Table::readonly(&self) -> bool
pub fn iceberg::table::Table::runtime(&self) -> &iceberg::Runtime
pub fn iceberg::table::Table::scan(&self) -> iceberg::scan::TableScanBuilder<'_>
impl core::clone::Clone for iceberg::table::Table
pub fn iceberg::table::Table::clone(&self) -> iceberg::table::Table
Expand Down Expand Up @@ -3094,6 +3102,7 @@ pub mod iceberg::util
pub mod iceberg::util::snapshot
pub fn iceberg::util::snapshot::ancestors_between(table_metadata: &iceberg::spec::TableMetadataRef, latest_snapshot_id: i64, oldest_snapshot_id: core::option::Option<i64>) -> impl core::iter::traits::iterator::Iterator<Item = iceberg::spec::SnapshotRef> + core::marker::Send
pub fn iceberg::util::snapshot::ancestors_of(table_metadata: &iceberg::spec::TableMetadataRef, snapshot_id: i64) -> impl core::iter::traits::iterator::Iterator<Item = iceberg::spec::SnapshotRef> + core::marker::Send
pub fn iceberg::util::available_parallelism() -> core::num::nonzero::NonZeroUsize
pub mod iceberg::writer
pub mod iceberg::writer::base_writer
pub mod iceberg::writer::base_writer::data_file_writer
Expand Down
Loading
Loading