|
13 | 13 | //! This module provides structures for efficient batch processing, focusing on file action |
14 | 14 | //! deduplication with `FileActionDeduplicator` which tracks unique files across log batches |
15 | 15 | //! to minimize memory usage for tables with extensive history. |
16 | | -use crate::actions::deletion_vector::DeletionVectorDescriptor; |
17 | | -use crate::engine_data::{GetData, TypedGetData}; |
| 16 | +use crate::engine_data::GetData; |
18 | 17 | use crate::log_replay::deduplicator::Deduplicator; |
19 | 18 | use crate::scan::data_skipping::DataSkippingFilter; |
20 | 19 | use crate::{DeltaResult, EngineData}; |
@@ -90,35 +89,6 @@ impl<'seen> FileActionDeduplicator<'seen> { |
90 | 89 | remove_dv_start_index, |
91 | 90 | } |
92 | 91 | } |
93 | | - |
94 | | - /// Extracts the deletion vector unique ID if it exists. |
95 | | - /// |
96 | | - /// This function retrieves the necessary fields for constructing a deletion vector unique ID |
97 | | - /// by accessing `getters` at `dv_start_index` and the following two indices. Specifically: |
98 | | - /// - `dv_start_index` retrieves the storage type (`deletionVector.storageType`). |
99 | | - /// - `dv_start_index + 1` retrieves the path or inline deletion vector (`deletionVector.pathOrInlineDv`). |
100 | | - /// - `dv_start_index + 2` retrieves the optional offset (`deletionVector.offset`). |
101 | | - fn extract_dv_unique_id<'a>( |
102 | | - &self, |
103 | | - i: usize, |
104 | | - getters: &[&'a dyn GetData<'a>], |
105 | | - dv_start_index: usize, |
106 | | - ) -> DeltaResult<Option<String>> { |
107 | | - match getters[dv_start_index].get_opt(i, "deletionVector.storageType")? { |
108 | | - Some(storage_type) => { |
109 | | - let path_or_inline = |
110 | | - getters[dv_start_index + 1].get(i, "deletionVector.pathOrInlineDv")?; |
111 | | - let offset = getters[dv_start_index + 2].get_opt(i, "deletionVector.offset")?; |
112 | | - |
113 | | - Ok(Some(DeletionVectorDescriptor::unique_id_from_parts( |
114 | | - storage_type, |
115 | | - path_or_inline, |
116 | | - offset, |
117 | | - ))) |
118 | | - } |
119 | | - None => Ok(None), |
120 | | - } |
121 | | - } |
122 | 92 | } |
123 | 93 |
|
124 | 94 | impl<'seen> Deduplicator for FileActionDeduplicator<'seen> { |
|
0 commit comments