Skip to content

Commit

Permalink
Update Parquet thrift generated structures (#6045)
Browse files Browse the repository at this point in the history
* update to latest thrift (as of 11 Jul 2024) from parquet-format

* pass None for optional size statistics

* escape HTML tags

* don't need to escape brackets in arrays
  • Loading branch information
etseidl authored Jul 16, 2024
1 parent 756b1fb commit fe04e09
Show file tree
Hide file tree
Showing 3 changed files with 339 additions and 65 deletions.
2 changes: 1 addition & 1 deletion parquet/regen.sh
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,7 @@
# specific language governing permissions and limitations
# under the License.

-REVISION=46cc3a0647d301bb9579ca8dd2cc356caf2a72d2
+REVISION=5b564f3c47679526cf72e54f207013f28f53acc4

SOURCE_DIR="$(cd "$(dirname "${BASH_SOURCE[0]:-$0}")" && pwd)"

Expand Down
5 changes: 4 additions & 1 deletion parquet/src/file/metadata/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -790,6 +790,7 @@ impl ColumnChunkMetaData {
.map(|vec| vec.iter().map(page_encoding_stats::to_thrift).collect()),
bloom_filter_offset: self.bloom_filter_offset,
bloom_filter_length: self.bloom_filter_length,
size_statistics: None,
}
}

Expand Down Expand Up @@ -1004,6 +1005,8 @@ impl ColumnIndexBuilder {
self.max_values,
self.boundary_order,
self.null_counts,
None,
None,
)
}
}
Expand Down Expand Up @@ -1052,7 +1055,7 @@ impl OffsetIndexBuilder {
.zip(self.first_row_index_array.iter())
.map(|((offset, size), row_index)| PageLocation::new(*offset, *size, *row_index))
.collect::<Vec<_>>();
-OffsetIndex::new(locations)
+OffsetIndex::new(locations, None)
}
}

Expand Down
Loading

0 comments on commit fe04e09

Please sign in to comment.