From 4e042908fe240c544172e71c0389f0db8ecc1ac4 Mon Sep 17 00:00:00 2001 From: Andrew Lamb Date: Tue, 25 Jun 2024 09:29:28 -0400 Subject: [PATCH] PARQUET-2139: Clarify ColumnChunk::file_offset is not used --- src/main/thrift/parquet.thrift | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/src/main/thrift/parquet.thrift b/src/main/thrift/parquet.thrift index 934b3cadd..b40d5bf4e 100644 --- a/src/main/thrift/parquet.thrift +++ b/src/main/thrift/parquet.thrift @@ -867,7 +867,12 @@ struct ColumnChunk { **/ 1: optional string file_path - /** Byte offset in file_path to the ColumnMetaData **/ + /** Byte offset in file_path to the ColumnMetaData. + Note: most writers include the ColumnMetaData inline (via meta_data). + While the presence of this field implies that ColumnMetaData can be + stored separately in the file, this is not supported by many implementations + which assume meta_data is set. + **/ 2: required i64 file_offset /** Column metadata for this chunk. This is the same content as what is at