@@ -280,7 +280,7 @@ struct Statistics {
280280 */
281281 1: optional binary max ;
282282 2: optional binary min ;
283- /**
283+ /**
284284 * Count of null values in the column.
285285 *
286286 * Writers SHOULD always write this field even if it is zero (i.e. no null value)
@@ -717,7 +717,7 @@ struct DictionaryPageHeader {
717717 * The remaining section containing the data is compressed if is_compressed is true
718718 *
719719 * Implementation note - this header is not necessarily a strict improvement over
720- * `DataPageHeader` (in particular the original header might provide better compression
720+ * `DataPageHeader` (in particular the original header might provide better compression
721721 * in some scenarios). Page indexes require pages to start and end at row boundaries,
722722 * regardless of which page header is used.
723723 **/
@@ -897,7 +897,7 @@ struct ColumnMetaData {
897897 /** total byte size of all uncompressed pages in this column chunk (including the headers) **/
898898 6: required i64 total_uncompressed_size
899899
900- /** total byte size of all compressed, and potentially encrypted, pages
900+ /** total byte size of all compressed, and potentially encrypted, pages
901901 * in this column chunk (including the headers) **/
902902 7: required i64 total_compressed_size
903903
@@ -964,19 +964,19 @@ struct ColumnChunk {
964964 /** File where column data is stored. If not set, assumed to be same file as
965965 * metadata. This path is relative to the current file.
966966 *
967- * As of December 2025, the only known use-case for this field is writing summary
968- * parquet files (i.e. "_metadata" files). These files consolidate footers from
969- * multiple parquet files to allow for efficient reading of footers to avoid file
967+ * As of December 2025, the only known use-case for this field is writing summary
968+ * parquet files (i.e. "_metadata" files). These files consolidate footers from
969+ * multiple parquet files to allow for efficient reading of footers to avoid file
970970 * listing costs and prune out files that do not need to be read based on statistics.
971971 *
972972 * These files do not appear to have ever been formally specified in the specification
973973 * and are potentially problematic from a correctness perspective [1].
974- *
974+ *
975975 * [1] https://lists.apache.org/thread/ootf2kmyg3p01b1bvplpvp4ftd1bt72d
976976 *
977- * There is no other known usage of this field. Specifically, there are no known
978- * reference implementations that will read externally stored column data if this field is populated
979- * within a standard parquet file. Making use of the field for this purpose is
977+ * There is no other known usage of this field. Specifically, there are no known
978+ * reference implementations that will read externally stored column data if this field is populated
979+ * within a standard parquet file. Making use of the field for this purpose is
980980 * not considered part of the Parquet specification.
981981 **/
982982 1: optional string file_path
@@ -1039,10 +1039,10 @@ struct RowGroup {
10391039 * in this row group **/
10401040 5: optional i64 file_offset
10411041
1042- /** Total byte size of all compressed (and potentially encrypted) column data
1042+ /** Total byte size of all compressed (and potentially encrypted) column data
10431043 * in this row group **/
10441044 6: optional i64 total_compressed_size
1045-
1045+
10461046 /** Row group ordinal in the file **/
10471047 7: optional i16 ordinal
10481048}
@@ -1119,7 +1119,7 @@ union ColumnOrder {
11191119 * - If the min is +0, the row group may contain -0 values as well.
11201120 * - If the max is -0, the row group may contain +0 values as well.
11211121 * - When looking for NaN values, min and max should be ignored.
1122- *
1122+ *
11231123 * When writing statistics the following rules should be followed:
11241124 * - NaNs should not be written to min or max statistics fields.
11251125 * - If the computed max value is zero (whether negative or positive),
@@ -1212,13 +1212,13 @@ struct ColumnIndex {
12121212 4: required BoundaryOrder boundary_order
12131213
12141214 /**
1215- * A list containing the number of null values for each page
1215+ * A list containing the number of null values for each page
12161216 *
12171217 * Writers SHOULD always write this field even if no null values
12181218 * are present or the column is not nullable.
1219- * Readers MUST distinguish between null_counts not being present
1219+ * Readers MUST distinguish between null_counts not being present
12201220 * and null_count being 0.
1221- * If null_counts are not present, readers MUST NOT assume all
1221+ * If null_counts are not present, readers MUST NOT assume all
12221222 * null counts are 0.
12231223 */
12241224 5: optional list<i64> null_counts
@@ -1275,12 +1275,12 @@ union EncryptionAlgorithm {
12751275 * Description for file metadata
12761276 */
12771277struct FileMetaData {
1278- /** Version of this file
1279- *
1280- * As of December 2025, there is no agreed upon consensus of what constitutes
1281- * version 2 of the file. For maximum compatibility with readers, writers should
1282- * always populate "1" for version. For maximum compatibility with writers,
1283- * readers should accept "1" and "2" interchangeably. All other versions are
1278+ /** Version of this file
1279+ *
1280+ * As of December 2025, there is no agreed upon consensus of what constitutes
1281+ * version 2 of the file. For maximum compatibility with readers, writers should
1282+ * always populate "1" for version. For maximum compatibility with writers,
1283+ * readers should accept "1" and "2" interchangeably. All other versions are
12841284 * reserved for potential future use-cases.
12851285 */
12861286 1: required i32 version
@@ -1326,30 +1326,30 @@ struct FileMetaData {
13261326 */
13271327 7: optional list<ColumnOrder> column_orders ;
13281328
1329- /**
1329+ /**
13301330 * Encryption algorithm. This field is set only in encrypted files
13311331 * with plaintext footer. Files with encrypted footer store algorithm id
13321332 * in FileCryptoMetaData structure.
13331333 */
13341334 8: optional EncryptionAlgorithm encryption_algorithm
13351335
1336- /**
1337- * Retrieval metadata of key used for signing the footer.
1338- * Used only in encrypted files with plaintext footer.
1339- */
1336+ /**
1337+ * Retrieval metadata of key used for signing the footer.
1338+ * Used only in encrypted files with plaintext footer.
1339+ */
13401340 9: optional binary footer_signing_key_metadata
13411341}
13421342
13431343/** Crypto metadata for files with encrypted footer **/
13441344struct FileCryptoMetaData {
1345- /**
1345+ /**
13461346 * Encryption algorithm. This field is only used for files
13471347 * with encrypted footer. Files with plaintext footer store algorithm id
13481348 * inside footer (FileMetaData structure).
13491349 */
13501350 1: required EncryptionAlgorithm encryption_algorithm
1351-
1352- /** Retrieval metadata of key used for encryption of footer,
1351+
1352+ /** Retrieval metadata of key used for encryption of footer,
13531353 * and (possibly) columns **/
13541354 2: optional binary key_metadata
13551355}
0 commit comments