From 9d0ff4260def60789e3923bf5a1e61142f7b5c2c Mon Sep 17 00:00:00 2001 From: Antoine Pitrou Date: Tue, 21 May 2024 16:11:23 +0200 Subject: [PATCH] GH-41748: [Python][Parquet] Update BYTE_STREAM_SPLIT description in write_table() docstring --- python/pyarrow/parquet/core.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/python/pyarrow/parquet/core.py b/python/pyarrow/parquet/core.py index f54a203c8794c..81798b1544474 100644 --- a/python/pyarrow/parquet/core.py +++ b/python/pyarrow/parquet/core.py @@ -797,8 +797,9 @@ def _sanitize_table(table, new_schema, flavor): Specify if the byte_stream_split encoding should be used in general or only for some columns. If both dictionary and byte_stream_stream are enabled, then dictionary is preferred. - The byte_stream_split encoding is valid only for floating-point data types - and should be combined with a compression codec. + The byte_stream_split encoding is valid for integer, floating-point + and fixed-size binary data types (including decimals); it should be + combined with a compression codec so as to achieve size reduction. column_encoding : string or dict, default None Specify the encoding scheme on a per column basis. Can only be used when ``use_dictionary`` is set to False, and