apache
diff --git a/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpCompression.java b/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpCompression.java
Lines changed: 4 additions & 8 deletions
diff --git a/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpConstants.java b/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpConstants.java
Lines changed: 2 additions & 2 deletions
diff --git a/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpSampler.java b/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpSampler.java
Lines changed: 4 additions & 9 deletions
diff --git a/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpValuesReader.java b/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpValuesReader.java
Lines changed: 4 additions & 8 deletions
diff --git a/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpWrapper.java b/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpWrapper.java
Lines changed: 32 additions & 45 deletions
@@ -89,8 +89,7 @@ void store(byte[] output, int offset) {
     }
 
     void storeDataOnly(byte[] output, int offset) {
-      ByteBuffer buf =
-          ByteBuffer.wrap(output, offset, dataStoredSize()).order(ByteOrder.LITTLE_ENDIAN);
+      ByteBuffer buf = ByteBuffer.wrap(output, offset, dataStoredSize()).order(ByteOrder.LITTLE_ENDIAN);
       storeDataTo(buf);
     }
 
@@ -169,8 +168,7 @@ void store(byte[] output, int offset) {
     }
 
     void storeDataOnly(byte[] output, int offset) {
-      ByteBuffer buf =
-          ByteBuffer.wrap(output, offset, dataStoredSize()).order(ByteOrder.LITTLE_ENDIAN);
+      ByteBuffer buf = ByteBuffer.wrap(output, offset, dataStoredSize()).order(ByteOrder.LITTLE_ENDIAN);
       storeDataTo(buf);
     }
 
@@ -212,8 +210,7 @@ static DoubleCompressedVector load(byte[] input, int offset, int numElements) {
 
   // ========== Compress float ==========
 
-  static FloatCompressedVector compressFloatVector(
-      float[] input, int count, AlpEncodingPreset preset) {
+  static FloatCompressedVector compressFloatVector(float[] input, int count, AlpEncodingPreset preset) {
     if (count == 0) {
       FloatCompressedVector r = new FloatCompressedVector();
       r.packedValues = new byte[0];
@@ -321,8 +318,7 @@ static void decompressFloatVector(FloatCompressedVector v, float[] output) {
 
   // ========== Compress double ==========
 
-  static DoubleCompressedVector compressDoubleVector(
-      double[] input, int count, AlpEncodingPreset preset) {
+  static DoubleCompressedVector compressDoubleVector(double[] input, int count, AlpEncodingPreset preset) {
     if (count == 0) {
       DoubleCompressedVector r = new DoubleCompressedVector();
       r.packedValues = new byte[0];
 
@@ -88,8 +88,8 @@ private AlpConstants() {
 
   // Negative powers of 10 as double, matching C++ PowerOfTenDouble(-power).
   static final double[] DOUBLE_POW10_NEGATIVE = {
-    1e0, 1e-1, 1e-2, 1e-3, 1e-4, 1e-5, 1e-6, 1e-7, 1e-8, 1e-9, 1e-10,
-    1e-11, 1e-12, 1e-13, 1e-14, 1e-15, 1e-16, 1e-17, 1e-18
+    1e0, 1e-1, 1e-2, 1e-3, 1e-4, 1e-5, 1e-6, 1e-7, 1e-8, 1e-9, 1e-10, 1e-11, 1e-12, 1e-13, 1e-14, 1e-15, 1e-16,
+    1e-17, 1e-18
   };
 
   // ========== Per-vector metadata sizes ==========
 
@@ -21,7 +21,6 @@
 import static org.apache.parquet.column.values.alp.AlpConstants.*;
 
 import java.util.ArrayList;
-import java.util.Arrays;
 import java.util.HashMap;
 import java.util.List;
 import java.util.Map;
@@ -63,8 +62,7 @@ void addSample(float[] data, int count) {
     }
 
     private void addSampleVector(float[] data, int offset, int length) {
-      boolean mustSkip = mustSkipSamplingFromCurrentVector(
-          vectorsCount, vectorsSampledCount, length);
+      boolean mustSkip = mustSkipSamplingFromCurrentVector(vectorsCount, vectorsSampledCount, length);
       vectorsCount++;
       totalValuesCount += length;
       if (mustSkip) {
@@ -129,8 +127,7 @@ void addSample(double[] data, int count) {
     }
 
     private void addSampleVector(double[] data, int offset, int length) {
-      boolean mustSkip = mustSkipSamplingFromCurrentVector(
-          vectorsCount, vectorsSampledCount, length);
+      boolean mustSkip = mustSkipSamplingFromCurrentVector(vectorsCount, vectorsSampledCount, length);
       vectorsCount++;
       totalValuesCount += length;
       if (mustSkip) {
@@ -209,8 +206,7 @@ private static long estimateFloatCompressedSize(
     return estimatedSize;
   }
 
-  static AlpCompression.AlpEncodingPreset createFloatEncodingPreset(
-      List<float[]> vectorsSampled) {
+  static AlpCompression.AlpEncodingPreset createFloatEncodingPreset(List<float[]> vectorsSampled) {
     // For each sampled vector, find the best (e,f) combo by estimated compressed size.
     // Count how many times each best combo appears across all sampled vectors.
     Map<Long, int[]> bestCombosCount = new HashMap<>(); // key = e<<8|f, value = [count]
@@ -299,8 +295,7 @@ private static long estimateDoubleCompressedSize(
     return estimatedSize;
   }
 
-  static AlpCompression.AlpEncodingPreset createDoubleEncodingPreset(
-      List<double[]> vectorsSampled) {
+  static AlpCompression.AlpEncodingPreset createDoubleEncodingPreset(List<double[]> vectorsSampled) {
     Map<Long, int[]> bestCombosCount = new HashMap<>();
 
     for (double[] sample : vectorsSampled) {
 
@@ -48,8 +48,7 @@ abstract class AlpValuesReader extends ValuesReader {
   public void initFromPage(int valueCount, ByteBufferInputStream stream) throws IOException {
     int available = (int) stream.available();
     if (available < HEADER_SIZE) {
-      throw new ParquetDecodingException(
-          "ALP page too small for header: " + available + " bytes");
+      throw new ParquetDecodingException("ALP page too small for header: " + available + " bytes");
     }
 
     // Read header
@@ -63,12 +62,10 @@ public void initFromPage(int valueCount, ByteBufferInputStream stream) throws IO
     totalCount = header.getInt();
 
     if (compressionMode != COMPRESSION_MODE_ALP) {
-      throw new ParquetDecodingException(
-          "Unsupported ALP compression mode: " + compressionMode);
+      throw new ParquetDecodingException("Unsupported ALP compression mode: " + compressionMode);
     }
     if (integerEncoding != INTEGER_ENCODING_FOR) {
-      throw new ParquetDecodingException(
-          "Unsupported ALP integer encoding: " + integerEncoding);
+      throw new ParquetDecodingException("Unsupported ALP integer encoding: " + integerEncoding);
     }
 
     vectorSize = 1 << logVectorSize;
@@ -88,8 +85,7 @@ public void initFromPage(int valueCount, ByteBufferInputStream stream) throws IO
     stream.read(rawData);
 
     // Parse offsets from rawData
-    ByteBuffer body = ByteBuffer.wrap(rawData, 0, numVectors * OFFSET_SIZE)
-        .order(ByteOrder.LITTLE_ENDIAN);
+    ByteBuffer body = ByteBuffer.wrap(rawData, 0, numVectors * OFFSET_SIZE).order(ByteOrder.LITTLE_ENDIAN);
     vectorOffsets = new int[numVectors];
     for (int i = 0; i < numVectors; i++) {
       vectorOffsets[i] = body.getInt();
 
@@ -47,16 +47,14 @@ private AlpWrapper() {}
   // ========== Sampling presets ==========
 
   /** Create a sampling-based encoding preset for float data. */
-  public static AlpCompression.AlpEncodingPreset createFloatSamplingPreset(
-      float[] data, int count) {
+  public static AlpCompression.AlpEncodingPreset createFloatSamplingPreset(float[] data, int count) {
     AlpSampler.FloatSampler sampler = new AlpSampler.FloatSampler();
     sampler.addSample(data, count);
     return sampler.finalizeSampling();
   }
 
   /** Create a sampling-based encoding preset for double data. */
-  public static AlpCompression.AlpEncodingPreset createDoubleSamplingPreset(
-      double[] data, int count) {
+  public static AlpCompression.AlpEncodingPreset createDoubleSamplingPreset(double[] data, int count) {
     AlpSampler.DoubleSampler sampler = new AlpSampler.DoubleSampler();
     sampler.addSample(data, count);
     return sampler.finalizeSampling();
@@ -73,12 +71,10 @@ public static AlpCompression.AlpEncodingPreset createDoubleSamplingPreset(
    * @param preset the encoding preset from sampling
    * @return the number of compressed bytes written
    */
-  public static int encodeFloats(
-      float[] input, int count, byte[] output, AlpCompression.AlpEncodingPreset preset) {
+  public static int encodeFloats(float[] input, int count, byte[] output, AlpCompression.AlpEncodingPreset preset) {
     Preconditions.checkArgument(count >= 0, "count must be non-negative, got: %s", count);
     if (count == 0) {
-      writeHeader(output, 0, COMPRESSION_MODE_ALP, INTEGER_ENCODING_FOR,
-          DEFAULT_VECTOR_SIZE_LOG, 0);
+      writeHeader(output, 0, COMPRESSION_MODE_ALP, INTEGER_ENCODING_FOR, DEFAULT_VECTOR_SIZE_LOG, 0);
       return HEADER_SIZE;
     }
 
@@ -101,14 +97,14 @@ public static int encodeFloats(
     int currentOffset = offsetsSectionSize;
     for (int i = 0; i < numVectors; i++) {
       vectorOffsets[i] = currentOffset;
-      currentOffset += ALP_INFO_SIZE + FLOAT_FOR_INFO_SIZE + vectors.get(i).dataStoredSize();
+      currentOffset +=
+          ALP_INFO_SIZE + FLOAT_FOR_INFO_SIZE + vectors.get(i).dataStoredSize();
     }
     int bodySize = currentOffset;
     int totalSize = HEADER_SIZE + bodySize;
 
     // Phase 3: Write header
-    writeHeader(output, 0, COMPRESSION_MODE_ALP, INTEGER_ENCODING_FOR,
-        DEFAULT_VECTOR_SIZE_LOG, count);
+    writeHeader(output, 0, COMPRESSION_MODE_ALP, INTEGER_ENCODING_FOR, DEFAULT_VECTOR_SIZE_LOG, count);
 
     // Phase 4: Write offsets
     ByteBuffer buf = ByteBuffer.wrap(output, HEADER_SIZE, bodySize).order(ByteOrder.LITTLE_ENDIAN);
@@ -128,12 +124,10 @@ public static int encodeFloats(
 
   // ========== Encode doubles ==========
 
-  public static int encodeDoubles(
-      double[] input, int count, byte[] output, AlpCompression.AlpEncodingPreset preset) {
+  public static int encodeDoubles(double[] input, int count, byte[] output, AlpCompression.AlpEncodingPreset preset) {
     Preconditions.checkArgument(count >= 0, "count must be non-negative, got: %s", count);
     if (count == 0) {
-      writeHeader(output, 0, COMPRESSION_MODE_ALP, INTEGER_ENCODING_FOR,
-          DEFAULT_VECTOR_SIZE_LOG, 0);
+      writeHeader(output, 0, COMPRESSION_MODE_ALP, INTEGER_ENCODING_FOR, DEFAULT_VECTOR_SIZE_LOG, 0);
       return HEADER_SIZE;
     }
 
@@ -146,8 +140,7 @@ public static int encodeDoubles(
       int elementsInVector = Math.min(vectorSize, count - offset);
       double[] vectorInput = new double[elementsInVector];
       System.arraycopy(input, offset, vectorInput, 0, elementsInVector);
-      vectors.add(
-          AlpCompression.compressDoubleVector(vectorInput, elementsInVector, preset));
+      vectors.add(AlpCompression.compressDoubleVector(vectorInput, elementsInVector, preset));
     }
 
     int offsetsSectionSize = numVectors * OFFSET_SIZE;
@@ -161,8 +154,7 @@ public static int encodeDoubles(
     int bodySize = currentOffset;
     int totalSize = HEADER_SIZE + bodySize;
 
-    writeHeader(output, 0, COMPRESSION_MODE_ALP, INTEGER_ENCODING_FOR,
-        DEFAULT_VECTOR_SIZE_LOG, count);
+    writeHeader(output, 0, COMPRESSION_MODE_ALP, INTEGER_ENCODING_FOR, DEFAULT_VECTOR_SIZE_LOG, count);
 
     ByteBuffer buf = ByteBuffer.wrap(output, HEADER_SIZE, bodySize).order(ByteOrder.LITTLE_ENDIAN);
     for (int offset : vectorOffsets) {
@@ -188,30 +180,28 @@ public static int encodeDoubles(
    * @param output output float array (must hold numElements values)
    * @param numElements number of elements to decode
    */
-  public static void decodeFloats(
-      byte[] compressed, int compSize, float[] output, int numElements) {
-    Preconditions.checkArgument(compSize >= HEADER_SIZE,
-        "compressed size too small for header: %s", compSize);
+  public static void decodeFloats(byte[] compressed, int compSize, float[] output, int numElements) {
+    Preconditions.checkArgument(compSize >= HEADER_SIZE, "compressed size too small for header: %s", compSize);
 
     ByteBuffer header = ByteBuffer.wrap(compressed, 0, HEADER_SIZE).order(ByteOrder.LITTLE_ENDIAN);
     int compressionMode = header.get() & 0xFF;
     int integerEncoding = header.get() & 0xFF;
     int logVectorSize = header.get() & 0xFF;
     int storedNumElements = header.getInt();
 
-    Preconditions.checkArgument(compressionMode == COMPRESSION_MODE_ALP,
-        "unsupported compression mode: %s", compressionMode);
-    Preconditions.checkArgument(integerEncoding == INTEGER_ENCODING_FOR,
-        "unsupported integer encoding: %s", integerEncoding);
+    Preconditions.checkArgument(
+        compressionMode == COMPRESSION_MODE_ALP, "unsupported compression mode: %s", compressionMode);
+    Preconditions.checkArgument(
+        integerEncoding == INTEGER_ENCODING_FOR, "unsupported integer encoding: %s", integerEncoding);
 
     int vectorSize = 1 << logVectorSize;
     int numVectors = (storedNumElements + vectorSize - 1) / vectorSize;
 
     if (numVectors == 0) return;
 
     // Read offsets
-    ByteBuffer body = ByteBuffer.wrap(compressed, HEADER_SIZE, compSize - HEADER_SIZE)
-        .order(ByteOrder.LITTLE_ENDIAN);
+    ByteBuffer body =
+        ByteBuffer.wrap(compressed, HEADER_SIZE, compSize - HEADER_SIZE).order(ByteOrder.LITTLE_ENDIAN);
     int[] vectorOffsets = new int[numVectors];
     for (int i = 0; i < numVectors; i++) {
       vectorOffsets[i] = body.getInt();
@@ -234,37 +224,35 @@ public static void decodeFloats(
 
       float[] vectorOutput = new float[elementsInVector];
       AlpCompression.decompressFloatVector(cv, vectorOutput);
-      System.arraycopy(vectorOutput, 0, output, outputOffset,
-          Math.min(elementsInVector, numElements - outputOffset));
+      System.arraycopy(
+          vectorOutput, 0, output, outputOffset, Math.min(elementsInVector, numElements - outputOffset));
       outputOffset += elementsInVector;
     }
   }
 
   // ========== Decode doubles ==========
 
-  public static void decodeDoubles(
-      byte[] compressed, int compSize, double[] output, int numElements) {
-    Preconditions.checkArgument(compSize >= HEADER_SIZE,
-        "compressed size too small for header: %s", compSize);
+  public static void decodeDoubles(byte[] compressed, int compSize, double[] output, int numElements) {
+    Preconditions.checkArgument(compSize >= HEADER_SIZE, "compressed size too small for header: %s", compSize);
 
     ByteBuffer header = ByteBuffer.wrap(compressed, 0, HEADER_SIZE).order(ByteOrder.LITTLE_ENDIAN);
     int compressionMode = header.get() & 0xFF;
     int integerEncoding = header.get() & 0xFF;
     int logVectorSize = header.get() & 0xFF;
     int storedNumElements = header.getInt();
 
-    Preconditions.checkArgument(compressionMode == COMPRESSION_MODE_ALP,
-        "unsupported compression mode: %s", compressionMode);
-    Preconditions.checkArgument(integerEncoding == INTEGER_ENCODING_FOR,
-        "unsupported integer encoding: %s", integerEncoding);
+    Preconditions.checkArgument(
+        compressionMode == COMPRESSION_MODE_ALP, "unsupported compression mode: %s", compressionMode);
+    Preconditions.checkArgument(
+        integerEncoding == INTEGER_ENCODING_FOR, "unsupported integer encoding: %s", integerEncoding);
 
     int vectorSize = 1 << logVectorSize;
     int numVectors = (storedNumElements + vectorSize - 1) / vectorSize;
 
     if (numVectors == 0) return;
 
-    ByteBuffer body = ByteBuffer.wrap(compressed, HEADER_SIZE, compSize - HEADER_SIZE)
-        .order(ByteOrder.LITTLE_ENDIAN);
+    ByteBuffer body =
+        ByteBuffer.wrap(compressed, HEADER_SIZE, compSize - HEADER_SIZE).order(ByteOrder.LITTLE_ENDIAN);
     int[] vectorOffsets = new int[numVectors];
     for (int i = 0; i < numVectors; i++) {
       vectorOffsets[i] = body.getInt();
@@ -286,8 +274,8 @@ public static void decodeDoubles(
 
       double[] vectorOutput = new double[elementsInVector];
       AlpCompression.decompressDoubleVector(cv, vectorOutput);
-      System.arraycopy(vectorOutput, 0, output, outputOffset,
-          Math.min(elementsInVector, numElements - outputOffset));
+      System.arraycopy(
+          vectorOutput, 0, output, outputOffset, Math.min(elementsInVector, numElements - outputOffset));
       outputOffset += elementsInVector;
     }
   }
@@ -322,8 +310,7 @@ public static long maxCompressedSizeDouble(int numElements) {
   // ========== Header helpers ==========
 
   private static void writeHeader(
-      byte[] output, int offset, int compressionMode, int integerEncoding,
-      int logVectorSize, int numElements) {
+      byte[] output, int offset, int compressionMode, int integerEncoding, int logVectorSize, int numElements) {
     ByteBuffer buf = ByteBuffer.wrap(output, offset, HEADER_SIZE).order(ByteOrder.LITTLE_ENDIAN);
     buf.put((byte) compressionMode);
     buf.put((byte) integerEncoding);