apache
diff --git a/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpConstants.java b/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpConstants.java
Lines changed: 15 additions & 2 deletions
diff --git a/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpEncoderDecoder.java b/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpEncoderDecoder.java
Lines changed: 40 additions & 44 deletions
diff --git a/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpValuesReader.java b/parquet-column/src/main/java/org/apache/parquet/column/values/alp/AlpValuesReader.java
Lines changed: 1 addition & 5 deletions
@@ -38,10 +38,9 @@ private AlpConstants() {
   }
 
   // Page header fields
-  public static final int ALP_VERSION = 1;
   public static final int ALP_COMPRESSION_MODE = 0;
   public static final int ALP_INTEGER_ENCODING_FOR = 0;
-  public static final int ALP_HEADER_SIZE = 8;
+  public static final int ALP_HEADER_SIZE = 7;
 
   public static final int DEFAULT_VECTOR_SIZE = 1024;
   public static final int DEFAULT_VECTOR_SIZE_LOG = 10;
@@ -67,12 +66,26 @@ private AlpConstants() {
   public static final int FLOAT_FOR_INFO_SIZE = 5; // frame_of_reference(4) + bit_width(1)
   public static final int DOUBLE_FOR_INFO_SIZE = 9; // frame_of_reference(8) + bit_width(1)
 
+  // FLOAT_POW10 / DOUBLE_POW10 (POW10[i] below): positive powers of ten used for scaling up during encode/decode.
+  // Encode: fastRound(value * POW10[e] * POW10_NEGATIVE[f])
+  // Decode: encoded * POW10[f] * POW10_NEGATIVE[e]
   static final float[] FLOAT_POW10 = {1e0f, 1e1f, 1e2f, 1e3f, 1e4f, 1e5f, 1e6f, 1e7f, 1e8f, 1e9f, 1e10f};
 
   static final double[] DOUBLE_POW10 = {
     1e0, 1e1, 1e2, 1e3, 1e4, 1e5, 1e6, 1e7, 1e8, 1e9, 1e10, 1e11, 1e12, 1e13, 1e14, 1e15, 1e16, 1e17, 1e18
   };
 
+  // FLOAT_POW10_NEGATIVE / DOUBLE_POW10_NEGATIVE: reciprocal powers of ten used for scaling down.
+  // Multiplying by these reciprocals instead of dividing ensures C++ wire compatibility.
+  static final float[] FLOAT_POW10_NEGATIVE = {
+    1e0f, 1e-1f, 1e-2f, 1e-3f, 1e-4f, 1e-5f, 1e-6f, 1e-7f, 1e-8f, 1e-9f, 1e-10f
+  };
+
+  static final double[] DOUBLE_POW10_NEGATIVE = {
+    1e0, 1e-1, 1e-2, 1e-3, 1e-4, 1e-5, 1e-6, 1e-7, 1e-8, 1e-9, 1e-10, 1e-11, 1e-12, 1e-13, 1e-14, 1e-15, 1e-16,
+    1e-17, 1e-18
+  };
+
   static final int FLOAT_NEGATIVE_ZERO_BITS = 0x80000000;
   static final long DOUBLE_NEGATIVE_ZERO_BITS = 0x8000000000000000L;
 
 
@@ -27,8 +27,13 @@
  * then applying Frame of Reference encoding and bit-packing.
  * Values that cannot be losslessly converted are stored as exceptions.
  *
- * <p>Encoding formula: encoded = round(value * 10^(exponent - factor))
- * <p>Decoding formula: value = encoded / 10^(exponent - factor)
+ * <p>Encoding formula: encoded = fastRound(value * POW10[e] * POW10_NEGATIVE[f])
+ * <p>Decoding formula: value = encoded * POW10[f] * POW10_NEGATIVE[e]
+ *
+ * <p>The order of operations is critical for IEEE 754 correctness. Both formulas must
+ * be evaluated left to right as written, (x * a) * b: combining the two powers of ten
+ * into a single multiplier before applying it changes IEEE 754 rounding and produces extra
+ * exceptions. Uses multiply-by-reciprocal (via POW10_NEGATIVE) for C++ wire compatibility.
  *
  * <p>Exception conditions:
  * <ul>
@@ -41,26 +46,15 @@
  */
 final class AlpEncoderDecoder {
 
+  private static final double ENCODING_UPPER_LIMIT = 9223372036854774784.0;
+  private static final double ENCODING_LOWER_LIMIT = -9223372036854774784.0;
+  private static final float FLOAT_ENCODING_UPPER_LIMIT = 2147483520.0f;
+  private static final float FLOAT_ENCODING_LOWER_LIMIT = -2147483520.0f;
+
   private AlpEncoderDecoder() {
     // Utility class
   }
 
-  static float getFloatMultiplier(int exponent, int factor) {
-    float multiplier = FLOAT_POW10[exponent];
-    if (factor > 0) {
-      multiplier /= FLOAT_POW10[factor];
-    }
-    return multiplier;
-  }
-
-  static double getDoubleMultiplier(int exponent, int factor) {
-    double multiplier = DOUBLE_POW10[exponent];
-    if (factor > 0) {
-      multiplier /= DOUBLE_POW10[factor];
-    }
-    return multiplier;
-  }
-
   /** NaN, Inf, and -0.0 can never be encoded regardless of exponent/factor. */
   static boolean isFloatException(float value) {
     if (Float.isNaN(value)) {
@@ -77,27 +71,17 @@ static boolean isFloatException(float value, int exponent, int factor) {
     if (isFloatException(value)) {
       return true;
     }
-    float multiplier = getFloatMultiplier(exponent, factor);
-    float scaled = value * multiplier;
-    if (scaled > Integer.MAX_VALUE || scaled < Integer.MIN_VALUE) {
+    // Check before rounding: overflow or non-finite after scaling
+    float scaled = value * FLOAT_POW10[exponent] * FLOAT_POW10_NEGATIVE[factor];
+    if (!Float.isFinite(scaled) || scaled > FLOAT_ENCODING_UPPER_LIMIT || scaled < FLOAT_ENCODING_LOWER_LIMIT) {
       return true;
     }
     int encoded = encodeFloat(value, exponent, factor);
     float decoded = decodeFloat(encoded, exponent, factor);
     return Float.floatToRawIntBits(value) != Float.floatToRawIntBits(decoded);
   }
 
-  /** Encode: round(value * 10^exponent / 10^factor) */
-  static int encodeFloat(float value, int exponent, int factor) {
-    return fastRoundFloat(value * getFloatMultiplier(exponent, factor));
-  }
-
-  /** Decode: encoded / 10^exponent * 10^factor */
-  static float decodeFloat(int encoded, int exponent, int factor) {
-    return encoded / getFloatMultiplier(exponent, factor);
-  }
-
-  // Uses the 2^22+2^23 magic-number trick to round without branching on the FPU.
+  /** Round float to nearest integer using magic-number trick with sign branching. */
   static int fastRoundFloat(float value) {
     if (value >= 0) {
       return (int) ((value + MAGIC_FLOAT) - MAGIC_FLOAT);
@@ -106,6 +90,16 @@ static int fastRoundFloat(float value) {
     }
   }
 
+  /** Encode: fastRound(value * POW10[e] * POW10_NEGATIVE[f]) — single expression. */
+  static int encodeFloat(float value, int exponent, int factor) {
+    return fastRoundFloat(value * FLOAT_POW10[exponent] * FLOAT_POW10_NEGATIVE[factor]);
+  }
+
+  /** Decode: encoded * POW10[f] * POW10_NEGATIVE[e] — single expression. */
+  static float decodeFloat(int encoded, int exponent, int factor) {
+    return encoded * FLOAT_POW10[factor] * FLOAT_POW10_NEGATIVE[exponent];
+  }
+
   static boolean isDoubleException(double value) {
     if (Double.isNaN(value)) {
       return true;
@@ -120,25 +114,17 @@ static boolean isDoubleException(double value, int exponent, int factor) {
     if (isDoubleException(value)) {
       return true;
     }
-    double multiplier = getDoubleMultiplier(exponent, factor);
-    double scaled = value * multiplier;
-    if (scaled > Long.MAX_VALUE || scaled < Long.MIN_VALUE) {
+    // Check before rounding: overflow or non-finite after scaling
+    double scaled = value * DOUBLE_POW10[exponent] * DOUBLE_POW10_NEGATIVE[factor];
+    if (!Double.isFinite(scaled) || scaled > ENCODING_UPPER_LIMIT || scaled < ENCODING_LOWER_LIMIT) {
       return true;
     }
     long encoded = encodeDouble(value, exponent, factor);
     double decoded = decodeDouble(encoded, exponent, factor);
     return Double.doubleToRawLongBits(value) != Double.doubleToRawLongBits(decoded);
   }
 
-  static long encodeDouble(double value, int exponent, int factor) {
-    return fastRoundDouble(value * getDoubleMultiplier(exponent, factor));
-  }
-
-  static double decodeDouble(long encoded, int exponent, int factor) {
-    return encoded / getDoubleMultiplier(exponent, factor);
-  }
-
-  // Same trick but with 2^51+2^52 for double precision.
+  /** Round double to nearest integer using magic-number trick with sign branching. */
   static long fastRoundDouble(double value) {
     if (value >= 0) {
       return (long) ((value + MAGIC_DOUBLE) - MAGIC_DOUBLE);
@@ -147,6 +133,16 @@ static long fastRoundDouble(double value) {
     }
   }
 
+  /** Encode: fastRound(value * POW10[e] * POW10_NEGATIVE[f]) — single expression. */
+  static long encodeDouble(double value, int exponent, int factor) {
+    return fastRoundDouble(value * DOUBLE_POW10[exponent] * DOUBLE_POW10_NEGATIVE[factor]);
+  }
+
+  /** Decode: encoded * POW10[f] * POW10_NEGATIVE[e] — single expression. */
+  static double decodeDouble(long encoded, int exponent, int factor) {
+    return encoded * DOUBLE_POW10[factor] * DOUBLE_POW10_NEGATIVE[exponent];
+  }
+
   /** Number of bits needed to represent maxDelta as an unsigned value. */
   static int bitWidthForInt(int maxDelta) {
     if (maxDelta == 0) {
 
@@ -34,7 +34,7 @@
  * <pre>
  * ┌─────────┬──────────────────────┬──────────────┬──────────────┬─────┐
  * │ Header  │ Offset Array         │ Vector 0     │ Vector 1     │ ... │
- * │ 8 bytes │ 4B &times; numVectors │ (interleaved)│ (interleaved)│     │
+ * │ 7 bytes │ 4B &times; numVectors │ (interleaved)│ (interleaved)│     │
  * └─────────┴──────────────────────┴──────────────┴──────────────┴─────┘
  * </pre>
  *
@@ -63,15 +63,11 @@ abstract class AlpValuesReader extends ValuesReader {
   public void initFromPage(int valuesCount, ByteBufferInputStream stream)
       throws ParquetDecodingException, IOException {
     ByteBuffer headerBuf = stream.slice(ALP_HEADER_SIZE).order(ByteOrder.LITTLE_ENDIAN);
-    int version = headerBuf.get() & 0xFF;
     int compressionMode = headerBuf.get() & 0xFF;
     int integerEncoding = headerBuf.get() & 0xFF;
     int logVectorSize = headerBuf.get() & 0xFF;
     int numElements = headerBuf.getInt();
 
-    if (version != ALP_VERSION) {
-      throw new ParquetDecodingException("Unsupported ALP version: " + version + ", expected " + ALP_VERSION);
-    }
     if (compressionMode != ALP_COMPRESSION_MODE) {
       throw new ParquetDecodingException("Unsupported ALP compression mode: " + compressionMode);
     }