some refactoring +++ fix and test 128 bit subtraction

TilmanNeumann · TilmanNeumann · commit 89aff196b4b2 · 2026-04-11T17:02:31.000+02:00
diff --git a/src/main/java/de/tilman_neumann/jml/base/Uint128.java b/src/main/java/de/tilman_neumann/jml/base/Uint128.java
@@ -21,10 +21,10 @@
 import de.tilman_neumann.util.Ensure;
 
 /**
- * An incomplete 128 bit unsigned int implementation.
+ * An incomplete 128 bit integer implementation.
  * 
- * Implementation notes:
- * * a+Long.MIN_VALUE <> b+Long-MIN_VALUE is an inlined compareUnsigned(a, b) <> 0.
+ * Implementation note:
+ * r_lo+Long.MIN_VALUE < low+Long.MIN_VALUE is an inlined compareUnsigned(r_lo, low) < 0.
  * 
  * @author Tilman Neumann
  */
@@ -51,64 +51,88 @@ public long getLow() {
 	}
 
 	/**
-	 * Add two unsigned 128 bit integers.
-	 * @param other
-	 * @return this + other
+	 * Add two 128 bit integers.
+	 * @param b
+	 * @return this + b
 	 */
-	public Uint128 add_v1(Uint128 other) {
-		// We know for sure that low overflows if both low and o_lo are 64 bit. If only one of the input 'low's
-		// is 64 bit, then we can recognize an overflow if the result.lo is not 64 bit.
-		final long o_lo = other.getLow();
-		final long o_hi = other.getHigh();
-		final long r_lo = low + o_lo;
-		long r_hi = high + o_hi;
-		if ((low<0 && o_lo<0) || ((low<0 || o_lo<0) && (r_lo >= 0))) r_hi++;
+	public Uint128 add_v1(Uint128 b) {
+		// The sum of the low words certainly carries if both low and b_lo have their top bit (bit 63) set. If only one
+		// of them has its top bit set, then a carry occurred exactly if the top bit of r_lo is clear (r_lo >= 0).
+		final long b_lo = b.getLow();
+		final long b_hi = b.getHigh();
+		final long r_lo = low + b_lo;
+		long r_hi = high + b_hi;
+		if ((low<0 && b_lo<0) || ((low<0 || b_lo<0) && (r_lo >= 0))) r_hi++;
 		return new Uint128(r_hi, r_lo);
 	}
 
 	/**
-	 * Add two unsigned 128 bit integers.
+	 * Add two 128 bit integers.
 	 * 
-	 * Simpler carry recognition and thus much faster than the first version,
-	 * thanks to Ben, see https://www.mersenneforum.org/showpost.php?p=524300&postcount=173.
+	 * Simpler carry recognition thanks to Ben Buhrow,
+	 * see https://www.mersenneforum.org/showpost.php?p=524300&postcount=173.
 	 * 
-	 * @param other
-	 * @return this + other
+	 * @param b
+	 * @return this + b
 	 */
-	public Uint128 add/*_v2*/(Uint128 other) {
-		long a = low + other.getLow();
-		long b = high + other.getHigh();
-		if (a+Long.MIN_VALUE < low+Long.MIN_VALUE) b++;
-		return new Uint128(b, a);
+	public Uint128 add/*_v2*/(Uint128 b) {
+		long r_lo = low + b.getLow();
+		long r_hi = high + b.getHigh();
+		if (r_lo+Long.MIN_VALUE < low+Long.MIN_VALUE) r_hi++;
+		return new Uint128(r_hi, r_lo);
 	}
 
 	/**
-	 * Compute the sum of this and other, return the high part.
-	 * @param other
-	 * @return high part of this + other
+	 * Add two 128 bit integers, AI-generated version.
+	 * 
+	 * @param b
+	 * @return this + b
 	 */
-	public long add_getHigh(Uint128 other) {
-		long a = low + other.getLow();
-		long b = high + other.getHigh();
-		return (a+Long.MIN_VALUE < low+Long.MIN_VALUE) ? b + 1 : b;
+	public Uint128 add_v3(Uint128 b) {
+	    long r_lo = low + b.getLow();
+	    long carry = Long.compareUnsigned(r_lo, low) < 0 ? 1 : 0;
+	    long r_hi = high + b.getHigh() + carry;
+		return new Uint128(r_hi, r_lo);
+	}
+	
+	/**
+	 * Add two 128 bit integers, return the high part.
+	 * @param b
+	 * @return high part of this + b
+	 */
+	public long add_getHigh(Uint128 b) {
+		long r_lo = low + b.getLow();
+		long r_hi = high + b.getHigh();
+		return r_lo+Long.MIN_VALUE < low+Long.MIN_VALUE ? r_hi + 1 : r_hi;
 	}
 
 	/**
-	 * Subtract two unsigned 128 bit integers.
+	 * Subtract two 128 bit integers.
 	 * 
-	 * @param other
-	 * @return this - other
+	 * @param b
+	 * @return this - b, may be negative
 	 */
-	// XXX experimental, probably wrong...
-	public Uint128 subtract(Uint128 other) {
-		long r_lo = low - other.getLow();
-		long r_hi = high - other.getHigh();
-        // check for underflow of low 64 bits, subtract carry to high
-        if (Long.compareUnsigned(r_lo, low) > 0) {
-            --r_hi;
-        }
+	public Uint128 subtract(Uint128 b) {
+    	long b_lo = b.getLow();
+		long r_lo = low - b_lo;
+		long r_hi = high - b.getHigh();
+        if (Long.compareUnsigned(low, b_lo) < 0) --r_hi;
         return new Uint128(r_hi, r_lo);
 	}
+	
+	/**
+	 * Subtract two 128 bit integers. AI-generated version.
+	 * 
+	 * @param b
+	 * @return this - b, may be negative
+	 */
+    public Uint128 subtract_v2(Uint128 b) {
+    	long b_lo = b.getLow();
+        long r_lo = low - b_lo;
+        long borrow = Long.compareUnsigned(low, b_lo) < 0 ? 1 : 0;
+        long r_hi = high - b.getHigh() - borrow;
+		return new Uint128(r_hi, r_lo);
+    }
 
 	/**
 	 * Multiplication of unsigned 63 bit integers,
@@ -547,17 +571,48 @@ public long and(long other) {
 	public double doubleValue() {
 		return toBigInteger().doubleValue(); // TODO more efficient solution
 	}
+
+	public double doubleValueUnsigned() {
+		return toBigIntegerUnsigned().doubleValue(); // TODO more efficient solution
+	}
 	
 	/**
-	 * Convert this to BigInteger.
-	 * @return this unsigned 128 bit integer converted to BigInteger
+	 * Signed conversion to BigInteger.
+	 * @return this as a signed (two's complement) 128 bit integer, i.e. sign bit plus 127 value bits, converted to BigInteger
 	 */
 	public BigInteger toBigInteger() {
-		return new BigInteger(Long.toBinaryString(high), 2).shiftLeft(64).add(new BigInteger(Long.toBinaryString(low), 2));
+		return BigInteger.valueOf(high).shiftLeft(64).or(toBigIntegerUnsigned(low));
+	}
+
+	/**
+	 * Unsigned conversion to BigInteger.
+	 * @return this as an unsigned 128 bit integer converted to BigInteger
+	 */
+	public BigInteger toBigIntegerUnsigned() {
+		return toBigIntegerUnsigned(high).shiftLeft(64).or(toBigIntegerUnsigned(low));
+	}
+
+	// helper method
+	private static BigInteger toBigIntegerUnsigned(long n) {
+		BigInteger big = BigInteger.valueOf(n & Long.MAX_VALUE); // drop sign bit
+	    if (n < 0) {
+	    	big = big.setBit(63); // now big is unsigned 64 bit
+	    }
+	    return big;
 	}
 	
+	/**
+	 * @return a string representing this as a signed integer
+	 */
 	@Override
 	public String toString() {
-		return toBigInteger().toString();
+		return toBigInteger().toString(); // TODO more efficient solution
+	}
+	
+	/**
+	 * @return a string representing this as an unsigned integer
+	 */
+	public String toStringUnsigned() {
+		return toBigIntegerUnsigned().toString(); // TODO more efficient solution
 	}
 }
diff --git a/src/test/java/de/tilman_neumann/jml/base/Uint128PerformanceTest.java b/src/test/java/de/tilman_neumann/jml/base/Uint128PerformanceTest.java
@@ -26,9 +26,10 @@ public class Uint128PerformanceTest {
 	private static final Random RNG = new Random();
 
 	private static void testPerformance() {
-		// Performance tests are carried out in double loops over the same numbers.
+		// Performance tests of 2-argument methods are carried out in double loops over the same numbers.
 		// Otherwise number creation is much more expensive than testing the operations themselves.
 		int NCOUNT = 300000;
+		int NCOUNT_MUL = 40000;
 		int NCOUNT_DIV = 20000;
 		
 		// set up test numbers
@@ -42,15 +43,31 @@ private static void testPerformance() {
 			a128_arr[i] = new Uint128(a_arr[i], b_arr[i]);
 		}
 		
-		// test performance of add implementations
+		// test performance of conversion
 		
 		long t0 = System.currentTimeMillis();
+		for (int i=0; i<NCOUNT; i++) {
+			a128_arr[i].toBigInteger();
+		}
+		long t1 = System.currentTimeMillis();
+		LOG.info("toBigInteger took " + (t1-t0) + "ms");
+
+		t0 = System.currentTimeMillis();
+		for (int i=0; i<NCOUNT; i++) {
+			a128_arr[i].toBigIntegerUnsigned();
+		}
+		t1 = System.currentTimeMillis();
+		LOG.info("toBigIntegerUnsigned took " + (t1-t0) + "ms");
+
+		// test performance of add implementations
+		
+		t0 = System.currentTimeMillis();
 		for (int i=0; i<NCOUNT; i++) {
 			for (int j=0; j<NCOUNT; j++) {
 				a128_arr[i].add_v1(a128_arr[j]);
 			}
 		}
-		long t1 = System.currentTimeMillis();
+		t1 = System.currentTimeMillis();
 		LOG.info("add_v1 took " + (t1-t0) + "ms");
 
 		t0 = System.currentTimeMillis();
@@ -61,45 +78,97 @@ private static void testPerformance() {
 		}
 		t1 = System.currentTimeMillis();
 		LOG.info("add_v2 took " + (t1-t0) + "ms");
-		
-		// test performance of mul64 implementations
-		
+
 		t0 = System.currentTimeMillis();
 		for (int i=0; i<NCOUNT; i++) {
 			for (int j=0; j<NCOUNT; j++) {
-				Uint128.mul64_v1(a_arr[i], a_arr[j]);
+				a128_arr[i].add_v3(a128_arr[j]);
 			}
 		}
 		t1 = System.currentTimeMillis();
-		LOG.info("mul64_v1 took " + (t1-t0) + "ms");
-		
+		LOG.info("add_v3 took " + (t1-t0) + "ms");
+
 		t0 = System.currentTimeMillis();
 		for (int i=0; i<NCOUNT; i++) {
 			for (int j=0; j<NCOUNT; j++) {
-				Uint128.mul64/*_v2*/(a_arr[i], a_arr[j]);
+				a128_arr[i].subtract(a128_arr[j]);
 			}
 		}
 		t1 = System.currentTimeMillis();
-		LOG.info("mul64_v2 took " + (t1-t0) + "ms");
-		
+		LOG.info("subtract took " + (t1-t0) + "ms");
+
 		t0 = System.currentTimeMillis();
 		for (int i=0; i<NCOUNT; i++) {
 			for (int j=0; j<NCOUNT; j++) {
-				Uint128.mul64_v3(a_arr[i], a_arr[j]);
+				a128_arr[i].subtract_v2(a128_arr[j]);
+			}
+		}
+		t1 = System.currentTimeMillis();
+		LOG.info("subtract_v2 took " + (t1-t0) + "ms");
+
+		// Test performance of mul64 implementations:
+		// Here we need to do something with the results to avoid the compiler optimizing the tests to nothing
+		
+		long r = 0;
+		t0 = System.currentTimeMillis();
+		for (int i=0; i<NCOUNT_MUL; i++) {
+			for (int j=0; j<NCOUNT_MUL; j++) {
+				Uint128 result = Uint128.mul63(a_arr[i], a_arr[j]);
+				r += result.getHigh() + result.getLow();
+			}
+		}
+		t1 = System.currentTimeMillis();
+		LOG.info("mul63 took " + (t1-t0) + "ms");
+		LOG.trace("r = " + r);
+
+		r = 0;
+		t0 = System.currentTimeMillis();
+		for (int i=0; i<NCOUNT_MUL; i++) {
+			for (int j=0; j<NCOUNT_MUL; j++) {
+				Uint128 result = Uint128.mul64_v1(a_arr[i], a_arr[j]);
+				r += result.getHigh() + result.getLow();
+			}
+		}
+		t1 = System.currentTimeMillis();
+		LOG.info("mul64_v1 took " + (t1-t0) + "ms");
+		LOG.trace("r = " + r);
+		
+		r = 0;
+		t0 = System.currentTimeMillis();
+		for (int i=0; i<NCOUNT_MUL; i++) {
+			for (int j=0; j<NCOUNT_MUL; j++) {
+				Uint128 result = Uint128.mul64/*_v2*/(a_arr[i], a_arr[j]);
+				r += result.getHigh() + result.getLow();
+			}
+		}
+		t1 = System.currentTimeMillis();
+		LOG.info("mul64_v2 took " + (t1-t0) + "ms");
+		LOG.trace("r = " + r);
+
+		r = 0;
+		t0 = System.currentTimeMillis();
+		for (int i=0; i<NCOUNT_MUL; i++) {
+			for (int j=0; j<NCOUNT_MUL; j++) {
+				Uint128 result = Uint128.mul64_v3(a_arr[i], a_arr[j]);
+				r += result.getHigh() + result.getLow();
 			}
 		}
 		t1 = System.currentTimeMillis();
 		LOG.info("mul64_v3 took " + (t1-t0) + "ms");
+		LOG.trace("r = " + r);
 
+		r = 0;
 		t0 = System.currentTimeMillis();
-		for (int i=0; i<NCOUNT; i++) {
-			for (int j=0; j<NCOUNT; j++) {
-				Uint128.mul64_MH(a_arr[i], a_arr[j]);
+		for (int i=0; i<NCOUNT_MUL; i++) {
+			for (int j=0; j<NCOUNT_MUL; j++) {
+				Uint128 result = Uint128.mul64_MH(a_arr[i], a_arr[j]);
+				r += result.getHigh() + result.getLow();
 			}
 		}
 		t1 = System.currentTimeMillis();
 		LOG.info("mul64_MH took " + (t1-t0) + "ms");
-		
+		LOG.trace("r = " + r);
+
 		// test performance of 128 / 64 bit division and modulus
 		
 		t0 = System.currentTimeMillis();
diff --git a/src/test/java/de/tilman_neumann/jml/base/Uint128Test.java b/src/test/java/de/tilman_neumann/jml/base/Uint128Test.java