add test divUnit

author: MITSUNARI Shigeo <herumi@nifty.com> 2017-08-03 13:00:16 +0800
committer: MITSUNARI Shigeo <herumi@nifty.com> 2017-08-03 13:00:16 +0800
commit: a6171527f8d35c1eefbebcffd33d9255a179db44 (patch)
tree: 90c85482f540992494f54fc277f8117aff17ab08
parent: 57e8185b2946d389be7ea46d33288cfccb2f854d (diff)
download: dexon-mcl-a6171527f8d35c1eefbebcffd33d9255a179db44.tar.gz
dexon-mcl-a6171527f8d35c1eefbebcffd33d9255a179db44.tar.zst
dexon-mcl-a6171527f8d35c1eefbebcffd33d9255a179db44.zip
2 files changed, 75 insertions, 117 deletions
diff --git a/include/mcl/vint.hpp b/include/mcl/vint.hpp
index f9163b6..ea7eae4 100644
--- a/include/mcl/vint.hpp
+++ b/include/mcl/vint.hpp
@@ -120,27 +120,6 @@ inline uint64_t mulUnit(uint64_t *pH, uint64_t x, uint64_t y)
 #endif
 
 template<class T>
-size_t getRealSize(const T *x, size_t xn)
-{
-	int i = (int)xn - 1;
-	for (; i > 0; i--) {
-		if (x[i]) {
-			return i + 1;
-		}
-	}
-	return 1;
-}
-
-template<class T>
-size_t getBitSize(const T *x, size_t n)
-{
-	if (n == 1 && x[0] == 0) return 1;
-	T v = x[n - 1];
-	assert(v);
-	return (n - 1) * sizeof(T) * 8 + 1 + cybozu::bsr<Unit>(v);
-}
-
-template<class T>
 void divNM(T *q, size_t qn, T *r, const T *x, size_t xn, const T *y, size_t yn);
 
 /*
@@ -161,7 +140,6 @@ inline uint64_t divUnit(uint64_t *pr, uint64_t H, uint64_t L, uint64_t y)
 #if defined(MCL_VINT_64BIT_PORTABLE)
 	uint32_t px[4] = { uint32_t(L), uint32_t(L >> 32), uint32_t(H), uint32_t(H >> 32) };
 	uint32_t py[2] = { uint32_t(y), uint32_t(y >> 32) };
-#if 1
 	size_t xn = 4;
 	size_t yn = 2;
 	uint32_t q[4];
@@ -170,25 +148,6 @@ inline uint64_t divUnit(uint64_t *pr, uint64_t H, uint64_t L, uint64_t y)
 	divNM(q, qn, r, px, xn, py, yn);
 	*pr = make64(r[1], r[0]);
 	return make64(q[1], q[0]);
-#else
-	size_t xn = getRealSize(px, 4);
-	size_t yn = getRealSize(py, 2);
-	if (yn > xn) {
-		*pr = L;
-		return 0;
-	}
-	if (xn == yn) {
-		*pr = L % y;
-		return L / y;
-	}
-	assert(xn > yn);
-	uint32_t q[4];
-	uint32_t r[2];
-	size_t qn = xn - yn + 1;
-	divNM(q, qn, r, px, xn, py, yn);
-	*pr = (yn == 1) ? r[0] : make64(r[1], r[0]);
-	return (qn == 1) ? q[0] : make64(q[1], q[0]);
-#endif
 #elif defined(_MSC_VER)
 	#error "divUnit for uint64_t is not supported"
 #else
@@ -634,6 +593,7 @@ void shrN(T *y, const T *x, size_t xn, size_t bit)
 	const size_t unitBitSize = sizeof(T) * 8;
 	size_t q = bit / unitBitSize;
 	size_t r = bit % unitBitSize;
+	assert(xn >= q);
 	if (r == 0) {
 		copyN(y, x + q, xn - q);
 	} else {
@@ -641,50 +601,25 @@ void shrN(T *y, const T *x, size_t xn, size_t bit)
 	}
 }
 
-
-/*
-	get approximate value from x[xn - 1..]
-	@param up [in] round up if true
-*/
 template<class T>
-static inline double getApprox(const T *x, size_t xn, bool up)
+size_t getRealSize(const T *x, size_t xn)
 {
-	union di {
-		double f;
-		uint64_t i;
-	};
-	assert(xn >= 2);
-	T H = x[xn - 1];
-	assert(H);
-	union di di;
-	di.f = (double)H;
-	unsigned int len = int(di.i >> 52) - 1023 + 1;
-#if MCL_SIZEOF_UNIT == 4
-	uint32_t M = x[xn - 2];
-	if (len >= 21) {
-		di.i |= M >> (len - 21);
-	} else {
-		di.i |= uint64_t(M) << (21 - len);
-		if (xn >= 3) {
-			uint32_t L = x[xn - 3];
-			di.i |= L >> (len + 11);
+	int i = (int)xn - 1;
+	for (; i > 0; i--) {
+		if (x[i]) {
+			return i + 1;
 		}
 	}
-#else
-	if (len < 53) {
-		uint64_t L = x[xn - 2];
-		di.i |= L >> (len + 11);
-	} else {
-		// avoid rounding in converting from uint64_t to double
-		di.f = (double)(H & ~((uint64_t(1) << (len - 53)) - 1));
-	}
-#endif
-	double t = di.f;
-	if (up) {
-		di.i = uint64_t(len + 1022 - 52 + 1) << 52;
-		t += di.f;
-	}
-	return t;
+	return 1;
+}
+
+template<class T>
+size_t getBitSize(const T *x, size_t n)
+{
+	if (n == 1 && x[0] == 0) return 1;
+	T v = x[n - 1];
+	assert(v);
+	return (n - 1) * sizeof(T) * 8 + 1 + cybozu::bsr<Unit>(v);
 }
 
 /*
@@ -733,16 +668,15 @@ void divNM(T *q, size_t qn, T *r, const T *x, size_t xn, const T *y, size_t yn)
 		}
 		return;
 	}
-	T *qq = q;
+	T *qOrg = q;
 	if (q) {
 		if (q == x || q == y) {
-			qq = (T*)CYBOZU_ALLOCA(sizeof(T) * qn);
+			q = (T*)CYBOZU_ALLOCA(sizeof(T) * qn);
 		}
-		clearN(qq, qn);
+		clearN(q, qn);
 	}
 	T *rr = (T*)CYBOZU_ALLOCA(sizeof(T) * xn);
 	copyN(rr, x, xn);
-#if 1
 	T *t = (T*)CYBOZU_ALLOCA(sizeof(T) * (xn + 2));
 	size_t yb = getBitSize(y, yn);
 	const size_t unitBitSize = sizeof(T) * 8;
@@ -751,7 +685,7 @@ void divNM(T *q, size_t qn, T *r, const T *x, size_t xn, const T *y, size_t yn)
 		if (xb <= yb + 1) {
 			vint::subNM(rr, rr, xn, y, yn);
 			xn = getRealSize(rr, xn);
-			if (qq) vint::addu1<T>(qq, qq, qn, 1);
+			if (q) vint::addu1<T>(q, q, qn, 1);
 			continue;
 		}
 		assert(xb > yb + 1);
@@ -766,36 +700,12 @@ void divNM(T *q, size_t qn, T *r, const T *x, size_t xn, const T *y, size_t yn)
 			clearN(t, qn);
 			t[0] = q0;
 			vint::shlN(t, t, 1, xb - w - yb);
-			vint::addN(qq, qq, t, qn);
+			vint::addN(q, q, t, qn);
 		}
 	}
-#else
-	T *t = (T*)CYBOZU_ALLOCA(sizeof(T) * (yn + 1));
-	double yt = getApprox(y, yn, true);
-	while (vint::compareNM(rr, xn, y, yn) >= 0) {
-		size_t len = yn;
-		double xt = getApprox(rr, xn, false);
-		if (vint::compareNM(&rr[xn - len], yn, y, yn) < 0) {
-			xt *= double(1ULL << (sizeof(T) * 8 - 1)) * 2;
-			len++;
-		}
-		T qt = T(xt / yt);
-		if (qt == 0) qt = 1;
-		t[yn] = vint::mulu1(&t[0], y, yn, qt);
-		T b = vint::subN(&rr[xn - len], &rr[xn - len], &t[0], len);
-		if (b) {
-			assert(!b);
-		}
-		if (qq) qq[xn - len] += qt;
-
-		while (xn >= yn && rr[xn - 1] == 0) {
-			xn--;
-		}
-	}
-#endif
 	copyN(r, rr, rn);
-	if (q && q != qq) {
-		copyN(q, qq, qn);
+	if (q && q != qOrg) {
+		copyN(qOrg, q, qn);
 	}
 }
 
diff --git a/test/vint_test.cpp b/test/vint_test.cpp
index d992bf8..198987d 100644
--- a/test/vint_test.cpp
+++ b/test/vint_test.cpp
@@ -3,10 +3,6 @@
 #include <iostream>
 #include <sstream>
 #include <set>
-#ifndef _MSC_VER
-#define CYBOZU_BENCH_DONT_USE_RDTSC
-#define CYBOZU_BENCH_USE_GETTIMEOFDAY
-#endif
 #include <cybozu/benchmark.hpp>
 #include <cybozu/test.hpp>
 
@@ -1126,3 +1122,55 @@ CYBOZU_TEST_AUTO(bench)
 	CYBOZU_BENCH_C("mul", N, Vint::mul, z, x, y);
 	CYBOZU_BENCH_C("div", N, Vint::div, y, z, x);
 }
+
+struct Seq {
+	const uint32_t *tbl;
+	size_t n;
+	size_t i, j;
+	Seq(const uint32_t *tbl, size_t n) : tbl(tbl), n(n), i(0), j(0) {}
+	bool next(uint64_t *v)
+	{
+		if (i == n) {
+			if (j == n - 1) return false;
+			i = 0;
+			j++;
+		}
+		*v = (uint64_t(tbl[j]) << 32) | tbl[i];
+		i++;
+		return true;
+	}
+};
+
+CYBOZU_TEST_AUTO(divUnit)
+{
+	const uint32_t tbl[] = {
+		0, 1, 3,
+		0x7fffffff,
+		0x80000000,
+		0x80000001,
+		0xffffffff,
+	};
+	const size_t n = sizeof(tbl) / sizeof(tbl[0]);
+	Seq seq3(tbl, n);
+	uint64_t y;
+	while (seq3.next(&y)) {
+		if (y == 0) continue;
+		Seq seq2(tbl, n);
+		uint64_t r;
+		while (seq2.next(&r)) {
+			if (r >= y) break;
+			Seq seq1(tbl, n);
+			uint64_t q;
+			while (seq1.next(&q)) {
+				uint64_t x[2];
+				x[0] = mcl::vint::mulUnit(&x[1], q, y);
+				mcl::vint::addu1(x, x, 2, r);
+				uint64_t Q, R;
+//printf("q=0x%016llxull, r=0x%016llxull, y=0x%016llxull\n", (long long)q, (long long)r, (long long)y);
+				Q = mcl::vint::divUnit(&R, x[1], x[0], y);
+				CYBOZU_TEST_EQUAL(q, Q);
+				CYBOZU_TEST_EQUAL(r, R);
+			}
+		}
+	}
+}
author	MITSUNARI Shigeo <herumi@nifty.com>	2017-08-03 13:00:16 +0800
committer	MITSUNARI Shigeo <herumi@nifty.com>	2017-08-03 13:00:16 +0800
commit	a6171527f8d35c1eefbebcffd33d9255a179db44 (patch)
tree	90c85482f540992494f54fc277f8117aff17ab08
parent	57e8185b2946d389be7ea46d33288cfccb2f854d (diff)
download	dexon-mcl-a6171527f8d35c1eefbebcffd33d9255a179db44.tar.gz dexon-mcl-a6171527f8d35c1eefbebcffd33d9255a179db44.tar.zst dexon-mcl-a6171527f8d35c1eefbebcffd33d9255a179db44.zip